diff --git a/docs/CREATING_CM.md b/docs/CREATING_CM.md
new file mode 100644
index 00000000..2b81beba
--- /dev/null
+++ b/docs/CREATING_CM.md
@@ -0,0 +1,65 @@
+# CREATING CM directories
+
+**BY FAR THE SAFEST WAY IS TO USE QUICKSCRAPE**
+
+Any other method is likely to lead to files out of sync unless you are careful with what you are doing.
+However, it can sometimes be useful to create CMDirs from single files.
+This documentation may not have been thoroughly checked.
+
+## Input
+
+For a command: 
+
+``` norma -i foo/bar/a12345.suffix -o plugh/xyzzy```
+
+the system will create a CMDir of the form:
+
+``` plugh/xyzzy/a12345```
+
+It will then use ```suffix``` to create either reserved files (e.g. ```fulltext.xml```) in the CMDir or reserved subdirectories
+of the form:
+
+``` plugh/xyzzy/a12345/image```
+
+to hold the images. As there can be several images (e.g.  ```plugh/xyzzy/a12345.png``` ) we use the given names, such as:
+
+``` plugh/xyzzy/a12345/image/a12345.png```
+
+This is verbose and also leads to a separate CMDir for each image.
+
+## File types
+
+The following suffixes are supported:
+
+### Single reserved files
+
+The CMDir is generated from the ```-o mydir``` parameter and the base name of the input file (```FilenameUtils.getBaseName()```).
+
+```mydir/bar``` is the CMDir.
+
+- ```foo/bar.xml``` is copied to ```mydir/bar/fulltext.xml```
+- ```foo/bar.html``` is copied to ```mydir/bar/fulltext.html```
+- ```foo/bar.pdf``` is copied to ```mydir/bar/fulltext.pdf```
+- ```foo/bar.epub``` is copied to ```mydir/bar/fulltext.epub```
+- ```foo/bar.txt``` is copied to ```mydir/bar/fulltext.txt```
+
+### Image files
+
+```foo/bar.png``` is copied to ```mydir/bar/image/bar.png```
+
+Analogous copies for:
+ ```gif```, ```jpg```, ```tif```
+ 
+### Supplemental Data files
+
+```foo/bar.doc``` is copied to ```mydir/bar/supplement/bar.doc```
+
+Analogous copies for:
+ ```docx```, ```csv```, ```tex```, ```ppt```, ```pptx```, ...
+ 
+### SVG Data files
+
+```foo/bar.svg``` is copied to ```mydir/bar/svg/bar.svg```
+
+ 
+ 
\ No newline at end of file
diff --git a/examples/hocr-tesseract-ijsem-140.zip b/examples/hocr-tesseract-ijsem-140.zip
new file mode 100644
index 00000000..cce1b2a2
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140.zip differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000026-0-000.pbm2.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000026-0-000.pbm2.png
new file mode 100644
index 00000000..35d9f3ef
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000026-0-000.pbm2.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000026-0-000.pbm2.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000026-0-000.pbm2.png.hocr
new file mode 100644
index 00000000..b4b1c774
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000026-0-000.pbm2.png.hocr
@@ -0,0 +1,736 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000026-0-000.pbm2.png"; bbox 0 0 1716 1245; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 141 1063 178 1081">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 141 1063 178 1081">
+     <span class='ocr_line' id='line_1_1' title="bbox 141 1063 178 1081; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 141 1063 178 1081; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 260 206 305 224">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 260 206 305 224">
+     <span class='ocr_line' id='line_1_2' title="bbox 260 206 305 224; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 260 206 305 224; x_wconf 78' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 267 953 292 971">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 267 953 292 971">
+     <span class='ocr_line' id='line_1_3' title="bbox 267 953 292 971; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 267 953 292 971; x_wconf 84' lang='eng'><em>67</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 382 871 403 888">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 382 871 403 888">
+     <span class='ocr_line' id='line_1_4' title="bbox 382 871 403 888; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 382 871 403 888; x_wconf 85' lang='eng'>81</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 544 458 565 475">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 544 458 565 475">
+     <span class='ocr_line' id='line_1_5' title="bbox 544 458 565 475; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 544 458 565 475; x_wconf 90' lang='eng'><em>71</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 804 0 1461 28">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 804 0 1461 28">
+     <span class='ocr_line' id='line_1_6' title="bbox 804 0 1461 28; baseline 0 -6"><span class='ocrx_word' id='word_1_6' title='bbox 804 5 828 22; x_wconf 82' lang='eng'>68</span> <span class='ocrx_word' id='word_1_7' title='bbox 837 12 899 14; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_8' title='bbox 907 3 929 22; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 941 3 1109 28; x_wconf 80' lang='eng' dir='ltr'><em>kentL/Ckyensis</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 1119 3 1189 22; x_wconf 87' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_11' title='bbox 1200 0 1310 22; x_wconf 79' lang='eng' dir='ltr'><em>8—24129T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1320 3 1461 28; x_wconf 88' lang='eng' dir='ltr'><em>(AY183357)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 817 28 837 30">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 817 28 837 30">
+     <span class='ocr_line' id='line_1_7' title="bbox 817 28 837 30; baseline 0 1215"><span class='ocrx_word' id='word_1_13' title='bbox 817 28 837 30; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 836 12 837 45">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 836 12 837 45">
+     <span class='ocr_line' id='line_1_8' title="bbox 836 12 837 45; baseline 0 1200"><span class='ocrx_word' id='word_1_14' title='bbox 836 12 837 45; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 817 28 819 90">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 817 28 819 90">
+     <span class='ocr_line' id='line_1_9' title="bbox 817 28 819 90; baseline 0 1155"><span class='ocrx_word' id='word_1_15' title='bbox 817 28 819 90; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 837 31 1366 59">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 837 31 1366 59">
+     <span class='ocr_line' id='line_1_10' title="bbox 837 31 1366 59; baseline 0 -6"><span class='ocrx_word' id='word_1_16' title='bbox 837 43 867 45; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_17' title='bbox 879 34 902 53; x_wconf 89' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 913 33 1054 58; x_wconf 80' lang='eng' dir='ltr'><em>rifamycinica</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1064 33 1120 53; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1130 31 1215 53; x_wconf 79' lang='eng' dir='ltr'><em>46095T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1225 33 1366 59; x_wconf 85' lang='eng' dir='ltr'><em>(AY083603)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 817 88 853 90">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 817 88 853 90">
+     <span class='ocr_line' id='line_1_11' title="bbox 817 88 853 90; baseline 0 1155"><span class='ocrx_word' id='word_1_22' title='bbox 817 88 853 90; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 860 92 1479 149">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 860 92 1479 149">
+     <span class='ocr_line' id='line_1_12' title="bbox 860 92 1384 119; baseline 0.002 -6"><span class='ocrx_word' id='word_1_23' title='bbox 860 94 883 113; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 894 94 1033 119; x_wconf 83' lang='eng' dir='ltr'><em>pretoriensis</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1043 94 1113 113; x_wconf 90' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_26' title='bbox 1123 92 1234 114; x_wconf 85' lang='eng' dir='ltr'><em>B-24133T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1244 94 1384 119; x_wconf 87' lang='eng' dir='ltr'><em>(AY183357)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 944 122 1479 149; baseline 0 -5"><span class='ocrx_word' id='word_1_28' title='bbox 944 124 967 144; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 979 124 1171 149; x_wconf 83' lang='eng' dir='ltr'><em>vancoresmycina</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1182 124 1238 144; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1248 122 1333 144; x_wconf 77' lang='eng' dir='ltr'><em>44592T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1343 124 1479 149; x_wconf 88' lang='eng' dir='ltr'><em>(AJ508240)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 853 135 937 136">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 853 135 937 136">
+     <span class='ocr_line' id='line_1_14' title="bbox 853 135 937 136; baseline 0 1109"><span class='ocrx_word' id='word_1_33' title='bbox 853 135 937 136; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 781 58 1435 159">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 781 61 1435 100">
+     <span class='ocr_line' id='line_1_15' title="bbox 781 61 1435 100; baseline 0 -17"><span class='ocrx_word' id='word_1_34' title='bbox 781 83 806 100; x_wconf 71' lang='eng'><em>93</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 853 73 870 74; x_wconf 37' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 879 64 902 83; x_wconf 98' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 913 64 1083 89; x_wconf 80' lang='eng' dir='ltr'><em>lexingtonensis</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1093 64 1163 83; x_wconf 88' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_39' title='bbox 1173 61 1284 83; x_wconf 78' lang='eng' dir='ltr'><em>B-24131T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 1294 63 1435 89; x_wconf 88' lang='eng' dir='ltr'><em>(AY183358)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 751 164 1042 166">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 751 164 1042 166">
+     <span class='ocr_line' id='line_1_16' title="bbox 751 164 1042 166; baseline 0 1079"><span class='ocrx_word' id='word_1_41' title='bbox 751 164 1042 166; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 819 167 843 184">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 819 167 843 184">
+     <span class='ocr_line' id='line_1_17' title="bbox 819 167 843 184; baseline 0 0"><span class='ocrx_word' id='word_1_42' title='bbox 819 167 843 184; x_wconf 90' lang='eng'><em>74</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 786 109 788 227">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 786 109 788 227">
+     <span class='ocr_line' id='line_1_18' title="bbox 786 109 788 227; baseline 0 1018"><span class='ocrx_word' id='word_1_43' title='bbox 786 109 788 227; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 708 219 753 221">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 708 219 753 221">
+     <span class='ocr_line' id='line_1_19' title="bbox 708 219 753 221; baseline 0 1024"><span class='ocrx_word' id='word_1_44' title='bbox 708 219 753 221; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 676 243 700 260">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 676 243 700 260">
+     <span class='ocr_line' id='line_1_20' title="bbox 676 243 700 260; baseline 0 0"><span class='ocrx_word' id='word_1_45' title='bbox 676 243 700 260; x_wconf 88' lang='eng'><em>52</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 751 167 753 272">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 751 167 753 272">
+     <span class='ocr_line' id='line_1_21' title="bbox 751 167 753 272; baseline 0 973"><span class='ocrx_word' id='word_1_46' title='bbox 751 167 753 272; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 648 266 775 271">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 648 266 775 271">
+     <span class='ocr_line' id='line_1_22' title="bbox 648 266 775 271; baseline 0 974"><span class='ocrx_word' id='word_1_47' title='bbox 648 266 775 271; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 774 255 775 288">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 774 255 775 288">
+     <span class='ocr_line' id='line_1_23' title="bbox 774 255 775 288; baseline 0 957"><span class='ocrx_word' id='word_1_48' title='bbox 774 255 775 288; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 708 219 710 317">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 708 219 710 317">
+     <span class='ocr_line' id='line_1_24' title="bbox 708 219 710 317; baseline 0 928"><span class='ocrx_word' id='word_1_49' title='bbox 708 219 710 317; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 576 336 649 338">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 576 336 649 338">
+     <span class='ocr_line' id='line_1_25' title="bbox 576 336 649 338; baseline 0 907"><span class='ocrx_word' id='word_1_50' title='bbox 576 336 649 338; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 491 481 577 482">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 491 481 577 482">
+     <span class='ocr_line' id='line_1_26' title="bbox 491 481 577 482; baseline 0 763"><span class='ocrx_word' id='word_1_51' title='bbox 491 481 577 482; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 467 679 493 681">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 467 679 493 681">
+     <span class='ocr_line' id='line_1_27' title="bbox 467 679 493 681; baseline 0 564"><span class='ocrx_word' id='word_1_52' title='bbox 467 679 493 681; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 424 810 468 811">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 424 810 468 811">
+     <span class='ocr_line' id='line_1_28' title="bbox 424 810 468 811; baseline 0 434"><span class='ocrx_word' id='word_1_53' title='bbox 424 810 468 811; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 307 896 426 897">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 307 896 426 897">
+     <span class='ocr_line' id='line_1_29' title="bbox 307 896 426 897; baseline 0 348"><span class='ocrx_word' id='word_1_54' title='bbox 307 896 426 897; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 189 982 309 984">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 189 982 309 984">
+     <span class='ocr_line' id='line_1_30' title="bbox 189 982 309 984; baseline 0 261"><span class='ocrx_word' id='word_1_55' title='bbox 189 982 309 984; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 4 1089 191 1090">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 4 1089 191 1090">
+     <span class='ocr_line' id='line_1_31' title="bbox 4 1089 191 1090; baseline 0 155"><span class='ocrx_word' id='word_1_56' title='bbox 4 1089 191 1090; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 4 1089 5 1230">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 4 1089 5 1230">
+     <span class='ocr_line' id='line_1_32' title="bbox 4 1089 5 1230; baseline 0 15"><span class='ocrx_word' id='word_1_57' title='bbox 4 1089 5 1230; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 189 982 191 1199">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 189 982 191 1199">
+     <span class='ocr_line' id='line_1_33' title="bbox 189 982 191 1199; baseline 0 46"><span class='ocrx_word' id='word_1_58' title='bbox 189 982 191 1199; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 424 810 426 986">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 424 810 426 986">
+     <span class='ocr_line' id='line_1_34' title="bbox 424 810 426 986; baseline 0 259"><span class='ocrx_word' id='word_1_59' title='bbox 424 810 426 986; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 467 679 468 941">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 467 679 468 941">
+     <span class='ocr_line' id='line_1_35' title="bbox 467 679 468 941; baseline 0 304"><span class='ocrx_word' id='word_1_60' title='bbox 467 679 468 941; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 491 481 493 880">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 491 481 493 880">
+     <span class='ocr_line' id='line_1_36' title="bbox 491 481 493 880; baseline 0 365"><span class='ocrx_word' id='word_1_61' title='bbox 491 481 493 880; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 576 336 577 626">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 576 336 577 626">
+     <span class='ocr_line' id='line_1_37' title="bbox 576 336 577 626; baseline 0 619"><span class='ocrx_word' id='word_1_62' title='bbox 576 336 577 626; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 713 338 738 356">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 713 338 738 356">
+     <span class='ocr_line' id='line_1_38' title="bbox 713 338 738 356; baseline 0 0"><span class='ocrx_word' id='word_1_63' title='bbox 713 338 738 356; x_wconf 87' lang='eng'><em>56</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 648 267 649 407">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 648 267 649 407">
+     <span class='ocr_line' id='line_1_39' title="bbox 648 267 649 407; baseline 0 838"><span class='ocrx_word' id='word_1_64' title='bbox 648 267 649 407; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 775 255 873 257">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 775 255 873 257">
+     <span class='ocr_line' id='line_1_40' title="bbox 775 255 873 257; baseline 0 988"><span class='ocrx_word' id='word_1_65' title='bbox 775 255 873 257; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 851 73 853 181">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 851 73 853 181">
+     <span class='ocr_line' id='line_1_41' title="bbox 851 73 853 181; baseline 0 1064"><span class='ocrx_word' id='word_1_66' title='bbox 851 73 853 181; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 856 152 1521 302">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 856 152 1521 302">
+     <span class='ocr_line' id='line_1_42' title="bbox 1052 152 1521 180; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 1052 155 1075 174; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1085 155 1206 180; x_wconf 83' lang='eng' dir='ltr'><em>plumensis</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1215 154 1286 174; x_wconf 88' lang='eng' dir='ltr'><em>SBHS</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1297 152 1370 180; x_wconf 87' lang='eng' dir='ltr'><em>Strp1T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 1380 154 1521 180; x_wconf 87' lang='eng' dir='ltr'><em>(AY262825)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 856 183 1399 211; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 856 188 878 205; x_wconf 87' lang='eng'>91</span> <span class='ocrx_word' id='word_1_73' title='bbox 887 195 894 196; x_wconf 30' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 902 185 925 205; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 937 185 1092 210; x_wconf 80' lang='eng' dir='ltr'><em>tolypomycina</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1103 185 1158 205; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1168 183 1253 205; x_wconf 76' lang='eng' dir='ltr'><em>44544T</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 1263 185 1399 211; x_wconf 86' lang='eng' dir='ltr'><em>(AJ508241)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 926 213 1408 241; baseline 0 -6"><span class='ocrx_word' id='word_1_79' title='bbox 926 216 949 235; x_wconf 94' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 960 216 1101 241; x_wconf 87' lang='eng' dir='ltr'><em>balhimycina</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 1111 215 1167 235; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 1177 213 1262 235; x_wconf 80' lang='eng' dir='ltr'><em>44591T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1272 215 1408 241; x_wconf 81' lang='eng' dir='ltr'><em>(AJ508239)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 880 243 1373 271; baseline 0.002 -6"><span class='ocrx_word' id='word_1_84' title='bbox 880 246 903 265; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 914 246 1064 266; x_wconf 79' lang='eng' dir='ltr'><em>mediterranei</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1073 246 1143 266; x_wconf 90' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 1154 243 1222 266; x_wconf 72' lang='eng' dir='ltr'><em>1739T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 1232 246 1373 271; x_wconf 86' lang='eng' dir='ltr'><em>(AY125600)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 973 274 1409 302; baseline 0 -6"><span class='ocrx_word' id='word_1_89' title='bbox 973 276 996 296; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1007 276 1156 296; x_wconf 83' lang='eng' dir='ltr'><em>australiensis</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1165 274 1258 296; x_wconf 82' lang='eng' dir='ltr'><em>GY048T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1268 276 1409 302; x_wconf 80' lang='eng' dir='ltr'><em>(AY183357)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 851 179 887 181">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 851 179 887 181">
+     <span class='ocr_line' id='line_1_47' title="bbox 851 179 887 181; baseline 0 1064"><span class='ocrx_word' id='word_1_93' title='bbox 851 179 887 181; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 886 164 887 196">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 886 164 887 196">
+     <span class='ocr_line' id='line_1_48' title="bbox 886 164 887 196; baseline 0 1049"><span class='ocrx_word' id='word_1_94' title='bbox 886 164 887 196; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 612 286 1419 332">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 612 305 1419 332">
+     <span class='ocr_line' id='line_1_49' title="bbox 612 305 1419 332; baseline -0.004 -3"><span class='ocrx_word' id='word_1_95' title='bbox 612 313 636 330; x_wconf 88' lang='eng'>50</span> <span class='ocrx_word' id='word_1_96' title='bbox 710 316 935 317; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_97' title='bbox 944 307 967 327; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 978 307 1133 327; x_wconf 82' lang='eng' dir='ltr'><em>saalfe/densis</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1143 307 1183 327; x_wconf 92' lang='eng' dir='ltr'><em>HKI</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 1194 305 1264 327; x_wconf 91' lang='eng' dir='ltr'><em>0457T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 1274 307 1419 332; x_wconf 88' lang='eng' dir='ltr'><em>(DQ792500)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 962 335 1290 362">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 962 335 1290 362">
+     <span class='ocr_line' id='line_1_50' title="bbox 962 335 1290 362; baseline 0 -5"><span class='ocrx_word' id='word_1_102' title='bbox 962 337 985 357; x_wconf 97' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 997 337 1069 357; x_wconf 68' lang='eng' dir='ltr'><em>rubida</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 1081 335 1141 357; x_wconf 79' lang='eng' dir='ltr'><em>13.4T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1150 337 1290 362; x_wconf 88' lang='eng' dir='ltr'><em>(AF222022)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 787 366 1305 393">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 787 366 1305 393">
+     <span class='ocr_line' id='line_1_51' title="bbox 787 366 1305 393; baseline -0.002 -5"><span class='ocrx_word' id='word_1_106' title='bbox 787 368 810 387; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 821 368 962 388; x_wconf 83' lang='eng' dir='ltr'><em>albidoﬂavus</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 972 368 1045 388; x_wconf 86' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 1057 366 1154 388; x_wconf 81' lang='eng' dir='ltr'><em>100337T</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 1164 368 1305 393; x_wconf 88' lang='eng' dir='ltr'><em>(AB327251)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 648 405 1200 408">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 648 405 1200 408">
+     <span class='ocr_line' id='line_1_52' title="bbox 648 405 1200 408; baseline 0 837"><span class='ocrx_word' id='word_1_111' title='bbox 648 405 1200 408; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 680 414 705 431">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 680 414 705 431">
+     <span class='ocr_line' id='line_1_53' title="bbox 680 414 705 431; baseline 0 0"><span class='ocrx_word' id='word_1_112' title='bbox 680 414 705 431; x_wconf 74' lang='eng'><em>89</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 713 362 715 446">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 713 362 715 446">
+     <span class='ocr_line' id='line_1_54' title="bbox 713 362 715 446; baseline 0 799"><span class='ocrx_word' id='word_1_113' title='bbox 713 362 715 446; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 713 445 741 446">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 713 445 741 446">
+     <span class='ocr_line' id='line_1_55' title="bbox 713 445 741 446; baseline 0 799"><span class='ocrx_word' id='word_1_114' title='bbox 713 445 741 446; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 786 438 787 470">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 786 438 787 470">
+     <span class='ocr_line' id='line_1_56' title="bbox 786 438 787 470; baseline 0 775"><span class='ocrx_word' id='word_1_115' title='bbox 786 438 787 470; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 739 407 741 486">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 739 407 741 486">
+     <span class='ocr_line' id='line_1_57' title="bbox 739 407 741 486; baseline 0 759"><span class='ocrx_word' id='word_1_116' title='bbox 739 407 741 486; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 739 484 779 486">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 739 484 779 486">
+     <span class='ocr_line' id='line_1_58' title="bbox 739 484 779 486; baseline 0 759"><span class='ocrx_word' id='word_1_117' title='bbox 739 484 779 486; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 777 453 779 515">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 777 453 779 515">
+     <span class='ocr_line' id='line_1_59' title="bbox 777 453 779 515; baseline 0 730"><span class='ocrx_word' id='word_1_118' title='bbox 777 453 779 515; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 777 513 810 515">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 777 513 810 515">
+     <span class='ocr_line' id='line_1_60' title="bbox 777 513 810 515; baseline 0 730"><span class='ocrx_word' id='word_1_119' title='bbox 777 513 810 515; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 808 498 810 531">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 808 498 810 531">
+     <span class='ocr_line' id='line_1_61' title="bbox 808 498 810 531; baseline 0 714"><span class='ocrx_word' id='word_1_120' title='bbox 808 498 810 531; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 662 549 841 600">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 662 549 841 600">
+     <span class='ocr_line' id='line_1_62' title="bbox 701 549 841 570; baseline 0 0"><span class='ocrx_word' id='word_1_121' title='bbox 701 549 726 567; x_wconf 81' lang='eng'>95</span> <span class='ocrx_word' id='word_1_122' title='bbox 818 550 841 570; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 662 560 838 600; baseline 0 -9"><span class='ocrx_word' id='word_1_123' title='bbox 662 560 838 600; x_wconf 58' lang='eng' dir='ltr'><em>{A</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_58' title="bbox 626 598 647 616">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 626 598 647 616">
+     <span class='ocr_line' id='line_1_64' title="bbox 626 598 647 616; baseline 0 0"><span class='ocrx_word' id='word_1_124' title='bbox 626 598 647 616; x_wconf 88' lang='eng'><em>91</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_59' title="bbox 576 624 662 626">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 576 624 662 626">
+     <span class='ocr_line' id='line_1_65' title="bbox 576 624 662 626; baseline 0 619"><span class='ocrx_word' id='word_1_125' title='bbox 576 624 662 626; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_60' title="bbox 751 641 837 661">
+    <p class='ocr_par' dir='ltr' id='par_1_60' title="bbox 751 641 837 661">
+     <span class='ocr_line' id='line_1_66' title="bbox 751 641 837 661; baseline 0 0"><span class='ocrx_word' id='word_1_126' title='bbox 751 641 837 661; x_wconf 36' lang='eng' dir='ltr'><em>857A.</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_61' title="bbox 755 665 784 667">
+    <p class='ocr_par' dir='ltr' id='par_1_61' title="bbox 755 665 784 667">
+     <span class='ocr_line' id='line_1_67' title="bbox 755 665 784 667; baseline 0 578"><span class='ocrx_word' id='word_1_127' title='bbox 755 665 784 667; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_62' title="bbox 660 574 662 677">
+    <p class='ocr_par' dir='ltr' id='par_1_62' title="bbox 660 574 662 677">
+     <span class='ocr_line' id='line_1_68' title="bbox 660 574 662 677; baseline 0 568"><span class='ocrx_word' id='word_1_128' title='bbox 660 574 662 677; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_63' title="bbox 782 650 784 682">
+    <p class='ocr_par' dir='ltr' id='par_1_63' title="bbox 782 650 784 682">
+     <span class='ocr_line' id='line_1_69' title="bbox 782 650 784 682; baseline 0 563"><span class='ocrx_word' id='word_1_129' title='bbox 782 650 784 682; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_64' title="bbox 660 676 729 677">
+    <p class='ocr_par' dir='ltr' id='par_1_64' title="bbox 660 676 729 677">
+     <span class='ocr_line' id='line_1_70' title="bbox 660 676 729 677; baseline 0 568"><span class='ocrx_word' id='word_1_130' title='bbox 660 676 729 677; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_65' title="bbox 727 621 729 731">
+    <p class='ocr_par' dir='ltr' id='par_1_65' title="bbox 727 621 729 731">
+     <span class='ocr_line' id='line_1_71' title="bbox 727 621 729 731; baseline 0 514"><span class='ocrx_word' id='word_1_131' title='bbox 727 621 729 731; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_66' title="bbox 755 665 757 796">
+    <p class='ocr_par' dir='ltr' id='par_1_66' title="bbox 755 665 757 796">
+     <span class='ocr_line' id='line_1_72' title="bbox 755 665 757 796; baseline 0 449"><span class='ocrx_word' id='word_1_132' title='bbox 755 665 757 796; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_67' title="bbox 755 794 791 796">
+    <p class='ocr_par' dir='ltr' id='par_1_67' title="bbox 755 794 791 796">
+     <span class='ocr_line' id='line_1_73' title="bbox 755 794 791 796; baseline 0 449"><span class='ocrx_word' id='word_1_133' title='bbox 755 794 791 796; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_68' title="bbox 789 772 791 818">
+    <p class='ocr_par' dir='ltr' id='par_1_68' title="bbox 789 772 791 818">
+     <span class='ocr_line' id='line_1_74' title="bbox 789 772 791 818; baseline 0 427"><span class='ocrx_word' id='word_1_134' title='bbox 789 772 791 818; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_69' title="bbox 787 438 875 439">
+    <p class='ocr_par' dir='ltr' id='par_1_69' title="bbox 787 438 875 439">
+     <span class='ocr_line' id='line_1_75' title="bbox 787 438 875 439; baseline 0 806"><span class='ocrx_word' id='word_1_135' title='bbox 787 438 875 439; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_70' title="bbox 810 498 903 500">
+    <p class='ocr_par' dir='ltr' id='par_1_70' title="bbox 810 498 903 500">
+     <span class='ocr_line' id='line_1_76' title="bbox 810 498 903 500; baseline 0 745"><span class='ocrx_word' id='word_1_136' title='bbox 810 498 903 500; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_71' title="bbox 883 396 1716 454">
+    <p class='ocr_par' dir='ltr' id='par_1_71' title="bbox 883 396 1716 454">
+     <span class='ocr_line' id='line_1_77' title="bbox 1208 396 1716 424; baseline 0 -6"><span class='ocrx_word' id='word_1_137' title='bbox 1208 398 1231 418; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 1243 398 1404 423; x_wconf 81' lang='eng' dir='ltr'><em>benzoati/ytica</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 1414 398 1470 418; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 1480 396 1565 418; x_wconf 78' lang='eng' dir='ltr'><em>43387T</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 1575 398 1716 424; x_wconf 85' lang='eng' dir='ltr'><em>(AY957506)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_78' title="bbox 883 426 1392 454; baseline 0 -6"><span class='ocrx_word' id='word_1_142' title='bbox 883 429 906 448; x_wconf 98' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 917 429 1058 448; x_wconf 87' lang='eng' dir='ltr'><em>albidoflavus</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 1068 428 1151 448; x_wconf 90' lang='eng' dir='ltr'><em>IMSNU</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 1161 426 1246 448; x_wconf 80' lang='eng' dir='ltr'><em>22139T</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 1256 429 1392 454; x_wconf 87' lang='eng' dir='ltr'><em>(AJ252832)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_72' title="bbox 787 456 1284 484">
+    <p class='ocr_par' dir='ltr' id='par_1_72' title="bbox 787 456 1284 484">
+     <span class='ocr_line' id='line_1_79' title="bbox 787 456 1284 484; baseline 0.002 -6"><span class='ocrx_word' id='word_1_147' title='bbox 787 469 863 470; x_wconf 41' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 872 459 895 478; x_wconf 96' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 906 459 1052 479; x_wconf 76' lang='eng' dir='ltr'><em>halotolerans</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 1062 456 1129 479; x_wconf 83' lang='eng' dir='ltr'><em>N4-6T</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 1139 459 1284 484; x_wconf 86' lang='eng' dir='ltr'><em>(DQOOO196)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_73' title="bbox 908 487 1317 514">
+    <p class='ocr_par' dir='ltr' id='par_1_73' title="bbox 908 487 1317 514">
+     <span class='ocr_line' id='line_1_80' title="bbox 908 487 1317 514; baseline 0 -5"><span class='ocrx_word' id='word_1_152' title='bbox 908 489 931 509; x_wconf 97' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 943 489 1099 514; x_wconf 81' lang='eng' dir='ltr'><em>echigonensis</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 1108 487 1166 509; x_wconf 78' lang='eng' dir='ltr'><em>L02T</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 1176 489 1317 514; x_wconf 86' lang='eng' dir='ltr'><em>(AB248535)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_74' title="bbox 810 517 1262 545">
+    <p class='ocr_par' dir='ltr' id='par_1_74' title="bbox 810 517 1262 545">
+     <span class='ocr_line' id='line_1_81' title="bbox 810 517 1262 545; baseline 0 -6"><span class='ocrx_word' id='word_1_156' title='bbox 810 529 860 531; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_157' title='bbox 868 520 891 539; x_wconf 76' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 902 520 1028 545; x_wconf 82' lang='eng' dir='ltr'><em>niigatensis</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 1038 517 1111 539; x_wconf 86' lang='eng' dir='ltr'><em>LC11T</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 1121 519 1262 545; x_wconf 77' lang='eng' dir='ltr'><em>(ABZ48537)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_75' title="bbox 850 548 1308 606">
+    <p class='ocr_par' dir='ltr' id='par_1_75' title="bbox 850 548 1308 606">
+     <span class='ocr_line' id='line_1_82' title="bbox 853 548 1212 575; baseline 0 -5"><span class='ocrx_word' id='word_1_161' title='bbox 853 550 901 570; x_wconf 84' lang='eng' dir='ltr'><em>alba</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 912 550 968 570; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 977 548 1063 570; x_wconf 78' lang='eng' dir='ltr'><em>44262T</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 1073 550 1212 575; x_wconf 86' lang='eng' dir='ltr'><em>(AF051340)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_83' title="bbox 850 578 1308 606; baseline -0.002 -5"><span class='ocrx_word' id='word_1_165' title='bbox 850 581 1000 601; x_wconf 83' lang='eng' dir='ltr'><em>coloradensis</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 1010 581 1080 600; x_wconf 86' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_167' title='bbox 1090 578 1159 601; x_wconf 85' lang='eng' dir='ltr'><em>3218T</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 1168 580 1308 606; x_wconf 88' lang='eng' dir='ltr'><em>(AF051341)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_76' title="bbox 729 609 1257 636">
+    <p class='ocr_par' dir='ltr' id='par_1_76' title="bbox 729 609 1257 636">
+     <span class='ocr_line' id='line_1_84' title="bbox 729 609 1257 636; baseline 0 -5"><span class='ocrx_word' id='word_1_169' title='bbox 729 620 799 622; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_170' title='bbox 808 611 831 631; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 842 616 923 631; x_wconf 87' lang='eng' dir='ltr'><em>azurea</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 933 611 1016 631; x_wconf 88' lang='eng' dir='ltr'><em>IMSNU</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 1026 609 1111 631; x_wconf 85' lang='eng' dir='ltr'><em>20053T</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 1121 611 1257 636; x_wconf 86' lang='eng' dir='ltr'><em>(AJ400709)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_77' title="bbox 846 639 1548 727">
+    <p class='ocr_par' dir='ltr' id='par_1_77' title="bbox 846 639 1548 727">
+     <span class='ocr_line' id='line_1_85' title="bbox 848 639 1532 667; baseline 0 -6"><span class='ocrx_word' id='word_1_175' title='bbox 848 642 990 667; x_wconf 84' lang='eng' dir='ltr'><em>keratiniphila</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 1000 642 1075 667; x_wconf 86' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 1086 642 1223 667; x_wconf 82' lang='eng' dir='ltr'><em>nogabecina</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 1234 641 1290 661; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 1300 639 1385 661; x_wconf 81' lang='eng' dir='ltr'><em>44586T</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 1395 641 1532 667; x_wconf 85' lang='eng' dir='ltr'><em>(AJ508238)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_86' title="bbox 846 670 1548 697; baseline 0 -5"><span class='ocrx_word' id='word_1_181' title='bbox 846 689 849 692; x_wconf 99' lang='eng'><em>.</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 860 672 1002 697; x_wconf 81' lang='eng' dir='ltr'><em>keratiniphi/a</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 1012 672 1088 697; x_wconf 84' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 1098 672 1240 697; x_wconf 85' lang='eng' dir='ltr'><em>keratiniphi/a</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 1251 672 1307 692; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 1316 670 1402 692; x_wconf 76' lang='eng' dir='ltr'><em>44409T</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 1411 672 1548 697; x_wconf 86' lang='eng' dir='ltr'><em>(AJ278496)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_87' title="bbox 849 700 1221 727; baseline 0 -5"><span class='ocrx_word' id='word_1_188' title='bbox 849 702 913 722; x_wconf 86' lang='eng' dir='ltr'><em>Iurida</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 924 702 980 722; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 990 700 1075 722; x_wconf 78' lang='eng' dir='ltr'><em>43134T</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 1085 702 1221 727; x_wconf 85' lang='eng' dir='ltr'><em>(AJ577997)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_78' title="bbox 696 672 1322 771">
+    <p class='ocr_par' dir='ltr' id='par_1_78' title="bbox 696 672 1322 758">
+     <span class='ocr_line' id='line_1_88' title="bbox 696 672 843 701; baseline 0 0"><span class='ocrx_word' id='word_1_192' title='bbox 696 684 721 701; x_wconf 82' lang='eng'><em>88</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 784 681 817 682; x_wconf 35' lang='eng' dir='ltr'><em>i</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 826 672 843 692; x_wconf 76' lang='eng' dir='ltr'><em>A</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_89' title="bbox 757 702 838 722; baseline 0 0"><span class='ocrx_word' id='word_1_195' title='bbox 757 712 808 713; x_wconf 39' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 815 702 838 722; x_wconf 97' lang='eng' dir='ltr'><em>A.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_90' title="bbox 757 730 1322 758; baseline 0 -6"><span class='ocrx_word' id='word_1_197' title='bbox 757 741 829 743; x_wconf 94' lang='eng'>—</span> <span class='ocrx_word' id='word_1_198' title='bbox 836 733 859 752; x_wconf 96' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 871 733 1014 757; x_wconf 80' lang='eng' dir='ltr'><em>decaplanina</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 1025 732 1081 752; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 1090 730 1175 752; x_wconf 78' lang='eng' dir='ltr'><em>44594T</em></span> <span class='ocrx_word' id='word_1_202' title='bbox 1185 732 1322 758; x_wconf 83' lang='eng' dir='ltr'><em>(AJ508237)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_79' title="bbox 922 760 1354 788">
+    <p class='ocr_par' dir='ltr' id='par_1_79' title="bbox 922 760 1354 788">
+     <span class='ocr_line' id='line_1_91' title="bbox 922 760 1354 788; baseline 0 -6"><span class='ocrx_word' id='word_1_203' title='bbox 922 763 944 782; x_wconf 90' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_204' title='bbox 952 763 1055 788; x_wconf 80' lang='eng' dir='ltr'><em>japan/ca</em></span> <span class='ocrx_word' id='word_1_205' title='bbox 1065 760 1237 783; x_wconf 73' lang='eng' dir='ltr'><em>MG417-CF17T</em></span> <span class='ocrx_word' id='word_1_206' title='bbox 1247 763 1354 788; x_wconf 84' lang='eng' dir='ltr'><em>(X77959)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_80' title="bbox 755 790 1310 841">
+    <p class='ocr_par' dir='ltr' id='par_1_80' title="bbox 755 790 1310 841">
+     <span class='ocr_line' id='line_1_92' title="bbox 755 790 1310 834; baseline 0.002 -22"><span class='ocrx_word' id='word_1_207' title='bbox 755 803 780 820; x_wconf 72' lang='eng'>85</span> <span class='ocrx_word' id='word_1_208' title='bbox 791 803 825 834; x_wconf 22' lang='eng'>%</span> <span class='ocrx_word' id='word_1_209' title='bbox 835 793 858 812; x_wconf 98' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 869 793 976 813; x_wconf 77' lang='eng' dir='ltr'><em>orientalis</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 986 793 1068 813; x_wconf 90' lang='eng' dir='ltr'>IMSNU</span> <span class='ocrx_word' id='word_1_212' title='bbox 1079 790 1163 813; x_wconf 87' lang='eng' dir='ltr'><em>20058T</em></span> <span class='ocrx_word' id='word_1_213' title='bbox 1173 793 1310 818; x_wconf 88' lang='eng' dir='ltr'><em>(AJ400711)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_93' title="bbox 788 824 813 841; baseline 0 0"><span class='ocrx_word' id='word_1_214' title='bbox 788 824 813 841; x_wconf 85' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_81' title="bbox 835 821 1260 848">
+    <p class='ocr_par' dir='ltr' id='par_1_81' title="bbox 835 821 1260 848">
+     <span class='ocr_line' id='line_1_94' title="bbox 835 821 1260 848; baseline 0 -5"><span class='ocrx_word' id='word_1_215' title='bbox 835 823 858 843; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_216' title='bbox 869 823 1007 848; x_wconf 85' lang='eng' dir='ltr'><em>regifaucium</em></span> <span class='ocrx_word' id='word_1_217' title='bbox 1016 821 1109 843; x_wconf 89' lang='eng' dir='ltr'><em>GY080T</em></span> <span class='ocrx_word' id='word_1_218' title='bbox 1119 823 1260 848; x_wconf 85' lang='eng' dir='ltr'><em>(AY129760)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_82' title="bbox 638 854 662 872">
+    <p class='ocr_par' dir='ltr' id='par_1_82' title="bbox 638 854 662 872">
+     <span class='ocr_line' id='line_1_95' title="bbox 638 854 662 872; baseline 0 0"><span class='ocrx_word' id='word_1_219' title='bbox 638 854 662 872; x_wconf 84' lang='eng'>98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_83' title="bbox 491 878 679 880">
+    <p class='ocr_par' dir='ltr' id='par_1_83' title="bbox 491 878 679 880">
+     <span class='ocr_line' id='line_1_96' title="bbox 491 878 679 880; baseline 0 365"><span class='ocrx_word' id='word_1_220' title='bbox 491 878 679 880; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_84' title="bbox 504 913 528 931">
+    <p class='ocr_par' dir='ltr' id='par_1_84' title="bbox 504 913 528 931">
+     <span class='ocr_line' id='line_1_97' title="bbox 504 913 528 931; baseline 0 0"><span class='ocrx_word' id='word_1_221' title='bbox 504 913 528 931; x_wconf 86' lang='eng'><em>72</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_85' title="bbox 467 939 548 941">
+    <p class='ocr_par' dir='ltr' id='par_1_85' title="bbox 467 939 548 941">
+     <span class='ocr_line' id='line_1_98' title="bbox 467 939 548 941; baseline 0 304"><span class='ocrx_word' id='word_1_222' title='bbox 467 939 548 941; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_86' title="bbox 546 924 548 956">
+    <p class='ocr_par' dir='ltr' id='par_1_86' title="bbox 546 924 548 956">
+     <span class='ocr_line' id='line_1_99' title="bbox 546 924 548 956; baseline 0 289"><span class='ocrx_word' id='word_1_223' title='bbox 546 924 548 956; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_87' title="bbox 677 863 679 896">
+    <p class='ocr_par' dir='ltr' id='par_1_87' title="bbox 677 863 679 896">
+     <span class='ocr_line' id='line_1_100' title="bbox 677 863 679 896; baseline 0 349"><span class='ocrx_word' id='word_1_224' title='bbox 677 863 679 896; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_88' title="bbox 844 851 1338 909">
+    <p class='ocr_par' dir='ltr' id='par_1_88' title="bbox 844 851 1338 909">
+     <span class='ocr_line' id='line_1_101' title="bbox 844 851 1338 878; baseline 0 -5"><span class='ocrx_word' id='word_1_225' title='bbox 844 853 867 873; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_226' title='bbox 878 853 1007 878; x_wconf 88' lang='eng' dir='ltr'><em>nigrescens</em></span> <span class='ocrx_word' id='word_1_227' title='bbox 1016 851 1183 873; x_wconf 78' lang='eng' dir='ltr'><em>CSC17Ta-90T</em></span> <span class='ocrx_word' id='word_1_228' title='bbox 1192 853 1338 878; x_wconf 88' lang='eng' dir='ltr'><em>(DQ486888)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_102' title="bbox 874 881 1326 909; baseline 0.002 -6"><span class='ocrx_word' id='word_1_229' title='bbox 874 884 897 903; x_wconf 97' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_230' title='bbox 908 884 1079 904; x_wconf 77' lang='eng' dir='ltr'><em>minnesotensis</em></span> <span class='ocrx_word' id='word_1_231' title='bbox 1088 881 1171 904; x_wconf 82' lang='eng' dir='ltr'><em>32U-2T</em></span> <span class='ocrx_word' id='word_1_232' title='bbox 1180 883 1326 909; x_wconf 86' lang='eng' dir='ltr'><em>(DQO76842)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_89' title="bbox 761 911 1222 969">
+    <p class='ocr_par' dir='ltr' id='par_1_89' title="bbox 761 911 1222 969">
+     <span class='ocr_line' id='line_1_103' title="bbox 802 911 1172 939; baseline 0 -6"><span class='ocrx_word' id='word_1_233' title='bbox 802 914 825 933; x_wconf 94' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_234' title='bbox 832 914 940 939; x_wconf 84' lang='eng' dir='ltr'><em>jejuensis</em></span> <span class='ocrx_word' id='word_1_235' title='bbox 949 911 1017 933; x_wconf 81' lang='eng' dir='ltr'><em>N7-3T</em></span> <span class='ocrx_word' id='word_1_236' title='bbox 1026 913 1172 939; x_wconf 77' lang='eng'>(00000200)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_104' title="bbox 761 942 1222 969; baseline 0 -5"><span class='ocrx_word' id='word_1_237' title='bbox 761 944 784 964; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_238' title='bbox 796 944 912 969; x_wconf 82' lang='eng' dir='ltr'><em>sulphurea</em></span> <span class='ocrx_word' id='word_1_239' title='bbox 922 944 978 964; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_240' title='bbox 989 942 1073 964; x_wconf 81' lang='eng' dir='ltr'><em>46092T</em></span> <span class='ocrx_word' id='word_1_241' title='bbox 1083 944 1222 969; x_wconf 85' lang='eng' dir='ltr'><em>(AF051343)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_90' title="bbox 824 974 841 994">
+    <p class='ocr_par' dir='ltr' id='par_1_90' title="bbox 824 974 841 994">
+     <span class='ocr_line' id='line_1_105' title="bbox 824 974 841 994; baseline 0 0"><span class='ocrx_word' id='word_1_242' title='bbox 824 974 841 994; x_wconf 92' lang='eng' dir='ltr'><em>A</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_91' title="bbox 699 1015 786 1017">
+    <p class='ocr_par' dir='ltr' id='par_1_91' title="bbox 699 1015 786 1017">
+     <span class='ocr_line' id='line_1_106' title="bbox 699 1015 786 1017; baseline 0 228"><span class='ocrx_word' id='word_1_243' title='bbox 699 1015 786 1017; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_92' title="bbox 653 1007 690 1025">
+    <p class='ocr_par' dir='ltr' id='par_1_92' title="bbox 653 1007 690 1025">
+     <span class='ocr_line' id='line_1_107' title="bbox 653 1007 690 1025; baseline 0 0"><span class='ocrx_word' id='word_1_244' title='bbox 653 1007 690 1025; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_93' title="bbox 357 1030 699 1032">
+    <p class='ocr_par' dir='ltr' id='par_1_93' title="bbox 357 1030 699 1032">
+     <span class='ocr_line' id='line_1_108' title="bbox 357 1030 699 1032; baseline 0 213"><span class='ocrx_word' id='word_1_245' title='bbox 357 1030 699 1032; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_94' title="bbox 307 896 309 1068">
+    <p class='ocr_par' dir='ltr' id='par_1_94' title="bbox 307 896 309 1068">
+     <span class='ocr_line' id='line_1_109' title="bbox 307 896 309 1068; baseline 0 177"><span class='ocrx_word' id='word_1_246' title='bbox 307 896 309 1068; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_95' title="bbox 307 1066 358 1068">
+    <p class='ocr_par' dir='ltr' id='par_1_95' title="bbox 307 1066 358 1068">
+     <span class='ocr_line' id='line_1_110' title="bbox 307 1066 358 1068; baseline 0 177"><span class='ocrx_word' id='word_1_247' title='bbox 307 1066 358 1068; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_96' title="bbox 357 1030 358 1104">
+    <p class='ocr_par' dir='ltr' id='par_1_96' title="bbox 357 1030 358 1104">
+     <span class='ocr_line' id='line_1_111' title="bbox 357 1030 358 1104; baseline 0 141"><span class='ocrx_word' id='word_1_248' title='bbox 357 1030 358 1104; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_97' title="bbox 441 1080 465 1097">
+    <p class='ocr_par' dir='ltr' id='par_1_97' title="bbox 441 1080 465 1097">
+     <span class='ocr_line' id='line_1_112' title="bbox 441 1080 465 1097; baseline 0 0"><span class='ocrx_word' id='word_1_249' title='bbox 441 1080 465 1097; x_wconf 81' lang='eng'>58</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_98' title="bbox 698 1015 699 1047">
+    <p class='ocr_par' dir='ltr' id='par_1_98' title="bbox 698 1015 699 1047">
+     <span class='ocr_line' id='line_1_113' title="bbox 698 1015 699 1047; baseline 0 198"><span class='ocrx_word' id='word_1_250' title='bbox 698 1015 699 1047; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_99' title="bbox 844 972 1173 999">
+    <p class='ocr_par' dir='ltr' id='par_1_99' title="bbox 844 972 1173 999">
+     <span class='ocr_line' id='line_1_114' title="bbox 844 972 1173 999; baseline 0 -5"><span class='ocrx_word' id='word_1_251' title='bbox 844 991 847 994; x_wconf 99' lang='eng'><em>.</em></span> <span class='ocrx_word' id='word_1_252' title='bbox 859 974 959 994; x_wconf 85' lang='eng' dir='ltr'><em>sacchari</em></span> <span class='ocrx_word' id='word_1_253' title='bbox 967 972 1024 994; x_wconf 92' lang='eng' dir='ltr'><em>K24T</em></span> <span class='ocrx_word' id='word_1_254' title='bbox 1034 974 1173 999; x_wconf 82' lang='eng' dir='ltr'><em>(AF223354)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_100' title="bbox 699 1002 1227 1059">
+    <p class='ocr_par' dir='ltr' id='par_1_100' title="bbox 699 1002 1227 1059">
+     <span class='ocr_line' id='line_1_115' title="bbox 791 1002 1186 1030; baseline 0 -6"><span class='ocrx_word' id='word_1_255' title='bbox 791 1005 817 1024; x_wconf 94' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_256' title='bbox 827 1005 914 1024; x_wconf 84' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_257' title='bbox 924 1002 1034 1024; x_wconf 76' lang='eng' dir='ltr'><em>Ms392AT</em></span> <span class='ocrx_word' id='word_1_258' title='bbox 1044 1004 1186 1030; x_wconf 85' lang='eng' dir='ltr'><em>(EU329845)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_116' title="bbox 699 1032 1227 1059; baseline 0 -5"><span class='ocrx_word' id='word_1_259' title='bbox 699 1034 789 1054; x_wconf 95' lang='eng' dir='ltr'><em>—A.</em></span> <span class='ocrx_word' id='word_1_260' title='bbox 800 1034 990 1059; x_wconf 76' lang='eng' dir='ltr'><em>palatopharyngis</em></span> <span class='ocrx_word' id='word_1_261' title='bbox 1001 1032 1077 1054; x_wconf 88' lang='eng' dir='ltr'><em>1BDZT</em></span> <span class='ocrx_word' id='word_1_262' title='bbox 1087 1034 1227 1059; x_wconf 81' lang='eng' dir='ltr'><em>(AF479268)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_101' title="bbox 482 1075 1159 1077">
+    <p class='ocr_par' dir='ltr' id='par_1_101' title="bbox 482 1075 1159 1077">
+     <span class='ocr_line' id='line_1_117' title="bbox 482 1075 1159 1077; baseline 0 168"><span class='ocrx_word' id='word_1_263' title='bbox 482 1075 1159 1077; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_102' title="bbox 357 1102 484 1104">
+    <p class='ocr_par' dir='ltr' id='par_1_102' title="bbox 357 1102 484 1104">
+     <span class='ocr_line' id='line_1_118' title="bbox 357 1102 484 1104; baseline 0 141"><span class='ocrx_word' id='word_1_264' title='bbox 357 1102 484 1104; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_103' title="bbox 482 1075 484 1130">
+    <p class='ocr_par' dir='ltr' id='par_1_103' title="bbox 482 1075 484 1130">
+     <span class='ocr_line' id='line_1_119' title="bbox 482 1075 484 1130; baseline 0 115"><span class='ocrx_word' id='word_1_265' title='bbox 482 1075 484 1130; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_104' title="bbox 778 1105 815 1122">
+    <p class='ocr_par' dir='ltr' id='par_1_104' title="bbox 778 1105 815 1122">
+     <span class='ocr_line' id='line_1_120' title="bbox 778 1105 815 1122; baseline 0 0"><span class='ocrx_word' id='word_1_266' title='bbox 778 1105 815 1122; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_105' title="bbox 482 1128 829 1130">
+    <p class='ocr_par' dir='ltr' id='par_1_105' title="bbox 482 1128 829 1130">
+     <span class='ocr_line' id='line_1_121' title="bbox 482 1128 829 1130; baseline 0 115"><span class='ocrx_word' id='word_1_267' title='bbox 482 1128 829 1130; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_106' title="bbox 827 1106 829 1152">
+    <p class='ocr_par' dir='ltr' id='par_1_106' title="bbox 827 1106 829 1152">
+     <span class='ocr_line' id='line_1_122' title="bbox 827 1106 829 1152; baseline 0 93"><span class='ocrx_word' id='word_1_268' title='bbox 827 1106 829 1152; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_107' title="bbox 829 1106 927 1108">
+    <p class='ocr_par' dir='ltr' id='par_1_107' title="bbox 829 1106 927 1108">
+     <span class='ocr_line' id='line_1_123' title="bbox 829 1106 927 1108; baseline 0 137"><span class='ocrx_word' id='word_1_269' title='bbox 829 1106 927 1108; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_108' title="bbox 932 1062 1621 1150">
+    <p class='ocr_par' dir='ltr' id='par_1_108' title="bbox 932 1062 1621 1150">
+     <span class='ocr_line' id='line_1_124' title="bbox 1168 1062 1621 1090; baseline 0 -6"><span class='ocrx_word' id='word_1_270' title='bbox 1168 1065 1190 1084; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_271' title='bbox 1202 1065 1342 1084; x_wconf 83' lang='eng' dir='ltr'><em>taiwanensis</em></span> <span class='ocrx_word' id='word_1_272' title='bbox 1350 1062 1466 1084; x_wconf 90' lang='eng' dir='ltr'><em>0345M-7T</em></span> <span class='ocrx_word' id='word_1_273' title='bbox 1476 1064 1621 1090; x_wconf 85' lang='eng' dir='ltr'><em>(DQ160215)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_125' title="bbox 934 1092 1349 1120; baseline 0 -6"><span class='ocrx_word' id='word_1_274' title='bbox 934 1095 957 1114; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_275' title='bbox 969 1095 1103 1120; x_wconf 83' lang='eng' dir='ltr'><em>eurytherma</em></span> <span class='ocrx_word' id='word_1_276' title='bbox 1114 1092 1203 1114; x_wconf 88' lang='eng' dir='ltr'><em>NT202T</em></span> <span class='ocrx_word' id='word_1_277' title='bbox 1213 1094 1349 1120; x_wconf 89' lang='eng' dir='ltr'><em>(AJ000285)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_126' title="bbox 932 1122 1460 1150; baseline 0.002 -6"><span class='ocrx_word' id='word_1_278' title='bbox 932 1137 940 1139; x_wconf 98' lang='eng'><em>-</em></span> <span class='ocrx_word' id='word_1_279' title='bbox 948 1125 971 1144; x_wconf 73' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_280' title='bbox 982 1125 1126 1145; x_wconf 83' lang='eng' dir='ltr'><em>methanol/ca</em></span> <span class='ocrx_word' id='word_1_281' title='bbox 1137 1125 1219 1145; x_wconf 92' lang='eng' dir='ltr'><em>IMSNU</em></span> <span class='ocrx_word' id='word_1_282' title='bbox 1230 1122 1314 1145; x_wconf 88' lang='eng' dir='ltr'><em>20055T</em></span> <span class='ocrx_word' id='word_1_283' title='bbox 1324 1125 1460 1150; x_wconf 85' lang='eng' dir='ltr'><em>(AJ249135)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_109' title="bbox 827 1151 932 1152">
+    <p class='ocr_par' dir='ltr' id='par_1_109' title="bbox 827 1151 932 1152">
+     <span class='ocr_line' id='line_1_127' title="bbox 827 1151 932 1152; baseline 0 93"><span class='ocrx_word' id='word_1_284' title='bbox 827 1151 932 1152; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_110' title="bbox 930 1137 932 1168">
+    <p class='ocr_par' dir='ltr' id='par_1_110' title="bbox 930 1137 932 1168">
+     <span class='ocr_line' id='line_1_128' title="bbox 930 1137 932 1168; baseline 0 77"><span class='ocrx_word' id='word_1_285' title='bbox 930 1137 932 1168; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_111' title="bbox 879 1152 1388 1180">
+    <p class='ocr_par' dir='ltr' id='par_1_111' title="bbox 879 1152 1388 1180">
+     <span class='ocr_line' id='line_1_129' title="bbox 879 1152 1388 1180; baseline 0.002 -6"><span class='ocrx_word' id='word_1_286' title='bbox 879 1161 915 1179; x_wconf 81' lang='eng'>100</span> <span class='ocrx_word' id='word_1_287' title='bbox 932 1166 958 1168; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_288' title='bbox 967 1155 990 1174; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_289' title='bbox 1002 1155 1141 1175; x_wconf 84' lang='eng' dir='ltr'><em>thermof/ava</em></span> <span class='ocrx_word' id='word_1_290' title='bbox 1151 1152 1239 1175; x_wconf 89' lang='eng' dir='ltr'><em>N1165T</em></span> <span class='ocrx_word' id='word_1_291' title='bbox 1249 1155 1388 1180; x_wconf 84' lang='eng' dir='ltr'><em>(AF052390)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_112' title="bbox 189 1197 873 1199">
+    <p class='ocr_par' dir='ltr' id='par_1_112' title="bbox 189 1197 873 1199">
+     <span class='ocr_line' id='line_1_130' title="bbox 189 1197 873 1199; baseline 0 46"><span class='ocrx_word' id='word_1_292' title='bbox 189 1197 873 1199; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_113' title="bbox 881 1185 1362 1213">
+    <p class='ocr_par' dir='ltr' id='par_1_113' title="bbox 881 1185 1362 1213">
+     <span class='ocr_line' id='line_1_131' title="bbox 881 1185 1362 1213; baseline 0 -6"><span class='ocrx_word' id='word_1_293' title='bbox 881 1187 904 1207; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_294' title='bbox 916 1187 1028 1207; x_wconf 80' lang='eng' dir='ltr'><em>fastidiosa</em></span> <span class='ocrx_word' id='word_1_295' title='bbox 1038 1187 1120 1207; x_wconf 88' lang='eng' dir='ltr'><em>IMSNU</em></span> <span class='ocrx_word' id='word_1_296' title='bbox 1131 1185 1216 1207; x_wconf 75' lang='eng' dir='ltr'><em>20054T</em></span> <span class='ocrx_word' id='word_1_297' title='bbox 1225 1187 1362 1213; x_wconf 91' lang='eng' dir='ltr'><em>(AJ400710)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_114' title="bbox 488 1217 1023 1245">
+    <p class='ocr_par' dir='ltr' id='par_1_114' title="bbox 488 1217 1023 1245">
+     <span class='ocr_line' id='line_1_132' title="bbox 488 1217 1023 1245; baseline 0 -6"><span class='ocrx_word' id='word_1_298' title='bbox 488 1220 623 1239; x_wconf 83' lang='eng' dir='ltr'><em>Prauserella</em></span> <span class='ocrx_word' id='word_1_299' title='bbox 632 1225 713 1245; x_wconf 87' lang='eng' dir='ltr'><em>rugosa</em></span> <span class='ocrx_word' id='word_1_300' title='bbox 723 1219 779 1239; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_301' title='bbox 789 1217 874 1239; x_wconf 76' lang='eng' dir='ltr'><em>43194T</em></span> <span class='ocrx_word' id='word_1_302' title='bbox 884 1219 1023 1245; x_wconf 86' lang='eng' dir='ltr'><em>(AF051342)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000109-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000109-0-000.pbm.png
new file mode 100644
index 00000000..784f114c
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000109-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000109-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000109-0-000.pbm.png.hocr
new file mode 100644
index 00000000..2d37d066
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000109-0-000.pbm.png.hocr
@@ -0,0 +1,198 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000109-0-000.pbm.png"; bbox 0 0 994 1019; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 77 0 994 1019">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 317 0 853 28">
+     <span class='ocr_line' id='line_1_1' title="bbox 317 0 853 28; baseline 0 -5"><span class='ocrx_word' id='word_1_1' title='bbox 317 3 474 23; x_wconf 78' lang='eng' dir='ltr'><em>Roseobacter</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 481 3 566 23; x_wconf 77' lang='eng' dir='ltr'><em>literal/s</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 574 3 648 23; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 657 0 744 23; x_wconf 83' lang='eng' dir='ltr'><em>49566T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 754 5 853 28; x_wconf 85' lang='eng' dir='ltr'>(X78312)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 291 36 807 64">
+     <span class='ocr_line' id='line_1_2' title="bbox 291 36 807 64; baseline 0 -5"><span class='ocrx_word' id='word_1_6' title='bbox 291 38 444 59; x_wconf 76' lang='eng' dir='ltr'><em>Sulfitobacter</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 449 39 568 64; x_wconf 81' lang='eng' dir='ltr'><em>pontiacus</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 577 38 646 59; x_wconf 88' lang='eng' dir='ltr'><em>ChLG</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 659 36 697 59; x_wconf 88' lang='eng' dir='ltr'><em>1OT</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 707 41 807 64; x_wconf 86' lang='eng' dir='ltr'>(Y13155)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 372 73 782 102">
+     <span class='ocr_line' id='line_1_3' title="bbox 372 73 782 102; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 372 76 466 96; x_wconf 87' lang='eng' dir='ltr'><em>Nereida</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 476 76 555 102; x_wconf 85' lang='eng' dir='ltr'><em>ignava</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 565 73 647 96; x_wconf 80' lang='eng' dir='ltr'><em>28M4T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 657 78 782 101; x_wconf 87' lang='eng' dir='ltr'>(AJ748748)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 345 111 815 138">
+     <span class='ocr_line' id='line_1_4' title="bbox 345 111 815 138; baseline 0 -5"><span class='ocrx_word' id='word_1_15' title='bbox 345 113 540 133; x_wconf 82' lang='eng' dir='ltr'><em>Octadecabacter</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 546 113 640 133; x_wconf 82' lang='eng' dir='ltr'><em>arcticus</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 649 111 705 133; x_wconf 78' lang='eng' dir='ltr'><em>238T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 714 115 815 138; x_wconf 87' lang='eng' dir='ltr'>(U73725)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 272 147 803 175">
+     <span class='ocr_line' id='line_1_5' title="bbox 272 147 803 175; baseline 0 -6"><span class='ocrx_word' id='word_1_19' title='bbox 272 149 429 169; x_wconf 84' lang='eng' dir='ltr'><em>Phaeobacter</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 435 149 593 175; x_wconf 85' lang='eng' dir='ltr'><em>ga/Iaeciensis</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 602 147 694 169; x_wconf 88' lang='eng' dir='ltr'><em>BS107T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 704 151 803 174; x_wconf 84' lang='eng' dir='ltr'>(Y13244)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 273 183 797 212">
+     <span class='ocr_line' id='line_1_6' title="bbox 273 183 797 212; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 273 186 408 206; x_wconf 81' lang='eng' dir='ltr'><em>Mar/novum</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 417 186 509 212; x_wconf 87' lang='eng' dir='ltr'><em>a/gico/a</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 518 186 591 206; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 602 183 688 206; x_wconf 91' lang='eng' dir='ltr'><em>51440T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 698 188 797 211; x_wconf 84' lang='eng' dir='ltr'>(X78315)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 289 221 931 248">
+     <span class='ocr_line' id='line_1_7' title="bbox 289 221 931 248; baseline 0 -5"><span class='ocrx_word' id='word_1_28' title='bbox 289 223 448 243; x_wconf 84' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 457 223 632 243; x_wconf 82' lang='eng' dir='ltr'><em>mediterraneus</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 642 223 715 243; x_wconf 86' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 725 221 796 243; x_wconf 75' lang='eng' dir='ltr'><em>5383T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 805 225 931 248; x_wconf 87' lang='eng' dir='ltr'>(AJ878874)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 282 257 766 285">
+     <span class='ocr_line' id='line_1_8' title="bbox 282 257 766 285; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 282 259 392 285; x_wconf 86' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 401 259 503 279; x_wconf 79' lang='eng' dir='ltr'><em>at/antica</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 514 259 559 279; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 571 257 656 279; x_wconf 79' lang='eng' dir='ltr'><em>14463T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 665 261 766 284; x_wconf 84' lang='eng' dir='ltr'>(D88526)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 262 293 845 322">
+     <span class='ocr_line' id='line_1_9' title="bbox 262 293 845 322; baseline -0.002 -5"><span class='ocrx_word' id='word_1_38' title='bbox 262 296 455 322; x_wconf 84' lang='eng' dir='ltr'><em>Pseudoruegeria</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 465 296 583 322; x_wconf 85' lang='eng' dir='ltr'><em>aquimaris</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 593 293 702 317; x_wconf 86' lang='eng' dir='ltr'><em>SW-255T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 712 298 845 321; x_wconf 80' lang='eng' dir='ltr'>(D0675021)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 335 330 722 358">
+     <span class='ocr_line' id='line_1_10' title="bbox 335 330 722 358; baseline 0 -5"><span class='ocrx_word' id='word_1_42' title='bbox 335 332 439 358; x_wconf 78' lang='eng' dir='ltr'><em>Sagittula</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 449 333 535 353; x_wconf 77' lang='eng' dir='ltr'><em>stellata</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 546 330 613 353; x_wconf 77' lang='eng' dir='ltr'><em>E-37T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 622 335 722 358; x_wconf 86' lang='eng' dir='ltr'>(U58356)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 325 367 887 395">
+     <span class='ocr_line' id='line_1_11' title="bbox 325 367 887 395; baseline 0 -5"><span class='ocrx_word' id='word_1_46' title='bbox 325 370 506 390; x_wconf 77' lang='eng' dir='ltr'><em>Antarctobacter</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 513 370 670 390; x_wconf 85' lang='eng' dir='ltr'><em>heliothermus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 680 367 778 390; x_wconf 81' lang='eng' dir='ltr'><em>EL-219T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 788 372 887 395; x_wconf 85' lang='eng' dir='ltr'>(Y11552)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 275 403 750 431">
+     <span class='ocr_line' id='line_1_12' title="bbox 275 403 750 431; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 275 406 427 426; x_wconf 84' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 436 406 533 426; x_wconf 79' lang='eng' dir='ltr'><em>tolerans</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 543 403 641 426; x_wconf 89' lang='eng' dir='ltr'><em>EL-172T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 651 408 750 431; x_wconf 92' lang='eng' dir='ltr'>(Y11551)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 316 440 845 468">
+     <span class='ocr_line' id='line_1_13' title="bbox 316 440 845 468; baseline 0 -5"><span class='ocrx_word' id='word_1_54' title='bbox 316 443 448 463; x_wconf 84' lang='eng' dir='ltr'><em>Roseivivax</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 456 443 606 463; x_wconf 83' lang='eng' dir='ltr'><em>ha/oto/erans</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 615 443 669 463; x_wconf 90' lang='eng' dir='ltr'><em>OCh</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 679 440 735 463; x_wconf 89' lang='eng' dir='ltr'><em>210T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 745 445 845 468; x_wconf 83' lang='eng' dir='ltr'>(D85831)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 354 476 870 504">
+     <span class='ocr_line' id='line_1_14' title="bbox 354 476 870 504; baseline 0 -5"><span class='ocrx_word' id='word_1_59' title='bbox 354 479 486 499; x_wconf 81' lang='eng' dir='ltr'><em>Roseivivax</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 495 479 630 499; x_wconf 84' lang='eng' dir='ltr'><em>ha/odurans</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 639 478 693 499; x_wconf 90' lang='eng' dir='ltr'><em>OCh</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 704 476 760 499; x_wconf 78' lang='eng' dir='ltr'><em>239T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 770 481 870 504; x_wconf 84' lang='eng' dir='ltr'>(D85829)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 306 513 721 541">
+     <span class='ocr_line' id='line_1_15' title="bbox 306 513 721 541; baseline 0 -5"><span class='ocrx_word' id='word_1_64' title='bbox 306 516 413 541; x_wconf 86' lang='eng' dir='ltr'><em>Salipiger</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 420 521 529 536; x_wconf 88' lang='eng' dir='ltr'><em>mucosus</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 538 513 582 536; x_wconf 88' lang='eng' dir='ltr'><em>A3T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 592 518 721 541; x_wconf 87' lang='eng' dir='ltr'>(AY527274)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 218 551 739 579">
+     <span class='ocr_line' id='line_1_16' title="bbox 218 551 739 579; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 218 553 354 579; x_wconf 82' lang='eng' dir='ltr'><em>Donghicola</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 364 553 477 573; x_wconf 85' lang='eng' dir='ltr'><em>eburneus</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 486 551 596 573; x_wconf 87' lang='eng' dir='ltr'><em>SW-277T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 606 555 739 578; x_wconf 83' lang='eng' dir='ltr'>(DQ667965)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 265 587 994 687">
+     <span class='ocr_line' id='line_1_17' title="bbox 290 587 994 615; baseline 0 -5"><span class='ocrx_word' id='word_1_72' title='bbox 290 589 482 610; x_wconf 85' lang='eng' dir='ltr'><em>Lutimaribacter</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 489 589 718 610; x_wconf 88' lang='eng' dir='ltr'><em>saemankumensis</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 727 587 854 610; x_wconf 89' lang='eng' dir='ltr'><em>SMK-117T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 863 591 994 615; x_wconf 81' lang='eng' dir='ltr'><em>(EU336981)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 304 623 919 651; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 304 626 479 646; x_wconf 76' lang='eng' dir='ltr'><em>Maritimibacter</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 485 626 619 651; x_wconf 81' lang='eng' dir='ltr'><em>alkaliphilus</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 629 623 776 646; x_wconf 79' lang='eng' dir='ltr'><em>HTC02654T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 786 628 919 651; x_wconf 77' lang='eng' dir='ltr'>(DQQ15443)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 265 660 874 687; baseline -0.002 -4"><span class='ocrx_word' id='word_1_80' title='bbox 265 662 400 683; x_wconf 83' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 409 662 556 683; x_wconf 80' lang='eng' dir='ltr'><em>nanhaiensis</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 565 660 731 683; x_wconf 88' lang='eng' dir='ltr'><em>SSO11B1—20T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 741 664 874 687; x_wconf 88' lang='eng' dir='ltr'><em>(DQ414420)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 92 697 803 761">
+     <span class='ocr_line' id='line_1_20' title="bbox 92 697 803 724; baseline 0 -5"><span class='ocrx_word' id='word_1_84' title='bbox 92 698 126 711; x_wconf 77' lang='eng'><em>54-9</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 246 699 381 719; x_wconf 80' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 391 699 506 719; x_wconf 82' lang='eng' dir='ltr'><em>batsensis</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 517 697 663 719; x_wconf 79' lang='eng' dir='ltr'><em>HTCCZSQ7T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 673 701 803 724; x_wconf 85' lang='eng' dir='ltr'>(AY424898)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 232 733 722 761; baseline 0 -5"><span class='ocrx_word' id='word_1_89' title='bbox 232 736 367 756; x_wconf 83' lang='eng' dir='ltr'><em>Ocean/cola</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 377 736 474 756; x_wconf 86' lang='eng' dir='ltr'><em>marinus</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 482 733 579 756; x_wconf 91' lang='eng' dir='ltr'><em>AZO-CT</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 589 738 722 761; x_wconf 81' lang='eng' dir='ltr'>(DQ822569)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 77 770 815 798">
+     <span class='ocr_line' id='line_1_22' title="bbox 77 770 815 798; baseline -0.003 -4"><span class='ocrx_word' id='word_1_93' title='bbox 77 781 111 794; x_wconf 73' lang='eng'><em>95.7</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 240 772 375 793; x_wconf 86' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 384 772 519 798; x_wconf 87' lang='eng' dir='ltr'><em>granulosus</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 529 770 675 793; x_wconf 79' lang='eng' dir='ltr'><em>HTC02516T</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 685 774 815 797; x_wconf 88' lang='eng' dir='ltr'>(AY424896)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 79 781 764 835">
+     <span class='ocr_line' id='line_1_23' title="bbox 79 781 764 835; baseline 0 -5"><span class='ocrx_word' id='word_1_98' title='bbox 79 781 226 821; x_wconf 71' lang='eng'><em>—+:</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 240 810 395 830; x_wconf 83' lang='eng' dir='ltr'><em>Roseisalinus</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 404 810 537 830; x_wconf 79' lang='eng' dir='ltr'><em>antarcticus</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 547 807 629 830; x_wconf 70' lang='eng' dir='ltr'><em>EL-BST</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 639 812 764 835; x_wconf 82' lang='eng' dir='ltr'>(AJ605747)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 270 844 895 872">
+     <span class='ocr_line' id='line_1_24' title="bbox 270 844 895 872; baseline 0 -5"><span class='ocrx_word' id='word_1_103' title='bbox 270 847 510 872; x_wconf 84' lang='eng' dir='ltr'><em>Ketogu/onicigenium</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 520 847 607 872; x_wconf 84' lang='eng' dir='ltr'><em>vulgare</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 618 846 675 867; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 685 844 757 867; x_wconf 88' lang='eng' dir='ltr'><em>4025T</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 767 849 895 872; x_wconf 84' lang='eng' dir='ltr'>(AF136849)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 284 879 849 908">
+     <span class='ocr_line' id='line_1_25' title="bbox 284 879 849 908; baseline 0 -6"><span class='ocrx_word' id='word_1_108' title='bbox 284 882 422 902; x_wconf 87' lang='eng' dir='ltr'><em>Jannaschia</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 431 882 615 908; x_wconf 84' lang='eng' dir='ltr'><em>helgolandensis</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 625 882 662 902; x_wconf 95' lang='eng' dir='ltr'><em>Hel</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 675 879 713 902; x_wconf 90' lang='eng' dir='ltr'><em>1OT</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 723 884 849 907; x_wconf 83' lang='eng' dir='ltr'>(AJ438157)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 304 916 854 944">
+     <span class='ocr_line' id='line_1_26' title="bbox 304 916 854 944; baseline 0 -5"><span class='ocrx_word' id='word_1_113' title='bbox 304 919 428 939; x_wconf 85' lang='eng' dir='ltr'><em>Loktane/la</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 437 919 556 939; x_wconf 85' lang='eng' dir='ltr'><em>salsi/acus</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 566 919 622 939; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 632 916 719 939; x_wconf 88' lang='eng' dir='ltr'><em>21507T</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 729 921 854 944; x_wconf 80' lang='eng' dir='ltr'>(AJ440997)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 362 954 947 982">
+     <span class='ocr_line' id='line_1_27' title="bbox 362 954 947 982; baseline 0 -6"><span class='ocrx_word' id='word_1_118' title='bbox 362 956 521 976; x_wconf 84' lang='eng' dir='ltr'><em>Rhodobacter</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 528 956 658 982; x_wconf 82' lang='eng' dir='ltr'><em>capsu/atus</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 666 956 740 976; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 753 956 760 976; x_wconf 97' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 768 956 775 976; x_wconf 90' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 783 954 837 976; x_wconf 81' lang='eng' dir='ltr'><em>166T</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 847 958 947 981; x_wconf 79' lang='eng'>(016428)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 487 991 958 1019">
+     <span class='ocr_line' id='line_1_28' title="bbox 487 991 958 1019; baseline -0.002 -5"><span class='ocrx_word' id='word_1_125' title='bbox 487 993 578 1019; x_wconf 86' lang='eng' dir='ltr'><em>Stappia</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 588 993 695 1014; x_wconf 87' lang='eng' dir='ltr'><em>ste/Iu/ata</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 706 993 751 1013; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 763 991 848 1014; x_wconf 80' lang='eng' dir='ltr'><em>12621T</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 857 995 958 1018; x_wconf 84' lang='eng' dir='ltr'>(D88525)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 7 482 1008">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 0 7 482 1008">
+     <span class='ocr_line' id='line_1_29' title="bbox 136 7 306 42; baseline 0 -20"><span class='ocrx_word' id='word_1_130' title='bbox 136 7 306 42; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 102 42 291 78; baseline 0 941"><span class='ocrx_word' id='word_1_131' title='bbox 102 42 291 78; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 87 78 361 133; baseline 0 0"><span class='ocrx_word' id='word_1_132' title='bbox 87 78 361 133; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 75 133 273 226; baseline 0 0"><span class='ocrx_word' id='word_1_133' title='bbox 75 133 273 226; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 75 226 276 261; baseline 0 758"><span class='ocrx_word' id='word_1_134' title='bbox 75 226 276 261; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 75 261 276 279; baseline 0 740"><span class='ocrx_word' id='word_1_135' title='bbox 75 261 276 279; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 68 279 262 299; baseline 0 720"><span class='ocrx_word' id='word_1_136' title='bbox 68 279 262 299; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 68 299 262 336; baseline 0 683"><span class='ocrx_word' id='word_1_137' title='bbox 68 299 262 336; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 68 336 323 389; baseline 0 0"><span class='ocrx_word' id='word_1_138' title='bbox 68 336 323 389; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 59 389 275 409; baseline 0 610"><span class='ocrx_word' id='word_1_139' title='bbox 59 389 275 409; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 59 409 275 445; baseline 0 574"><span class='ocrx_word' id='word_1_140' title='bbox 59 409 275 445; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 59 445 343 499; baseline 0 0"><span class='ocrx_word' id='word_1_141' title='bbox 59 445 343 499; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 35 499 306 593; baseline 0 -38"><span class='ocrx_word' id='word_1_142' title='bbox 35 499 306 593; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 35 593 207 665; baseline 0 0"><span class='ocrx_word' id='word_1_143' title='bbox 35 593 207 665; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 15 665 84 700; baseline 0 319"><span class='ocrx_word' id='word_1_144' title='bbox 15 665 84 700; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 0 700 84 775; baseline 0 0"><span class='ocrx_word' id='word_1_145' title='bbox 0 700 84 775; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 0 841 270 886; baseline 0 -37"><span class='ocrx_word' id='word_1_146' title='bbox 0 841 270 886; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 0 886 284 922; baseline 0 97"><span class='ocrx_word' id='word_1_147' title='bbox 0 886 284 922; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 0 922 304 958; baseline 0 61"><span class='ocrx_word' id='word_1_148' title='bbox 0 922 304 958; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 0 958 482 1008; baseline 0 0"><span class='ocrx_word' id='word_1_149' title='bbox 0 958 482 1008; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 77 656 80 857">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 77 656 80 857">
+     <span class='ocr_line' id='line_1_49' title="bbox 77 656 80 857; baseline 0 162"><span class='ocrx_word' id='word_1_150' title='bbox 77 656 80 857; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000117-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000117-0-000.pbm.png
new file mode 100644
index 00000000..8d0720c4
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000117-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000117-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000117-0-000.pbm.png.hocr
new file mode 100644
index 00000000..d6d1a882
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000117-0-000.pbm.png.hocr
@@ -0,0 +1,124 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000117-0-000.pbm.png"; bbox 0 0 1302 695; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 427 4 1299 562">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 524 4 1139 33">
+     <span class='ocr_line' id='line_1_1' title="bbox 524 4 1139 33; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 524 6 681 27; x_wconf 86' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 690 6 793 27; x_wconf 86' lang='eng' dir='ltr'><em>sneebia</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 802 4 833 27; x_wconf 97' lang='eng' dir='ltr'><em>AT</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 843 6 1139 33; x_wconf 83' lang='eng' dir='ltr'><em>(EU587095—EU587100)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 527 37 1161 64">
+     <span class='ocr_line' id='line_1_2' title="bbox 527 37 1161 64; baseline 0 -6"><span class='ocrx_word' id='word_1_5' title='bbox 527 38 684 58; x_wconf 91' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 693 38 796 58; x_wconf 88' lang='eng' dir='ltr'><em>sneebia</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 805 38 855 58; x_wconf 91' lang='eng' dir='ltr'><em>A75</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 865 37 1161 64; x_wconf 85' lang='eng' dir='ltr'><em>(EU587053—EU587058)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 481 68 1173 157">
+     <span class='ocr_line' id='line_1_3' title="bbox 482 68 1157 96; baseline 0 -7"><span class='ocrx_word' id='word_1_9' title='bbox 482 78 508 96; x_wconf 74' lang='eng'><em>52</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 523 69 680 89; x_wconf 87' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 689 69 792 89; x_wconf 87' lang='eng' dir='ltr'><em>sneebia</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 801 68 847 89; x_wconf 89' lang='eng' dir='ltr'><em>A91</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 861 68 1157 95; x_wconf 83' lang='eng' dir='ltr'><em>(EU587059—EU587064)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 481 100 1173 126; baseline 0 -5"><span class='ocrx_word' id='word_1_14' title='bbox 481 102 514 124; x_wconf 68' lang='eng'><em>59!</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 523 100 680 121; x_wconf 88' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 689 100 792 121; x_wconf 85' lang='eng' dir='ltr'><em>sneebia</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 800 100 866 121; x_wconf 89' lang='eng' dir='ltr'>A102</span> <span class='ocrx_word' id='word_1_18' title='bbox 877 100 1173 126; x_wconf 85' lang='eng' dir='ltr'><em>(EU587071—EU58707G)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 482 125 1173 157; baseline 0.001 -6"><span class='ocrx_word' id='word_1_19' title='bbox 482 125 514 148; x_wconf 90' lang='eng' dir='ltr'><em>60l</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 523 131 680 152; x_wconf 90' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 689 131 792 152; x_wconf 85' lang='eng' dir='ltr'><em>sneebia</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 800 131 863 152; x_wconf 91' lang='eng' dir='ltr'><em>A101</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 877 131 1173 157; x_wconf 88' lang='eng' dir='ltr'><em>(EU587065—EU587070)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 427 159 1299 500">
+     <span class='ocr_line' id='line_1_6' title="bbox 465 159 1262 188; baseline 0 -6"><span class='ocrx_word' id='word_1_24' title='bbox 465 159 491 178; x_wconf 77' lang='eng'><em>56</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 510 162 667 182; x_wconf 90' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 676 162 916 188; x_wconf 84' lang='eng' dir='ltr'><em>burhodogranariea</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 926 159 956 182; x_wconf 82' lang='eng' dir='ltr'>BT</span> <span class='ocrx_word' id='word_1_28' title='bbox 965 161 1262 188; x_wconf 88' lang='eng' dir='ltr'><em>(EU587101—EU587106)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 453 185 1282 219; baseline 0 -5"><span class='ocrx_word' id='word_1_29' title='bbox 453 185 491 204; x_wconf 71' lang='eng'><em>10°</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 511 193 669 214; x_wconf 84' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 678 193 917 219; x_wconf 86' lang='eng' dir='ltr'><em>burhodogranariea</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 927 193 975 214; x_wconf 88' lang='eng' dir='ltr'><em>B97</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 986 193 1282 219; x_wconf 85' lang='eng' dir='ltr'><em>(EU587083—EU587088)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 507 224 1278 250; baseline 0.001 -6"><span class='ocrx_word' id='word_1_34' title='bbox 507 224 665 245; x_wconf 85' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 674 224 913 250; x_wconf 84' lang='eng' dir='ltr'><em>burhodogranariea</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 923 224 971 245; x_wconf 92' lang='eng' dir='ltr'><em>B18</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 982 224 1278 250; x_wconf 91' lang='eng' dir='ltr'><em>(EU587077—EU587082)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 517 255 1257 282; baseline 0 -6"><span class='ocrx_word' id='word_1_38' title='bbox 517 256 675 276; x_wconf 88' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 684 256 923 282; x_wconf 87' lang='eng' dir='ltr'><em>burhodogranariea</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 934 256 951 276; x_wconf 96' lang='eng' dir='ltr'><strong>D</strong></span> <span class='ocrx_word' id='word_1_41' title='bbox 961 255 1257 282; x_wconf 86' lang='eng' dir='ltr'><em>(EU587113—EU587118)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 461 286 1287 313; baseline 0.002 -7"><span class='ocrx_word' id='word_1_42' title='bbox 461 286 500 305; x_wconf 85' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 516 287 674 308; x_wconf 85' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 683 287 922 313; x_wconf 89' lang='eng' dir='ltr'><em>burhodogranariea</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 932 286 981 308; x_wconf 90' lang='eng' dir='ltr'><em>D37</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 991 286 1287 313; x_wconf 82' lang='eng' dir='ltr'><em>(EU587089-EU587094)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 525 316 1219 344; baseline 0.001 -6"><span class='ocrx_word' id='word_1_47' title='bbox 525 318 670 339; x_wconf 86' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 679 318 762 339; x_wconf 72' lang='eng' dir='ltr'><em>stuartii</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 771 318 830 339; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 839 316 913 339; x_wconf 84' lang='eng' dir='ltr'><em>4539T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 923 318 1219 344; x_wconf 85' lang='eng' dir='ltr'><em>(EU587024—EU587029)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 529 347 1293 376; baseline 0 -6"><span class='ocrx_word' id='word_1_52' title='bbox 529 349 674 370; x_wconf 85' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 683 349 834 370; x_wconf 85' lang='eng' dir='ltr'><em>heimbachae</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 845 349 904 370; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 914 347 987 370; x_wconf 81' lang='eng' dir='ltr'><em>3591T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 997 349 1293 376; x_wconf 82' lang='eng' dir='ltr'><em>(EU587018—EU587023)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 519 378 1299 407; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 519 380 664 401; x_wconf 82' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 673 380 825 401; x_wconf 83' lang='eng' dir='ltr'><em>a/ca/ifaciens</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 835 380 894 401; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 904 378 993 401; x_wconf 84' lang='eng' dir='ltr'><em>30120T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1002 380 1299 407; x_wconf 86' lang='eng' dir='ltr'><em>(EU587047—EU587052)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 427 409 1157 437; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 427 411 571 432; x_wconf 84' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 581 411 700 437; x_wconf 84' lang='eng' dir='ltr'><em>rustigianii</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 709 411 767 432; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 777 409 851 432; x_wconf 91' lang='eng' dir='ltr'><em>4541T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 861 411 1157 437; x_wconf 86' lang='eng' dir='ltr'><em>(EU587030—EU587034)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 510 440 1257 469; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 510 443 655 463; x_wconf 86' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 665 443 783 463; x_wconf 87' lang='eng' dir='ltr'><em>vermicola</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 793 442 852 463; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 864 440 951 463; x_wconf 82' lang='eng' dir='ltr'><em>17385T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 961 442 1257 469; x_wconf 87' lang='eng' dir='ltr'><em>(EU587041—EU587046)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 510 471 1209 500; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 510 474 655 494; x_wconf 83' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 664 474 752 500; x_wconf 80' lang='eng' dir='ltr'><em>rettgeri</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 760 473 819 494; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 829 471 902 494; x_wconf 91' lang='eng' dir='ltr'><em>4542T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 913 473 1209 500; x_wconf 82' lang='eng' dir='ltr'><em>(EU587035—EU587040)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 450 504 1107 562">
+     <span class='ocr_line' id='line_1_17' title="bbox 450 504 1107 531; baseline 0.003 -8"><span class='ocrx_word' id='word_1_77' title='bbox 450 504 488 523; x_wconf 87' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 511 505 669 525; x_wconf 85' lang='eng' dir='ltr'><em>Providencia</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 678 505 775 531; x_wconf 87' lang='eng' dir='ltr'><em>rettgeri</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 782 505 800 525; x_wconf 95' lang='eng' dir='ltr'><strong>C</strong></span> <span class='ocrx_word' id='word_1_81' title='bbox 811 505 1107 531; x_wconf 89' lang='eng' dir='ltr'><em>(EU587107—EU587112)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 512 536 978 562; baseline -0.002 -5"><span class='ocrx_word' id='word_1_82' title='bbox 512 536 608 557; x_wconf 81' lang='eng' dir='ltr'><em>Proteus</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 617 536 719 557; x_wconf 87' lang='eng' dir='ltr'><em>mirabi/is</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 729 536 816 557; x_wconf 86' lang='eng' dir='ltr'><em>Hl4320</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 827 536 978 562; x_wconf 83' lang='eng' dir='ltr'><em>(AM942759)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 3 564 1274 687">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 25 564 1274 687">
+     <span class='ocr_line' id='line_1_19' title="bbox 463 564 1042 593; baseline 0 -6"><span class='ocrx_word' id='word_1_86' title='bbox 463 567 636 587; x_wconf 82' lang='eng' dir='ltr'><em>Photorhabdus</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 645 567 800 587; x_wconf 85' lang='eng' dir='ltr'><em>Iuminescens</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 808 564 886 587; x_wconf 91' lang='eng' dir='ltr'><em>TTO1T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 895 567 1042 593; x_wconf 90' lang='eng' dir='ltr'><em>(BX470251)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 462 598 875 625; baseline 0 -6"><span class='ocrx_word' id='word_1_90' title='bbox 462 598 559 619; x_wconf 81' lang='eng' dir='ltr'><em>Yersinia</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 567 598 640 625; x_wconf 81' lang='eng' dir='ltr'><em>pest/s</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 649 598 721 619; x_wconf 77' lang='eng'><em>€092</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 731 598 875 625; x_wconf 85' lang='eng' dir='ltr'><em>(AL590842)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 25 629 1274 657; baseline 0 -7"><span class='ocrx_word' id='word_1_94' title='bbox 25 638 64 657; x_wconf 76' lang='eng'>100</span> <span class='ocrx_word' id='word_1_95' title='bbox 513 630 604 650; x_wconf 84' lang='eng' dir='ltr'><em>Erwinia</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 614 630 744 650; x_wconf 83' lang='eng' dir='ltr'><em>carotovora</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 754 630 833 656; x_wconf 87' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_98' title='bbox 844 630 980 656; x_wconf 80' lang='eng' dir='ltr'><em>atroseptica</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 989 629 1117 650; x_wconf 86' lang='eng' dir='ltr'><em>SCR|1043</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 1127 629 1274 656; x_wconf 86' lang='eng' dir='ltr'><em>(BX950851)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 105 660 1031 687; baseline 0.001 -7"><span class='ocrx_word' id='word_1_101' title='bbox 105 662 143 680; x_wconf 91' lang='eng'>100</span> <span class='ocrx_word' id='word_1_102' title='bbox 531 661 674 681; x_wconf 84' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 684 661 726 681; x_wconf 87' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 735 661 790 681; x_wconf 88' lang='eng' dir='ltr'>K-12</span> <span class='ocrx_word' id='word_1_105' title='bbox 801 660 907 681; x_wconf 89' lang='eng' dir='ltr'>MG1655</span> <span class='ocrx_word' id='word_1_106' title='bbox 917 660 1031 687; x_wconf 79' lang='eng' dir='ltr'><em>(UOOOQB)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 3 9 524 511">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 3 9 524 511">
+     <span class='ocr_line' id='line_1_23' title="bbox 246 9 522 54; baseline 0 0"><span class='ocrx_word' id='word_1_107' title='bbox 246 9 522 54; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 246 54 482 110; baseline 0 -23"><span class='ocrx_word' id='word_1_108' title='bbox 246 54 482 110; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 239 110 257 139; baseline 0 556"><span class='ocrx_word' id='word_1_109' title='bbox 239 110 257 139; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 239 139 257 202; baseline 0 -29"><span class='ocrx_word' id='word_1_110' title='bbox 239 139 257 202; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 200 202 453 236; baseline 0 459"><span class='ocrx_word' id='word_1_111' title='bbox 200 202 453 236; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 207 236 512 273; baseline 0 0"><span class='ocrx_word' id='word_1_112' title='bbox 207 236 512 273; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 161 273 461 295; baseline 0 400"><span class='ocrx_word' id='word_1_113' title='bbox 161 273 461 295; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 99 295 461 326; baseline 0 369"><span class='ocrx_word' id='word_1_114' title='bbox 99 295 461 326; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 99 326 524 364; baseline 0 331"><span class='ocrx_word' id='word_1_115' title='bbox 99 326 524 364; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 99 364 519 395; baseline 0 300"><span class='ocrx_word' id='word_1_116' title='bbox 99 364 519 395; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 99 395 427 421; baseline 0 274"><span class='ocrx_word' id='word_1_117' title='bbox 99 395 427 421; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 12 421 427 451; baseline 0 244"><span class='ocrx_word' id='word_1_118' title='bbox 12 421 427 451; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 12 451 505 491; baseline 0 204"><span class='ocrx_word' id='word_1_119' title='bbox 12 451 505 491; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 3 491 450 511; baseline 0 184"><span class='ocrx_word' id='word_1_120' title='bbox 3 491 450 511; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 74 104 244 136">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 74 104 244 136">
+     <span class='ocr_line' id='line_1_37' title="bbox 74 104 244 136; baseline 0 -14"><span class='ocrx_word' id='word_1_121' title='bbox 74 104 121 122; x_wconf 88' lang='eng'><em>0.02</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 218 118 244 136; x_wconf 78' lang='eng'><em>54</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 60 408 99 426">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 60 408 99 426">
+     <span class='ocr_line' id='line_1_38' title="bbox 60 408 99 426; baseline 0 0"><span class='ocrx_word' id='word_1_123' title='bbox 60 408 99 426; x_wconf 84' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000158-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000158-0-000.pbm.png
new file mode 100644
index 00000000..1256630a
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000158-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000158-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000158-0-000.pbm.png.hocr
new file mode 100644
index 00000000..7b86db5a
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000158-0-000.pbm.png.hocr
@@ -0,0 +1,224 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000158-0-000.pbm.png"; bbox 0 0 1657 1171; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 1 16 854 18">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 1 16 854 18">
+     <span class='ocr_line' id='line_1_1' title="bbox 1 16 854 18; baseline 0 1153"><span class='ocrx_word' id='word_1_1' title='bbox 1 16 854 18; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 1 16 5 392">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 1 16 5 392">
+     <span class='ocr_line' id='line_1_2' title="bbox 1 16 5 392; baseline 0 779"><span class='ocrx_word' id='word_1_2' title='bbox 1 16 5 392; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 863 2 1489 34">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 863 2 1489 34">
+     <span class='ocr_line' id='line_1_3' title="bbox 863 2 1489 34; baseline 0 -7"><span class='ocrx_word' id='word_1_3' title='bbox 863 5 1000 34; x_wconf 78' lang='eng' dir='ltr'><em>Cytophaga</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 1009 5 1245 27; x_wconf 71' lang='eng' dir='ltr'><em>hutch/hsom&#39;iATCC</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 1255 2 1351 27; x_wconf 78' lang='eng' dir='ltr'><em>33406T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1361 3 1489 31; x_wconf 84' lang='eng' dir='ltr'><em>(M58768)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 334 43 1655 155">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 334 43 1655 155">
+     <span class='ocr_line' id='line_1_4' title="bbox 413 43 1417 82; baseline -0.002 -13"><span class='ocrx_word' id='word_1_7' title='bbox 413 67 437 82; x_wconf 67' lang='eng'>97</span> <span class='ocrx_word' id='word_1_8' title='bbox 835 46 985 68; x_wconf 75' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 991 46 1079 68; x_wconf 66' lang='eng' dir='ltr'><em>sat/tans</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 1087 46 1148 68; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1162 47 1169 67; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1178 43 1256 67; x_wconf 84' lang='eng' dir='ltr'><em>2145T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1266 44 1367 72; x_wconf 88' lang='eng' dir='ltr'><em>(AJ4381</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 1376 43 1417 72; x_wconf 90' lang='eng'><em>73)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 361 57 1655 140; baseline 0 -32"><span class='ocrx_word' id='word_1_15' title='bbox 361 57 935 140; x_wconf 62' lang='eng' dir='ltr'>E</span> <span class='ocrx_word' id='word_1_16' title='bbox 941 86 1172 115; x_wconf 76' lang='eng' dir='ltr'><em>Sph/hgobacterium</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1181 87 1325 114; x_wconf 66' lang='eng' dir='ltr'><em>spl&#39;r/T/vorum</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1332 86 1411 108; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1421 87 1500 108; x_wconf 88' lang='eng'>33861</span> <span class='ocrx_word' id='word_1_20' title='bbox 1507 83 1518 98; x_wconf 74' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_21' title='bbox 1527 84 1609 112; x_wconf 90' lang='eng' dir='ltr'><em>(M587</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 1614 88 1626 108; x_wconf 91' lang='eng'>7</span> <span class='ocrx_word' id='word_1_23' title='bbox 1631 84 1655 112; x_wconf 87' lang='eng'>8)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 334 124 1625 155; baseline -0.002 -5"><span class='ocrx_word' id='word_1_24' title='bbox 334 125 354 141; x_wconf 68' lang='eng'><em>6‘</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 887 127 1118 155; x_wconf 75' lang='eng' dir='ltr'><em>Sph/hgobacter/um</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1127 127 1287 155; x_wconf 69' lang='eng' dir='ltr'><em>thalpoph/Yum</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1296 127 1357 149; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1370 128 1377 148; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1387 128 1395 148; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1404 124 1464 148; x_wconf 88' lang='eng' dir='ltr'><em>723T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1474 125 1575 153; x_wconf 88' lang='eng' dir='ltr'><em>(AJ4381</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1584 125 1625 153; x_wconf 91' lang='eng'><em>77)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 430 165 1275 343">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 430 165 1275 343">
+     <span class='ocr_line' id='line_1_7' title="bbox 430 165 1109 195; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 430 179 465 195; x_wconf 69' lang='eng'>100</span> <span class='ocrx_word' id='word_1_34' title='bbox 610 168 759 189; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 765 168 841 189; x_wconf 83' lang='eng' dir='ltr'><em>lentus</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 849 165 944 189; x_wconf 91' lang='eng' dir='ltr'><em>DS-4OT</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 954 166 1059 194; x_wconf 87' lang='eng' dir='ltr'><em>(EF4461</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1067 165 1109 193; x_wconf 89' lang='eng'><em>46)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 627 205 1152 234; baseline -0.002 -4"><span class='ocrx_word' id='word_1_39' title='bbox 627 208 776 230; x_wconf 81' lang='eng' dir='ltr'><em>Pedobacler</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 783 208 883 230; x_wconf 82' lang='eng' dir='ltr'><em>tem&#39;co/a</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 892 205 987 230; x_wconf 88' lang='eng' dir='ltr'><em>DS—45T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 997 206 1102 234; x_wconf 90' lang='eng' dir='ltr'><em>(EF4461</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1109 206 1152 234; x_wconf 88' lang='eng'><em>47)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 662 245 1204 277; baseline 0 -7"><span class='ocrx_word' id='word_1_44' title='bbox 662 249 812 270; x_wconf 77' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 818 249 921 277; x_wconf 69' lang='eng' dir='ltr'><em>aquatﬂ/s</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 928 245 1029 270; x_wconf 90' lang='eng' dir='ltr'><em>AR107T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1039 247 1101 275; x_wconf 93' lang='eng' dir='ltr'><em>(AM1</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 1111 250 1118 270; x_wconf 94' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1126 247 1204 274; x_wconf 87' lang='eng'><em>4396)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 443 286 1275 343; baseline 0.001 -33"><span class='ocrx_word' id='word_1_50' title='bbox 443 294 466 310; x_wconf 82' lang='eng'>97</span> <span class='ocrx_word' id='word_1_51' title='bbox 533 299 620 343; x_wconf 42' lang='eng'><em>$1:</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 633 289 791 312; x_wconf 83' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 798 289 921 311; x_wconf 81' lang='eng' dir='ltr'><em>alluvionis</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 931 289 1060 311; x_wconf 94' lang='eng' dir='ltr'><em>NWER-II1</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 1071 286 1096 311; x_wconf 90' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 1107 287 1275 315; x_wconf 87' lang='eng' dir='ltr'><em>(EU030688)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 319 143 362 145">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 319 143 362 145">
+     <span class='ocr_line' id='line_1_11' title="bbox 319 143 362 145; baseline 0 1026"><span class='ocrx_word' id='word_1_57' title='bbox 319 143 362 145; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 359 87 363 202">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 359 87 363 202">
+     <span class='ocr_line' id='line_1_12' title="bbox 359 87 363 202; baseline 0 969"><span class='ocrx_word' id='word_1_58' title='bbox 359 87 363 202; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 561 381 650 383">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 561 381 650 383">
+     <span class='ocr_line' id='line_1_13' title="bbox 561 381 650 383; baseline 0 788"><span class='ocrx_word' id='word_1_59' title='bbox 561 381 650 383; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 531 319 534 390">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 531 319 534 390">
+     <span class='ocr_line' id='line_1_14' title="bbox 531 319 534 390; baseline 0 781"><span class='ocrx_word' id='word_1_60' title='bbox 531 319 534 390; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 577 422 660 424">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 577 422 660 424">
+     <span class='ocr_line' id='line_1_15' title="bbox 577 422 660 424; baseline 0 747"><span class='ocrx_word' id='word_1_61' title='bbox 577 422 660 424; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 4 327 1260 464">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 4 327 1260 464">
+     <span class='ocr_line' id='line_1_16' title="bbox 503 327 1181 360; baseline -0.001 -8"><span class='ocrx_word' id='word_1_62' title='bbox 503 345 527 360; x_wconf 69' lang='eng'>93</span> <span class='ocrx_word' id='word_1_63' title='bbox 621 330 771 352; x_wconf 79' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 776 337 861 352; x_wconf 82' lang='eng' dir='ltr'><em>roseus</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 868 330 938 352; x_wconf 86' lang='eng' dir='ltr'><em>CL—G</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 943 327 1005 351; x_wconf 90' lang='eng' dir='ltr'><em>P80T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 1014 328 1078 356; x_wconf 84' lang='eng' dir='ltr'><em>(D01</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1089 331 1096 351; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1105 328 1181 356; x_wconf 86' lang='eng'>2353)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 4 368 1260 397; baseline 0 -5"><span class='ocrx_word' id='word_1_70' title='bbox 4 370 326 397; x_wconf 50' lang='eng' dir='ltr'><em>—ﬂ.</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 659 371 809 392; x_wconf 79' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 815 371 981 392; x_wconf 77' lang='eng' dir='ltr'><em>sandarak/hus</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 989 371 1037 392; x_wconf 89' lang='eng' dir='ltr'><em>DS—</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 1041 372 1054 392; x_wconf 87' lang='eng'><em>2</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 1058 368 1084 392; x_wconf 92' lang='eng' dir='ltr'><em>7T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1093 368 1215 396; x_wconf 85' lang='eng' dir='ltr'>(D02352</span> <span class='ocrx_word' id='word_1_77' title='bbox 1219 372 1232 392; x_wconf 86' lang='eng'>2</span> <span class='ocrx_word' id='word_1_78' title='bbox 1236 368 1260 397; x_wconf 88' lang='eng'>8)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 535 408 1194 437; baseline 0 -4"><span class='ocrx_word' id='word_1_79' title='bbox 535 412 562 432; x_wconf 52' lang='eng' dir='ltr'><em>ﬂ</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 670 411 829 433; x_wconf 82' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 836 411 942 433; x_wconf 81' lang='eng' dir='ltr'><em>borea/I&#39;s</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 951 408 1015 433; x_wconf 92' lang='eng' dir='ltr'><em>G-1T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1026 408 1194 437; x_wconf 89' lang='eng' dir='ltr'><em>(EU030687)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 553 448 576 464; baseline 0 0"><span class='ocrx_word' id='word_1_84' title='bbox 553 448 576 464; x_wconf 82' lang='eng'><em>65</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 562 442 580 444">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 562 442 580 444">
+     <span class='ocr_line' id='line_1_20' title="bbox 562 442 580 444; baseline 0 727"><span class='ocrx_word' id='word_1_85' title='bbox 562 442 580 444; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 578 434 580 464">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 578 434 580 464">
+     <span class='ocr_line' id='line_1_21' title="bbox 578 434 580 464; baseline 0 707"><span class='ocrx_word' id='word_1_86' title='bbox 578 434 580 464; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 580 462 657 465">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 580 462 657 465">
+     <span class='ocr_line' id='line_1_22' title="bbox 580 462 657 465; baseline 0 706"><span class='ocrx_word' id='word_1_87' title='bbox 580 462 657 465; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 321 449 1392 1087">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 396 449 1392 1087">
+     <span class='ocr_line' id='line_1_23' title="bbox 669 449 1247 478; baseline -0.002 -4"><span class='ocrx_word' id='word_1_88' title='bbox 669 452 819 474; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 825 452 974 474; x_wconf 86' lang='eng' dir='ltr'><em>suwonens/s</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 983 453 990 473; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 998 453 1041 473; x_wconf 88' lang='eng'><em>5—5</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1045 449 1070 473; x_wconf 87' lang='eng' dir='ltr'><em>2T</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 1080 449 1166 478; x_wconf 84' lang='eng' dir='ltr'><em>(D009</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1171 453 1183 473; x_wconf 92' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 1188 453 1201 473; x_wconf 87' lang='eng'>2</span> <span class='ocrx_word' id='word_1_96' title='bbox 1206 453 1218 473; x_wconf 92' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 1222 449 1247 478; x_wconf 93' lang='eng'>4)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 548 489 1324 546; baseline 0 -32"><span class='ocrx_word' id='word_1_98' title='bbox 548 503 661 546; x_wconf 47' lang='eng'><em>553+:</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 673 492 831 514; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacz‘er</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 838 492 986 521; x_wconf 78' lang='eng' dir='ltr'><em>nyac/(ens/s</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 995 489 1146 514; x_wconf 76' lang='eng' dir='ltr'><em>NWG-II14T</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 1156 490 1324 519; x_wconf 88' lang='eng' dir='ltr'><em>(EU030686)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 674 530 1273 561; baseline -0.002 -6"><span class='ocrx_word' id='word_1_103' title='bbox 674 533 823 555; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 829 533 953 561; x_wconf 75' lang='eng' dir='ltr'><em>hepar/hus</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 961 533 1022 555; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 1034 530 1112 554; x_wconf 83' lang='eng' dir='ltr'><em>2366T</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 1121 531 1223 559; x_wconf 85' lang='eng' dir='ltr'><em>(AJ4381</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1232 534 1244 554; x_wconf 90' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 1249 531 1273 559; x_wconf 86' lang='eng'><em>2)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 685 570 1292 599; baseline 0 -4"><span class='ocrx_word' id='word_1_110' title='bbox 685 573 835 595; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 840 574 955 595; x_wconf 82' lang='eng' dir='ltr'><em>afr/canus</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 963 573 1024 595; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 1037 575 1045 595; x_wconf 94' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1053 574 1079 595; x_wconf 88' lang='eng'>21</span> <span class='ocrx_word' id='word_1_115' title='bbox 1088 570 1131 595; x_wconf 84' lang='eng' dir='ltr'><em>26T</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 1141 571 1242 599; x_wconf 90' lang='eng' dir='ltr'><em>(AJ4381</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1252 571 1292 599; x_wconf 94' lang='eng'>71)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 396 611 1374 645; baseline 0 -9"><span class='ocrx_word' id='word_1_118' title='bbox 396 616 432 631; x_wconf 85' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 568 629 591 645; x_wconf 73' lang='eng'><em>73</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 693 615 843 636; x_wconf 77' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 849 615 1182 642; x_wconf 71' lang='eng' dir='ltr'><em>metabo/IpauperWBQ3-71</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 1189 611 1200 626; x_wconf 78' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_123' title='bbox 1209 612 1306 640; x_wconf 87' lang='eng' dir='ltr'><em>(AM491</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 1314 612 1374 640; x_wconf 89' lang='eng'>370)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 671 652 1275 683; baseline -0.002 -6"><span class='ocrx_word' id='word_1_125' title='bbox 671 655 821 677; x_wconf 79' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 828 655 945 683; x_wconf 77' lang='eng' dir='ltr'><em>duraquae</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 953 655 1038 676; x_wconf 78' lang='eng' dir='ltr'><em>WBQ.1</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 1046 652 1101 676; x_wconf 85' lang='eng' dir='ltr'><em>—25T</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 1110 653 1208 681; x_wconf 84' lang='eng' dir='ltr'><em>(AM491</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 1215 653 1275 681; x_wconf 87' lang='eng'>368)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 660 692 1219 721; baseline 0 -4"><span class='ocrx_word' id='word_1_131' title='bbox 660 696 809 717; x_wconf 77' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 816 695 951 717; x_wconf 80' lang='eng' dir='ltr'><em>caen/LMG</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 963 692 1058 717; x_wconf 84' lang='eng' dir='ltr'><em>22862T</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 1068 693 1219 721; x_wconf 85' lang='eng' dir='ltr'><em>(AJ786798)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 601 732 1222 764; baseline -0.002 -6"><span class='ocrx_word' id='word_1_135' title='bbox 601 732 636 748; x_wconf 70' lang='eng'><em>‘00</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 658 736 808 758; x_wconf 81' lang='eng' dir='ltr'><em>Pedobacfer</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 814 733 1048 764; x_wconf 74' lang='eng' dir='ltr'><em>steyn/iWB2.3—45T</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 1058 734 1222 762; x_wconf 83' lang='eng' dir='ltr'><em>(AM491372)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 493 773 1294 805; baseline 0 -7"><span class='ocrx_word' id='word_1_139' title='bbox 493 781 555 794; x_wconf 70' lang='eng'><em>—0</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 675 777 825 798; x_wconf 80' lang='eng' dir='ltr'><em>Pedobaoter</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 830 776 1052 805; x_wconf 70' lang='eng' dir='ltr'><em>g/hseng/lso/I&#39;Gsoil</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 1065 773 1124 798; x_wconf 96' lang='eng' dir='ltr'><em>104T</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 1134 774 1294 802; x_wconf 90' lang='eng' dir='ltr'><em>(AB245371)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 552 814 1291 845; baseline -0.001 -6"><span class='ocrx_word' id='word_1_144' title='bbox 552 823 575 838; x_wconf 86' lang='eng'><em>62</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 603 827 639 843; x_wconf 79' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 665 817 977 845; x_wconf 75' lang='eng' dir='ltr'><em>Pedobacterpanac/lerrae</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 985 817 1049 839; x_wconf 85' lang='eng' dir='ltr'><strong>Gsoil</strong></span> <span class='ocrx_word' id='word_1_148' title='bbox 1060 814 1121 838; x_wconf 86' lang='eng' dir='ltr'><em>042T</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 1130 815 1291 843; x_wconf 73' lang='eng' dir='ltr'><em>(ABQ45368)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 658 855 1166 883; baseline 0 -4"><span class='ocrx_word' id='word_1_150' title='bbox 658 858 808 879; x_wconf 79' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 815 860 886 879; x_wconf 75' lang='eng' dir='ltr'><em>terrae</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 895 855 990 879; x_wconf 89' lang='eng' dir='ltr'><em>DS-57T</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 1000 856 1166 883; x_wconf 82' lang='eng' dir='ltr'>(D0889723)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 723 895 1313 927; baseline 0 -7"><span class='ocrx_word' id='word_1_154' title='bbox 723 898 975 927; x_wconf 69' lang='eng' dir='ltr'><em>Pedobacterp/lsc/um</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 984 898 1045 920; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 1058 899 1065 920; x_wconf 97' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 1075 899 1083 920; x_wconf 92' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 1092 895 1152 920; x_wconf 87' lang='eng' dir='ltr'><em>725T</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 1161 896 1263 924; x_wconf 88' lang='eng' dir='ltr'><em>(AJ4381</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 1272 896 1313 924; x_wconf 92' lang='eng'><em>74)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 726 936 1309 965; baseline 0 -4"><span class='ocrx_word' id='word_1_161' title='bbox 726 939 876 961; x_wconf 77' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 882 939 998 961; x_wconf 66' lang='eng' dir='ltr'><em>hanfon/us</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 1004 936 1135 961; x_wconf 85' lang='eng' dir='ltr'><em>WB3.3-3T</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 1144 937 1242 965; x_wconf 86' lang='eng' dir='ltr'><em>(AM491</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 1249 940 1294 961; x_wconf 89' lang='eng'>371</span> <span class='ocrx_word' id='word_1_166' title='bbox 1301 937 1309 965; x_wconf 92' lang='eng'><em>)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 723 977 1246 1008; baseline 0 -7"><span class='ocrx_word' id='word_1_167' title='bbox 723 980 872 1002; x_wconf 79' lang='eng' dir='ltr'><em>Pedabacter</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 879 980 1015 1008; x_wconf 62' lang='eng' dir='ltr'><em>cg/ocon/I/s</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 1021 980 1055 1001; x_wconf 94' lang='eng' dir='ltr'>A3</span> <span class='ocrx_word' id='word_1_170' title='bbox 1060 977 1085 1001; x_wconf 91' lang='eng' dir='ltr'><em>7T</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 1094 977 1196 1006; x_wconf 86' lang='eng' dir='ltr'><em>(AJ4381</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 1205 977 1246 1005; x_wconf 94' lang='eng'><em>70)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 765 1017 1364 1048; baseline 0 -6"><span class='ocrx_word' id='word_1_173' title='bbox 765 1020 915 1042; x_wconf 73' lang='eng' dir='ltr'><em>Pedobacfer</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 921 1020 1081 1048; x_wconf 61' lang='eng' dir='ltr'><em>h/Ma/ayens/s</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 1088 1021 1105 1042; x_wconf 98' lang='eng' dir='ltr'><strong>H</strong></span> <span class='ocrx_word' id='word_1_176' title='bbox 1110 1020 1148 1042; x_wconf 89' lang='eng' dir='ltr'><em>HS</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 1160 1017 1203 1042; x_wconf 77' lang='eng' dir='ltr'><em>22T</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 1213 1018 1364 1046; x_wconf 86' lang='eng' dir='ltr'><em>(AJ583425)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 717 1058 1392 1087; baseline -0.001 -4"><span class='ocrx_word' id='word_1_179' title='bbox 717 1061 867 1083; x_wconf 80' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 875 1061 1063 1083; x_wconf 80' lang='eng' dir='ltr'><em>westerhafens/s</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 1069 1058 1218 1082; x_wconf 77' lang='eng' dir='ltr'><em>WBS.3—22T</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 1227 1059 1324 1087; x_wconf 84' lang='eng' dir='ltr'><em>(AM491</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 1332 1058 1392 1087; x_wconf 85' lang='eng'>369)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 494 1098 1297 1168">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 494 1098 1297 1168">
+     <span class='ocr_line' id='line_1_39' title="bbox 494 1098 1153 1154; baseline 0 -31"><span class='ocrx_word' id='word_1_184' title='bbox 494 1101 791 1154; x_wconf 37' lang='eng' dir='ltr'><em>ﬁddobacter</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 797 1101 884 1123; x_wconf 82' lang='eng' dir='ltr'><em>I&#39;nsu/ae</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 892 1098 988 1123; x_wconf 78' lang='eng' dir='ltr'><em>DS-39T</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 997 1099 1050 1127; x_wconf 90' lang='eng' dir='ltr'><em>(EF1</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 1058 1099 1153 1127; x_wconf 86' lang='eng'>00697)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 685 1139 1297 1168; baseline -0.002 -4"><span class='ocrx_word' id='word_1_189' title='bbox 685 1142 834 1164; x_wconf 79' lang='eng' dir='ltr'><em>Pedobacler</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 840 1142 961 1164; x_wconf 76' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 967 1142 1070 1164; x_wconf 90' lang='eng' dir='ltr'>WPCB1</span> <span class='ocrx_word' id='word_1_192' title='bbox 1078 1139 1121 1163; x_wconf 88' lang='eng' dir='ltr'><em>89T</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 1131 1140 1282 1168; x_wconf 82' lang='eng' dir='ltr'><em>(D0092871</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 1289 1140 1297 1168; x_wconf 91' lang='eng'><em>)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 546 625 676 630">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 546 625 676 630">
+     <span class='ocr_line' id='line_1_41' title="bbox 546 625 676 630; baseline 0 541"><span class='ocrx_word' id='word_1_195' title='bbox 546 625 676 630; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 319 143 321 638">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 319 143 321 638">
+     <span class='ocr_line' id='line_1_42' title="bbox 319 143 321 638; baseline 0 533"><span class='ocrx_word' id='word_1_196' title='bbox 319 143 321 638; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 563 391 565 736">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 563 391 565 736">
+     <span class='ocr_line' id='line_1_43' title="bbox 563 391 565 736; baseline 0 435"><span class='ocrx_word' id='word_1_197' title='bbox 563 391 565 736; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 546 629 551 949">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 546 629 551 949">
+     <span class='ocr_line' id='line_1_44' title="bbox 546 629 551 949; baseline 0 222"><span class='ocrx_word' id='word_1_198' title='bbox 546 629 551 949; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 546 905 761 1078">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 546 905 761 1078">
+     <span class='ocr_line' id='line_1_45' title="bbox 546 905 721 979; baseline 0 0"><span class='ocrx_word' id='word_1_199' title='bbox 546 905 721 979; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 546 979 761 1078; baseline 0 -55"><span class='ocrx_word' id='word_1_200' title='bbox 546 979 761 1078; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 440 313 443 959">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 440 313 443 959">
+     <span class='ocr_line' id='line_1_47' title="bbox 440 313 443 959; baseline 0 212"><span class='ocrx_word' id='word_1_201' title='bbox 440 313 443 959; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 444 939 498 968">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 444 939 498 968">
+     <span class='ocr_line' id='line_1_48' title="bbox 450 939 474 955; baseline 0 0"><span class='ocrx_word' id='word_1_202' title='bbox 450 939 474 955; x_wconf 82' lang='eng'><em>96</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 444 956 498 968; baseline 0 0"><span class='ocrx_word' id='word_1_203' title='bbox 444 956 498 968; x_wconf 70' lang='eng' dir='ltr'><em>—o</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 118 1008 156 1023">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 118 1008 156 1023">
+     <span class='ocr_line' id='line_1_50' title="bbox 118 1008 156 1023; baseline 0 0"><span class='ocrx_word' id='word_1_204' title='bbox 118 1008 156 1023; x_wconf 86' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 644 1057 664 1072">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 644 1057 664 1072">
+     <span class='ocr_line' id='line_1_51' title="bbox 644 1057 664 1072; baseline 0 0"><span class='ocrx_word' id='word_1_205' title='bbox 644 1057 664 1072; x_wconf 90' lang='eng'>51</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 491 786 494 1133">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 491 786 494 1133">
+     <span class='ocr_line' id='line_1_52' title="bbox 491 786 494 1133; baseline 0 38"><span class='ocrx_word' id='word_1_206' title='bbox 491 786 494 1133; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000174-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000174-0-000.pbm.png
new file mode 100644
index 00000000..b78652c8
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000174-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000174-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000174-0-000.pbm.png.hocr
new file mode 100644
index 00000000..0cce8bbf
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000174-0-000.pbm.png.hocr
@@ -0,0 +1,66 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000174-0-000.pbm.png"; bbox 0 0 994 516; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 273 4 951 34">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 273 4 951 34">
+     <span class='ocr_line' id='line_1_1' title="bbox 273 4 951 34; baseline 0 -7"><span class='ocrx_word' id='word_1_1' title='bbox 273 4 448 34; x_wconf 78' lang='eng' dir='ltr'><em>‘Rhodoplanes</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 458 4 616 34; x_wconf 77' lang='eng' dir='ltr'><em>cryptolactis’</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 633 5 701 27; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 711 5 773 27; x_wconf 84' lang='eng'><em>9987</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 791 5 951 33; x_wconf 88' lang='eng' dir='ltr'>(AB087718)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 9 324 504">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 9 324 504">
+     <span class='ocr_line' id='line_1_2' title="bbox 165 9 272 51; baseline 0 -1"><span class='ocrx_word' id='word_1_6' title='bbox 165 9 272 51; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 138 51 272 120; baseline 0 -4"><span class='ocrx_word' id='word_1_7' title='bbox 138 51 272 120; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 63 120 251 187; baseline 0.027 -4"><span class='ocrx_word' id='word_1_8' title='bbox 63 120 251 187; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 0 187 303 321; baseline 0.02 -70"><span class='ocrx_word' id='word_1_9' title='bbox 0 187 303 321; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 0 321 324 461; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 0 321 324 461; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 0 461 275 504; baseline 0 12"><span class='ocrx_word' id='word_1_11' title='bbox 0 461 275 504; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 244 67 990 445">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 244 67 844 168">
+     <span class='ocr_line' id='line_1_8' title="bbox 288 67 844 100; baseline 0.002 -7"><span class='ocrx_word' id='word_1_12' title='bbox 288 70 455 100; x_wconf 81' lang='eng' dir='ltr'><em>Rhodoplanes</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 465 78 547 93; x_wconf 77' lang='eng' dir='ltr'><em>roseus</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 557 72 624 94; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 635 67 710 94; x_wconf 86' lang='eng' dir='ltr'><em>5909T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 721 70 844 100; x_wconf 83' lang='eng' dir='ltr'>(D25313)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 244 136 758 168; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 244 139 410 168; x_wconf 80' lang='eng' dir='ltr'><em>Rhodoplanes</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 420 139 517 168; x_wconf 83' lang='eng' dir='ltr'><em>elegans</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 527 136 628 162; x_wconf 80' lang='eng' dir='ltr'><em>A8130T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 635 139 728 167; x_wconf 88' lang='eng' dir='ltr'>(D2531</span> <span class='ocrx_word' id='word_1_21' title='bbox 737 139 758 168; x_wconf 94' lang='eng'><em>1)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 263 203 670 235">
+     <span class='ocr_line' id='line_1_10' title="bbox 263 203 670 235; baseline 0.002 -6"><span class='ocrx_word' id='word_1_22' title='bbox 263 207 345 230; x_wconf 82' lang='eng' dir='ltr'><strong>Strain</strong></span> <span class='ocrx_word' id='word_1_23' title='bbox 356 203 499 230; x_wconf 86' lang='eng' dir='ltr'><em>TUT3530T</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 509 207 670 235; x_wconf 87' lang='eng' dir='ltr'><strong>(AB087717)</strong></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 281 273 990 445">
+     <span class='ocr_line' id='line_1_11' title="bbox 303 273 889 305; baseline 0.002 -7"><span class='ocrx_word' id='word_1_25' title='bbox 303 276 473 298; x_wconf 77' lang='eng' dir='ltr'><em>Blastochlaris</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 484 276 563 298; x_wconf 82' lang='eng' dir='ltr'><em>viridis</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 573 277 657 299; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_28' title='bbox 671 273 889 305; x_wconf 71' lang='eng' dir='ltr'>19567T(D25314)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 336 343 937 375; baseline 0.002 -7"><span class='ocrx_word' id='word_1_29' title='bbox 336 345 506 368; x_wconf 80' lang='eng' dir='ltr'><em>Blastochloris</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 516 345 659 374; x_wconf 76' lang='eng' dir='ltr'><em>sulfoviridis</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 671 346 736 369; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 748 343 807 369; x_wconf 84' lang='eng' dir='ltr'><em>729T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 815 346 937 375; x_wconf 88' lang='eng' dir='ltr'>(D86514)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 281 412 990 445; baseline 0 -7"><span class='ocrx_word' id='word_1_34' title='bbox 281 415 538 444; x_wconf 79' lang='eng' dir='ltr'><em>Rhodopseudomonas</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 545 415 659 444; x_wconf 81' lang='eng' dir='ltr'><em>palustris</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 674 416 758 439; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_37' title='bbox 771 412 990 445; x_wconf 75' lang='eng' dir='ltr'>17001T(D25312)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 293 481 956 513">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 293 481 956 513">
+     <span class='ocr_line' id='line_1_14' title="bbox 293 481 956 513; baseline 0 -6"><span class='ocrx_word' id='word_1_38' title='bbox 293 484 465 507; x_wconf 76' lang='eng' dir='ltr'><em>Rhodoblastus</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 476 484 625 513; x_wconf 74' lang='eng' dir='ltr'><em>acidophilus</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 634 485 718 508; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_41' title='bbox 728 481 820 508; x_wconf 90' lang='eng' dir='ltr'><em>25092T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 828 484 956 513; x_wconf 85' lang='eng' dir='ltr'>(M34128)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000257-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000257-0-000.pbm.png
new file mode 100644
index 00000000..5e672768
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000257-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000257-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000257-0-000.pbm.png.hocr
new file mode 100644
index 00000000..54293153
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000257-0-000.pbm.png.hocr
@@ -0,0 +1,652 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000257-0-000.pbm.png"; bbox 0 0 1302 1689; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 1 1459 9 1670">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 1 1459 9 1670">
+     <span class='ocr_line' id='line_1_1' title="bbox 1 1459 9 1670; baseline 0 19"><span class='ocrx_word' id='word_1_1' title='bbox 1 1459 9 1670; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 129 521 157 537">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 129 521 157 537">
+     <span class='ocr_line' id='line_1_2' title="bbox 129 521 157 537; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 129 521 157 537; x_wconf 88' lang='eng'>0.0</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 143 1307 167 1322">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 144 1307 166 1322">
+     <span class='ocr_line' id='line_1_3' title="bbox 144 1307 166 1322; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 144 1307 166 1322; x_wconf 80' lang='eng'><em>59</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 161 522 166 537">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 161 522 166 537">
+     <span class='ocr_line' id='line_1_4' title="bbox 161 522 166 537; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 161 522 166 537; x_wconf 99' lang='eng'><em>1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 214 1189 236 1205">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 214 1189 236 1205">
+     <span class='ocr_line' id='line_1_5' title="bbox 214 1189 236 1205; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 214 1189 236 1205; x_wconf 82' lang='eng'><em>84</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 141 1324 171 1326">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 141 1324 171 1326">
+     <span class='ocr_line' id='line_1_6' title="bbox 141 1324 171 1326; baseline 0 363"><span class='ocrx_word' id='word_1_6' title='bbox 141 1324 171 1326; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 138 1324 146 1597">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 138 1324 146 1597">
+     <span class='ocr_line' id='line_1_7' title="bbox 138 1324 146 1597; baseline 0 92"><span class='ocrx_word' id='word_1_7' title='bbox 138 1324 146 1597; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 166 1209 174 1440">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 166 1209 174 1440">
+     <span class='ocr_line' id='line_1_8' title="bbox 166 1209 174 1440; baseline 0 249"><span class='ocrx_word' id='word_1_8' title='bbox 166 1209 174 1440; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 171 1209 244 1211">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 171 1209 244 1211">
+     <span class='ocr_line' id='line_1_9' title="bbox 171 1209 244 1211; baseline 0 478"><span class='ocrx_word' id='word_1_9' title='bbox 171 1209 244 1211; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 311 869 317 1070">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 311 869 317 1070">
+     <span class='ocr_line' id='line_1_10' title="bbox 311 869 317 1070; baseline 0 619"><span class='ocrx_word' id='word_1_10' title='bbox 311 869 317 1070; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 436 1 1264 751">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 437 6 1260 744">
+     <span class='ocr_line' id='line_1_11' title="bbox 610 6 1196 31; baseline -0.003 -3"><span class='ocrx_word' id='word_1_11' title='bbox 610 12 632 28; x_wconf 85' lang='eng'>96</span> <span class='ocrx_word' id='word_1_12' title='bbox 638 15 659 17; x_wconf 91' lang='eng'>—</span> <span class='ocrx_word' id='word_1_13' title='bbox 666 8 822 31; x_wconf 73' lang='eng' dir='ltr'><em>Sphfngomonas</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 829 9 950 31; x_wconf 78' lang='eng' dir='ltr'><em>yabuuchiae</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 959 8 1007 26; x_wconf 91' lang='eng' dir='ltr'><em>GTC</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 1016 6 1063 26; x_wconf 79' lang='eng' dir='ltr'><em>868T</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1072 8 1196 31; x_wconf 85' lang='eng' dir='ltr'>(ABO71955)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 727 39 1189 63; baseline 0 -5"><span class='ocrx_word' id='word_1_18' title='bbox 727 41 884 63; x_wconf 83' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 892 41 992 58; x_wconf 86' lang='eng' dir='ltr'><em>roseiﬂava</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1001 39 1084 58; x_wconf 78' lang='eng' dir='ltr'><em>MK341T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1093 41 1189 63; x_wconf 85' lang='eng' dir='ltr'><em>(D84520)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 671 71 1247 95; baseline -0.002 -4"><span class='ocrx_word' id='word_1_22' title='bbox 671 73 828 95; x_wconf 82' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 835 73 1013 95; x_wconf 84' lang='eng' dir='ltr'><em>parapaucimobilis</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 1022 73 1059 91; x_wconf 91' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1069 71 1142 91; x_wconf 79' lang='eng' dir='ltr'><em>15100T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1151 73 1247 95; x_wconf 88' lang='eng' dir='ltr'>(D13724)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 638 103 1186 128; baseline 0 -5"><span class='ocrx_word' id='word_1_27' title='bbox 638 105 795 128; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 802 106 980 128; x_wconf 74' lang='eng' dir='ltr'><em>pseudosanguinis</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 988 105 1014 123; x_wconf 90' lang='eng' dir='ltr'>G1</span> <span class='ocrx_word' id='word_1_30' title='bbox 1019 103 1049 123; x_wconf 61' lang='eng' dir='ltr'><em>~2T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1058 105 1186 128; x_wconf 83' lang='eng' dir='ltr'><em>(AM412238)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 640 136 1194 160; baseline 0 -5"><span class='ocrx_word' id='word_1_32' title='bbox 640 144 689 146; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_33' title='bbox 696 138 853 160; x_wconf 80' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 861 138 960 160; x_wconf 83' lang='eng' dir='ltr'><em>sanguinis</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 969 138 1006 155; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1016 136 1089 155; x_wconf 80' lang='eng' dir='ltr'><em>13937T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1098 138 1194 160; x_wconf 84' lang='eng' dir='ltr'><em>(D84529)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 611 168 1224 193; baseline 0 -5"><span class='ocrx_word' id='word_1_38' title='bbox 611 169 633 184; x_wconf 85' lang='eng'>97</span> <span class='ocrx_word' id='word_1_39' title='bbox 640 177 686 179; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_40' title='bbox 692 170 849 192; x_wconf 82' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 856 170 987 192; x_wconf 75' lang='eng' dir='ltr'><em>paucimobilis</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 994 170 1048 188; x_wconf 91' lang='eng' dir='ltr'><strong>GIFU</strong></span> <span class='ocrx_word' id='word_1_43' title='bbox 1058 168 1119 188; x_wconf 79' lang='eng' dir='ltr'><em>2395T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1128 170 1224 193; x_wconf 89' lang='eng' dir='ltr'><em>(D16144)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 509 201 1142 225; baseline 0 -5"><span class='ocrx_word' id='word_1_45' title='bbox 509 209 612 211; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_46' title='bbox 619 203 776 225; x_wconf 85' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 784 203 891 220; x_wconf 83' lang='eng' dir='ltr'><em>adhaesiva</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 899 203 953 220; x_wconf 88' lang='eng' dir='ltr'><em>GIFU</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 964 201 1037 220; x_wconf 79' lang='eng' dir='ltr'><em>11458T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1045 203 1142 225; x_wconf 82' lang='eng'><em>(084527)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 580 235 1185 257; baseline 0 -5"><span class='ocrx_word' id='word_1_51' title='bbox 580 242 671 244; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_52' title='bbox 677 235 834 257; x_wconf 83' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 841 235 1002 257; x_wconf 79' lang='eng' dir='ltr'><em>phyllosphaerae</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 1011 235 1048 252; x_wconf 90' lang='eng' dir='ltr'>FA1</span> <span class='ocrx_word' id='word_1_55' title='bbox 1060 235 1185 257; x_wconf 83' lang='eng' dir='ltr'><em>(AY563441)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 541 265 1169 290; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 541 265 573 280; x_wconf 79' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 580 274 627 276; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_58' title='bbox 634 267 791 290; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 798 268 931 290; x_wconf 84' lang='eng' dir='ltr'><em>yunnanensis</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 938 268 979 285; x_wconf 90' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 988 265 1036 285; x_wconf 75' lang='eng' dir='ltr'><em>003T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1044 267 1169 290; x_wconf 81' lang='eng' dir='ltr'>(AY894691)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 534 298 1057 322; baseline 0 -4"><span class='ocrx_word' id='word_1_63' title='bbox 534 307 557 309; x_wconf 91' lang='eng'>—</span> <span class='ocrx_word' id='word_1_64' title='bbox 563 300 720 322; x_wconf 82' lang='eng' dir='ltr'><em>Sphingornonas</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 728 300 848 318; x_wconf 71' lang='eng' dir='ltr'><em>desiccabi/is</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 856 298 928 318; x_wconf 86' lang='eng' dir='ltr'><em>CP1DT</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 936 300 1057 322; x_wconf 85' lang='eng' dir='ltr'>(AJ871435)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 622 331 1132 355; baseline 0 -5"><span class='ocrx_word' id='word_1_68' title='bbox 622 333 779 355; x_wconf 73' lang='eng' dir='ltr'><em>Sphfngomonas</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 787 333 921 350; x_wconf 81' lang='eng' dir='ltr'><em>molluscorum</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 928 333 955 350; x_wconf 92' lang='eng' dir='ltr'>An</span> <span class='ocrx_word' id='word_1_71' title='bbox 966 331 999 350; x_wconf 74' lang='eng' dir='ltr'><em>18T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1008 333 1132 355; x_wconf 80' lang='eng' dir='ltr'><em>(ABZ48285)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 722 363 1001 387; baseline -0.004 -4"><span class='ocrx_word' id='word_1_73' title='bbox 722 365 787 383; x_wconf 84' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 797 363 864 383; x_wconf 65' lang='eng' dir='ltr'><em>NxozY</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 873 365 1001 387; x_wconf 83' lang='eng' dir='ltr'>(DQ789172)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 638 395 1104 420; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 638 404 645 406; x_wconf 88' lang='eng'><em>-</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 651 397 808 420; x_wconf 70' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 815 398 903 419; x_wconf 79' lang='eng' dir='ltr'><em>pituitosa</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 912 395 975 415; x_wconf 84' lang='eng' dir='ltr'><em>EDIVT</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 984 397 1104 420; x_wconf 83' lang='eng' dir='ltr'>(AJ243751)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 638 428 1164 471; baseline 0 -24"><span class='ocrx_word' id='word_1_81' title='bbox 638 430 845 471; x_wconf 64' lang='eng' dir='ltr'><em>_LSphingomonas</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 853 430 933 452; x_wconf 82' lang='eng' dir='ltr'><em>trueperi</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 941 430 989 447; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 998 428 1059 447; x_wconf 88' lang='eng' dir='ltr'><em>2142T</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1068 430 1164 452; x_wconf 87' lang='eng' dir='ltr'><em>(X97776)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 645 460 1260 484; baseline -0.002 -4"><span class='ocrx_word' id='word_1_86' title='bbox 645 460 667 475; x_wconf 82' lang='eng'>99</span> <span class='ocrx_word' id='word_1_87' title='bbox 693 462 850 484; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 858 462 970 484; x_wconf 74' lang='eng' dir='ltr'><em>azotiﬁgens</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 979 462 1043 480; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_90' title='bbox 1054 460 1126 480; x_wconf 85' lang='eng' dir='ltr'><em>15497T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1135 462 1260 484; x_wconf 87' lang='eng' dir='ltr'>(AB217471)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 437 492 981 517; baseline 0 -5"><span class='ocrx_word' id='word_1_92' title='bbox 437 501 564 503; x_wconf 43' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 570 494 727 517; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 734 495 793 517; x_wconf 87' lang='eng' dir='ltr'><em>panni</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 800 492 852 512; x_wconf 81' lang='eng' dir='ltr'><em>052T</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 860 494 981 517; x_wconf 86' lang='eng' dir='ltr'>(AJ575818)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 464 525 1142 549; baseline 0 -5"><span class='ocrx_word' id='word_1_97' title='bbox 464 532 486 547; x_wconf 69' lang='eng'><em>89</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 593 527 750 549; x_wconf 85' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 758 527 894 544; x_wconf 78' lang='eng' dir='ltr'><em>mucosissima</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 903 525 1005 544; x_wconf 79' lang='eng' dir='ltr'><em>CP173-2T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 1013 527 1142 549; x_wconf 83' lang='eng' dir='ltr'>(AM229669)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 493 557 1065 581; baseline 0.002 -5"><span class='ocrx_word' id='word_1_102' title='bbox 493 565 555 567; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_103' title='bbox 561 559 718 581; x_wconf 86' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 726 559 858 577; x_wconf 76' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 866 557 928 577; x_wconf 78' lang='eng' dir='ltr'><em>DS-4T</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 937 559 1065 581; x_wconf 86' lang='eng' dir='ltr'>(DQ178975)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 561 590 1045 614; baseline 0.002 -5"><span class='ocrx_word' id='word_1_107' title='bbox 561 592 718 614; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 726 592 826 610; x_wconf 86' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 834 590 913 610; x_wconf 74' lang='eng' dir='ltr'><em>JSSZBT</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 922 592 1045 614; x_wconf 85' lang='eng' dir='ltr'>(AF131296)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 455 622 1053 647; baseline 0 -5"><span class='ocrx_word' id='word_1_111' title='bbox 455 631 637 633; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_112' title='bbox 643 624 800 647; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 808 625 843 642; x_wconf 85' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 849 622 920 642; x_wconf 79' lang='eng' dir='ltr'><em>T5-04T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 929 624 1053 647; x_wconf 80' lang='eng' dir='ltr'><em>(AB166883)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 458 655 937 679; baseline -0.004 -3"><span class='ocrx_word' id='word_1_116' title='bbox 458 660 477 676; x_wconf 82' lang='eng'>91</span> <span class='ocrx_word' id='word_1_117' title='bbox 497 657 654 679; x_wconf 82' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 662 657 706 674; x_wconf 84' lang='eng' dir='ltr'><em>mali</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 713 657 750 674; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 760 655 833 674; x_wconf 79' lang='eng' dir='ltr'><em>15500T</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 841 657 937 679; x_wconf 82' lang='eng' dir='ltr'><em>(Y09638)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 438 684 961 711; baseline 0.002 -5"><span class='ocrx_word' id='word_1_122' title='bbox 438 684 459 700; x_wconf 72' lang='eng'><em>80</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 512 689 669 711; x_wconf 85' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 676 689 730 711; x_wconf 90' lang='eng' dir='ltr'><em>pruni</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 737 689 774 707; x_wconf 91' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 784 687 857 707; x_wconf 73' lang='eng' dir='ltr'><em>15498T</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 865 689 961 711; x_wconf 82' lang='eng' dir='ltr'><em>(Y09637)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 466 719 1071 744; baseline 0 -5"><span class='ocrx_word' id='word_1_128' title='bbox 466 728 505 730; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_129' title='bbox 511 721 668 744; x_wconf 82' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 676 722 838 744; x_wconf 81' lang='eng' dir='ltr'><em>asaccharolytica</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 848 721 885 739; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 895 719 968 739; x_wconf 79' lang='eng' dir='ltr'><em>15499T</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 976 721 1071 744; x_wconf 84' lang='eng' dir='ltr'><em>(Y09639)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 556 37 589 93">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 557 37 589 93">
+     <span class='ocr_line' id='line_1_34' title="bbox 567 37 589 52; baseline 0 0"><span class='ocrx_word' id='word_1_134' title='bbox 567 37 589 52; x_wconf 89' lang='eng'><em>64</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 557 77 579 93; baseline 0 0"><span class='ocrx_word' id='word_1_135' title='bbox 557 77 579 93; x_wconf 79' lang='eng'><em>99</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 638 47 721 49">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 638 47 721 49">
+     <span class='ocr_line' id='line_1_36' title="bbox 638 47 721 49; baseline 0 1640"><span class='ocrx_word' id='word_1_136' title='bbox 638 47 721 49; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 495 95 585 99">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 495 95 585 99">
+     <span class='ocr_line' id='line_1_37' title="bbox 495 95 585 99; baseline 0 1590"><span class='ocrx_word' id='word_1_137' title='bbox 495 95 585 99; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 582 55 586 138">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 582 55 586 138">
+     <span class='ocr_line' id='line_1_38' title="bbox 582 55 586 138; baseline 0 1551"><span class='ocrx_word' id='word_1_138' title='bbox 582 55 586 138; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 583 136 600 138">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 583 136 600 138">
+     <span class='ocr_line' id='line_1_39' title="bbox 583 136 600 138; baseline 0 1551"><span class='ocrx_word' id='word_1_139' title='bbox 583 136 600 138; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 636 15 640 179">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 636 15 640 179">
+     <span class='ocr_line' id='line_1_40' title="bbox 636 15 640 179; baseline 0 1510"><span class='ocrx_word' id='word_1_140' title='bbox 636 15 640 179; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 599 112 601 162">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 599 112 601 162">
+     <span class='ocr_line' id='line_1_41' title="bbox 599 112 601 162; baseline 0 1527"><span class='ocrx_word' id='word_1_141' title='bbox 599 112 601 162; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 572 144 594 159">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 572 144 594 159">
+     <span class='ocr_line' id='line_1_42' title="bbox 572 144 594 159; baseline 0 0"><span class='ocrx_word' id='word_1_142' title='bbox 572 144 594 159; x_wconf 89' lang='eng'>74</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 599 159 640 163">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 599 159 640 163">
+     <span class='ocr_line' id='line_1_43' title="bbox 599 159 640 163; baseline 0 1526"><span class='ocrx_word' id='word_1_143' title='bbox 599 159 640 163; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 494 96 498 235">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 494 96 498 235">
+     <span class='ocr_line' id='line_1_44' title="bbox 494 96 498 235; baseline 0 1454"><span class='ocrx_word' id='word_1_144' title='bbox 494 96 498 235; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 506 209 510 260">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 506 209 510 260">
+     <span class='ocr_line' id='line_1_45' title="bbox 506 209 510 260; baseline 0 1429"><span class='ocrx_word' id='word_1_145' title='bbox 506 209 510 260; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 507 257 580 261">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 507 257 580 261">
+     <span class='ocr_line' id='line_1_46' title="bbox 507 257 580 261; baseline 0 1428"><span class='ocrx_word' id='word_1_146' title='bbox 507 257 580 261; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 577 242 581 276">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 577 242 581 276">
+     <span class='ocr_line' id='line_1_47' title="bbox 577 242 581 276; baseline 0 1413"><span class='ocrx_word' id='word_1_147' title='bbox 577 242 581 276; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 506 303 528 319">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 506 304 528 319">
+     <span class='ocr_line' id='line_1_48' title="bbox 506 304 528 319; baseline 0 0"><span class='ocrx_word' id='word_1_148' title='bbox 506 304 528 319; x_wconf 80' lang='eng'><em>95</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 468 322 534 326">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 468 322 534 326">
+     <span class='ocr_line' id='line_1_49' title="bbox 468 322 534 326; baseline 0 1363"><span class='ocrx_word' id='word_1_149' title='bbox 468 322 534 326; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 531 307 535 341">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 531 307 535 341">
+     <span class='ocr_line' id='line_1_50' title="bbox 531 307 535 341; baseline 0 1348"><span class='ocrx_word' id='word_1_150' title='bbox 531 307 535 341; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 534 339 616 341">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 534 339 616 341">
+     <span class='ocr_line' id='line_1_51' title="bbox 534 339 616 341; baseline 0 1348"><span class='ocrx_word' id='word_1_151' title='bbox 534 339 616 341; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 467 323 471 400">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 467 323 471 400">
+     <span class='ocr_line' id='line_1_52' title="bbox 467 323 471 400; baseline 0 1289"><span class='ocrx_word' id='word_1_152' title='bbox 467 323 471 400; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 468 399 505 401">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 468 399 505 401">
+     <span class='ocr_line' id='line_1_53' title="bbox 468 399 505 401; baseline 0 1288"><span class='ocrx_word' id='word_1_153' title='bbox 468 399 505 401; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 474 407 495 422">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 475 407 494 422">
+     <span class='ocr_line' id='line_1_54' title="bbox 475 407 494 422; baseline 0 0"><span class='ocrx_word' id='word_1_154' title='bbox 475 407 494 422; x_wconf 92' lang='eng'><em>71</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 502 371 506 430">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 502 371 506 430">
+     <span class='ocr_line' id='line_1_55' title="bbox 502 371 506 430; baseline 0 1259"><span class='ocrx_word' id='word_1_155' title='bbox 502 371 506 430; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 503 426 638 432">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 503 426 638 432">
+     <span class='ocr_line' id='line_1_56' title="bbox 503 426 638 432; baseline 0 1257"><span class='ocrx_word' id='word_1_156' title='bbox 503 426 638 432; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 635 404 639 455">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 635 404 639 455">
+     <span class='ocr_line' id='line_1_57' title="bbox 635 404 639 455; baseline 0 1234"><span class='ocrx_word' id='word_1_157' title='bbox 635 404 639 455; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 602 434 634 452">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 602 435 634 451">
+     <span class='ocr_line' id='line_1_58' title="bbox 602 435 634 451; baseline 0 0"><span class='ocrx_word' id='word_1_158' title='bbox 602 435 634 451; x_wconf 85' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 435 548 493 552">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 435 548 493 552">
+     <span class='ocr_line' id='line_1_59' title="bbox 435 548 493 552; baseline 0 1137"><span class='ocrx_word' id='word_1_159' title='bbox 435 548 493 552; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 491 533 493 567">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 491 533 493 567">
+     <span class='ocr_line' id='line_1_60' title="bbox 491 533 493 567; baseline 0 1122"><span class='ocrx_word' id='word_1_160' title='bbox 491 533 493 567; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 413 382 421 584">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 413 382 421 584">
+     <span class='ocr_line' id='line_1_61' title="bbox 413 382 421 584; baseline 0 1105"><span class='ocrx_word' id='word_1_161' title='bbox 413 382 421 584; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 431 262 441 617">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 431 262 441 617">
+     <span class='ocr_line' id='line_1_62' title="bbox 431 262 441 617; baseline 0 1072"><span class='ocrx_word' id='word_1_162' title='bbox 431 262 441 617; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 377 613 455 618">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 377 613 455 618">
+     <span class='ocr_line' id='line_1_63' title="bbox 377 613 455 618; baseline 0 1071"><span class='ocrx_word' id='word_1_163' title='bbox 377 613 455 618; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 453 598 455 633">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 453 598 455 633">
+     <span class='ocr_line' id='line_1_64' title="bbox 453 598 455 633; baseline 0 1056"><span class='ocrx_word' id='word_1_164' title='bbox 453 598 455 633; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 464 679 466 730">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 464 679 466 730">
+     <span class='ocr_line' id='line_1_65' title="bbox 464 679 466 730; baseline 0 959"><span class='ocrx_word' id='word_1_165' title='bbox 464 679 466 730; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 352 757 529 765">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 352 757 529 765">
+     <span class='ocr_line' id='line_1_66' title="bbox 352 757 529 765; baseline 0 924"><span class='ocrx_word' id='word_1_166' title='bbox 352 757 529 765; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 350 760 356 981">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 350 760 356 981">
+     <span class='ocr_line' id='line_1_67' title="bbox 350 760 356 981; baseline 0 708"><span class='ocrx_word' id='word_1_167' title='bbox 350 760 356 981; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 458 748 1035 816">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 458 752 1035 809">
+     <span class='ocr_line' id='line_1_68' title="bbox 535 752 990 776; baseline 0 -5"><span class='ocrx_word' id='word_1_168' title='bbox 535 754 692 776; x_wconf 83' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 700 754 774 771; x_wconf 83' lang='eng' dir='ltr'><em>insu/ae</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 783 752 858 771; x_wconf 89' lang='eng' dir='ltr'><em>DS-28T</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 866 754 990 776; x_wconf 84' lang='eng' dir='ltr'><em>(EF363714)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_69' title="bbox 458 784 1035 809; baseline 0 -5"><span class='ocrx_word' id='word_1_172' title='bbox 458 793 619 795; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_173' title='bbox 626 786 783 809; x_wconf 81' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 790 787 847 804; x_wconf 85' lang='eng' dir='ltr'><em>abaci</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 854 784 906 804; x_wconf 77' lang='eng' dir='ltr'><em>C42T</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 915 786 1035 809; x_wconf 85' lang='eng' dir='ltr'>(AJ575817)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 457 813 1073 880">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 474 817 1073 873">
+     <span class='ocr_line' id='line_1_70' title="bbox 511 817 977 859; baseline 0 -23"><span class='ocrx_word' id='word_1_177' title='bbox 511 819 678 859; x_wconf 77' lang='eng' dir='ltr'><em>[Sphingomonas</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 686 819 772 841; x_wconf 78' lang='eng' dir='ltr'><em>aquatilis</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 780 817 845 836; x_wconf 89' lang='eng' dir='ltr'><em>JSS7T</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 854 819 977 841; x_wconf 84' lang='eng' dir='ltr'>(AF131295)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 474 848 1073 873; baseline 0.002 -5"><span class='ocrx_word' id='word_1_181' title='bbox 474 848 506 863; x_wconf 78' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 525 851 682 873; x_wconf 79' lang='eng' dir='ltr'><em>Sphingnmnnas</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 690 851 771 869; x_wconf 76' lang='eng' dir='ltr'><em>melon/s</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 779 851 884 869; x_wconf 88' lang='eng' dir='ltr'><em>DAPP-PG</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 893 849 941 868; x_wconf 76' lang='eng' dir='ltr'><em>224T</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 949 851 1073 873; x_wconf 76' lang='eng' dir='ltr'><em>(A3055863)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 378 877 1183 929">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 379 881 1182 929">
+     <span class='ocr_line' id='line_1_72' title="bbox 379 881 1182 924; baseline 0 -23"><span class='ocrx_word' id='word_1_187' title='bbox 379 889 612 924; x_wconf 56' lang='eng'><em>_‘_—</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 618 883 775 906; x_wconf 81' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 783 884 895 901; x_wconf 82' lang='eng' dir='ltr'><em>echinaides</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 902 883 966 901; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 976 881 1049 901; x_wconf 75' lang='eng' dir='ltr'><em>14820T</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 1058 883 1182 906; x_wconf 87' lang='eng' dir='ltr'>(ABO21370)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_73' title="bbox 415 913 425 929; baseline 0 0"><span class='ocrx_word' id='word_1_193' title='bbox 415 913 425 929; x_wconf 81' lang='eng'>9</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 427 906 1052 979">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 427 914 1052 971">
+     <span class='ocr_line' id='line_1_74' title="bbox 427 914 1009 938; baseline 0.002 -5"><span class='ocrx_word' id='word_1_194' title='bbox 427 914 438 929; x_wconf 91' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 489 916 645 938; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 654 916 804 938; x_wconf 81' lang='eng' dir='ltr'><em>oligophenolica</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 812 914 876 934; x_wconf 56' lang='eng' dir='ltr'><em>8213&#39;r</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 885 916 1009 938; x_wconf 83' lang='eng' dir='ltr'><em>(ABO18439)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_75' title="bbox 591 946 1052 971; baseline 0 -5"><span class='ocrx_word' id='word_1_199' title='bbox 591 948 748 971; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 756 949 840 966; x_wconf 79' lang='eng' dir='ltr'><em>aemlata</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 849 946 923 966; x_wconf 87' lang='eng' dir='ltr'><em>NW12T</em></span> <span class='ocrx_word' id='word_1_202' title='bbox 932 948 1052 971; x_wconf 86' lang='eng' dir='ltr'><em>(AJ429240)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 415 760 417 819">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 415 760 417 819">
+     <span class='ocr_line' id='line_1_76' title="bbox 415 760 417 819; baseline 0 870"><span class='ocrx_word' id='word_1_203' title='bbox 415 760 417 819; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 423 824 444 839">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 424 824 443 839">
+     <span class='ocr_line' id='line_1_77' title="bbox 424 824 443 839; baseline 0 0"><span class='ocrx_word' id='word_1_204' title='bbox 424 824 443 839; x_wconf 91' lang='eng'><em>71</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 455 793 459 843">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 455 793 459 843">
+     <span class='ocr_line' id='line_1_78' title="bbox 455 793 459 843; baseline 0 846"><span class='ocrx_word' id='word_1_205' title='bbox 455 793 459 843; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 373 614 383 908">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 373 614 383 908">
+     <span class='ocr_line' id='line_1_79' title="bbox 373 614 383 908; baseline 0 781"><span class='ocrx_word' id='word_1_206' title='bbox 373 614 383 908; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 353 948 1087 1022">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 505 979 1086 1003">
+     <span class='ocr_line' id='line_1_80' title="bbox 505 979 1086 1003; baseline 0 -4"><span class='ocrx_word' id='word_1_207' title='bbox 505 986 537 1001; x_wconf 90' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 577 981 734 1003; x_wconf 83' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 742 981 851 999; x_wconf 77' lang='eng' dir='ltr'><em>aurantiaca</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 860 979 956 999; x_wconf 83' lang='eng' dir='ltr'><em>MA101bT</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 965 981 1086 1003; x_wconf 80' lang='eng' dir='ltr'>(AJ429236)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 541 1003 1108 1074">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 541 1010 1107 1068">
+     <span class='ocr_line' id='line_1_81' title="bbox 541 1010 1017 1036; baseline 0 -5"><span class='ocrx_word' id='word_1_212' title='bbox 541 1010 563 1026; x_wconf 80' lang='eng'><em>‘39</em></span> <span class='ocrx_word' id='word_1_213' title='bbox 577 1013 734 1036; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_214' title='bbox 742 1013 793 1031; x_wconf 86' lang='eng' dir='ltr'><em>faeni</em></span> <span class='ocrx_word' id='word_1_215' title='bbox 800 1011 887 1031; x_wconf 70' lang='eng' dir='ltr'><em>MA—olkiT</em></span> <span class='ocrx_word' id='word_1_216' title='bbox 896 1013 1017 1036; x_wconf 82' lang='eng' dir='ltr'>(AJ429239)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_82' title="bbox 631 1044 1107 1068; baseline 0 -5"><span class='ocrx_word' id='word_1_217' title='bbox 631 1046 788 1068; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_218' title='bbox 792 1046 856 1068; x_wconf 82' lang='eng' dir='ltr'><em>jaspsi</em></span> <span class='ocrx_word' id='word_1_219' title='bbox 862 1044 973 1063; x_wconf 80' lang='eng' dir='ltr'><em>TDMA-16T</em></span> <span class='ocrx_word' id='word_1_220' title='bbox 982 1046 1107 1068; x_wconf 80' lang='eng' dir='ltr'>(A8264131)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 313 1067 426 1071">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 313 1067 426 1071">
+     <span class='ocr_line' id='line_1_83' title="bbox 313 1067 426 1071; baseline 0 618"><span class='ocrx_word' id='word_1_221' title='bbox 313 1067 426 1071; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 244 1065 268 1080">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 245 1065 267 1080">
+     <span class='ocr_line' id='line_1_84' title="bbox 245 1065 267 1080; baseline 0 0"><span class='ocrx_word' id='word_1_222' title='bbox 245 1065 267 1080; x_wconf 81' lang='eng'><em>53</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 245 1083 274 1085">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 245 1083 274 1085">
+     <span class='ocr_line' id='line_1_85' title="bbox 245 1083 274 1085; baseline 0 604"><span class='ocrx_word' id='word_1_223' title='bbox 245 1083 274 1085; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_58' title="bbox 423 1052 427 1086">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 423 1052 427 1086">
+     <span class='ocr_line' id='line_1_86' title="bbox 423 1052 427 1086; baseline 0 603"><span class='ocrx_word' id='word_1_224' title='bbox 423 1052 427 1086; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_59' title="bbox 567 1072 1043 1106">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 567 1076 1043 1100">
+     <span class='ocr_line' id='line_1_87' title="bbox 567 1076 1043 1100; baseline 0.002 -5"><span class='ocrx_word' id='word_1_225' title='bbox 567 1078 724 1100; x_wconf 84' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_226' title='bbox 732 1078 835 1096; x_wconf 74' lang='eng' dir='ltr'><em>kaistensis</em></span> <span class='ocrx_word' id='word_1_227' title='bbox 844 1076 910 1096; x_wconf 74' lang='eng' dir='ltr'><em>PB56T</em></span> <span class='ocrx_word' id='word_1_228' title='bbox 919 1078 1043 1100; x_wconf 83' lang='eng' dir='ltr'>(AY769083)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_60' title="bbox 396 1067 1142 1142">
+    <p class='ocr_par' dir='ltr' id='par_1_60' title="bbox 396 1076 1142 1133">
+     <span class='ocr_line' id='line_1_88' title="bbox 396 1076 561 1092; baseline 0 0"><span class='ocrx_word' id='word_1_229' title='bbox 396 1076 418 1092; x_wconf 84' lang='eng'><em>96</em></span> <span class='ocrx_word' id='word_1_230' title='bbox 426 1084 561 1086; x_wconf 92' lang='eng'><strong>—</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_89' title="bbox 420 1108 1142 1133; baseline 0 -5"><span class='ocrx_word' id='word_1_231' title='bbox 420 1113 439 1129; x_wconf 86' lang='eng'>91</span> <span class='ocrx_word' id='word_1_232' title='bbox 595 1110 752 1133; x_wconf 83' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_233' title='bbox 760 1111 967 1128; x_wconf 76' lang='eng' dir='ltr'><em>haloaromaticamans</em></span> <span class='ocrx_word' id='word_1_234' title='bbox 973 1108 1038 1128; x_wconf 80' lang='eng' dir='ltr'><em>A175T</em></span> <span class='ocrx_word' id='word_1_235' title='bbox 1047 1110 1142 1133; x_wconf 85' lang='eng' dir='ltr'>(X94101)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_61' title="bbox 364 1138 383 1154">
+    <p class='ocr_par' dir='ltr' id='par_1_61' title="bbox 364 1138 383 1153">
+     <span class='ocr_line' id='line_1_90' title="bbox 364 1138 383 1153; baseline 0 0"><span class='ocrx_word' id='word_1_236' title='bbox 364 1138 383 1153; x_wconf 85' lang='eng'>91</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_62' title="bbox 305 1156 389 1160">
+    <p class='ocr_par' dir='ltr' id='par_1_62' title="bbox 305 1156 389 1160">
+     <span class='ocr_line' id='line_1_91' title="bbox 305 1156 389 1160; baseline 0 529"><span class='ocrx_word' id='word_1_237' title='bbox 305 1156 389 1160; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_63' title="bbox 269 969 277 1199">
+    <p class='ocr_par' dir='ltr' id='par_1_63' title="bbox 269 969 277 1199">
+     <span class='ocr_line' id='line_1_92' title="bbox 269 969 277 1199; baseline 0 490"><span class='ocrx_word' id='word_1_238' title='bbox 269 969 277 1199; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_64' title="bbox 304 1157 308 1240">
+    <p class='ocr_par' dir='ltr' id='par_1_64' title="bbox 304 1157 308 1240">
+     <span class='ocr_line' id='line_1_93' title="bbox 304 1157 308 1240; baseline 0 449"><span class='ocrx_word' id='word_1_239' title='bbox 304 1157 308 1240; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_65' title="bbox 386 1133 390 1183">
+    <p class='ocr_par' dir='ltr' id='par_1_65' title="bbox 386 1133 390 1183">
+     <span class='ocr_line' id='line_1_94' title="bbox 386 1133 390 1183; baseline 0 506"><span class='ocrx_word' id='word_1_240' title='bbox 386 1133 390 1183; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_66' title="bbox 389 1136 1164 1238">
+    <p class='ocr_par' dir='ltr' id='par_1_66' title="bbox 389 1141 1164 1230">
+     <span class='ocr_line' id='line_1_95' title="bbox 574 1141 1076 1165; baseline 0 -5"><span class='ocrx_word' id='word_1_241' title='bbox 574 1143 731 1165; x_wconf 83' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_242' title='bbox 740 1143 816 1160; x_wconf 77' lang='eng' dir='ltr'><em>wittichii</em></span> <span class='ocrx_word' id='word_1_243' title='bbox 823 1143 873 1160; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_244' title='bbox 882 1141 943 1160; x_wconf 73' lang='eng' dir='ltr'><em>6014T</em></span> <span class='ocrx_word' id='word_1_245' title='bbox 952 1143 1076 1165; x_wconf 82' lang='eng' dir='ltr'><em>(ABOZ1492)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_96' title="bbox 389 1173 1042 1198; baseline 0 -5"><span class='ocrx_word' id='word_1_246' title='bbox 389 1181 594 1183; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_247' title='bbox 601 1175 758 1197; x_wconf 80' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_248' title='bbox 766 1175 841 1193; x_wconf 83' lang='eng' dir='ltr'><em>fennica</em></span> <span class='ocrx_word' id='word_1_249' title='bbox 850 1173 913 1193; x_wconf 84' lang='eng' dir='ltr'><em>K101T</em></span> <span class='ocrx_word' id='word_1_250' title='bbox 922 1175 1042 1198; x_wconf 86' lang='eng' dir='ltr'><em>(AJ009706)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_97' title="bbox 480 1206 1164 1230; baseline 0 -5"><span class='ocrx_word' id='word_1_251' title='bbox 480 1214 632 1216; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_252' title='bbox 638 1208 774 1230; x_wconf 83' lang='eng' dir='ltr'><em>Sphingobium</em></span> <span class='ocrx_word' id='word_1_253' title='bbox 782 1208 902 1230; x_wconf 82' lang='eng' dir='ltr'><em>yanoikuyae</em></span> <span class='ocrx_word' id='word_1_254' title='bbox 911 1208 975 1226; x_wconf 86' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_255' title='bbox 985 1206 1058 1226; x_wconf 87' lang='eng' dir='ltr'><em>15102T</em></span> <span class='ocrx_word' id='word_1_256' title='bbox 1067 1208 1164 1230; x_wconf 81' lang='eng' dir='ltr'>(D13728)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_67' title="bbox 305 1236 480 1242">
+    <p class='ocr_par' dir='ltr' id='par_1_67' title="bbox 305 1236 480 1242">
+     <span class='ocr_line' id='line_1_98' title="bbox 305 1236 480 1242; baseline 0 447"><span class='ocrx_word' id='word_1_257' title='bbox 305 1236 480 1242; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_68' title="bbox 242 1083 250 1337">
+    <p class='ocr_par' dir='ltr' id='par_1_68' title="bbox 242 1083 250 1337">
+     <span class='ocr_line' id='line_1_99' title="bbox 242 1083 250 1337; baseline 0 352"><span class='ocrx_word' id='word_1_258' title='bbox 242 1083 250 1337; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_69' title="bbox 443 1233 1297 1285">
+    <p class='ocr_par' dir='ltr' id='par_1_69' title="bbox 443 1238 1297 1284">
+     <span class='ocr_line' id='line_1_100' title="bbox 443 1238 1297 1281; baseline -0.002 -21"><span class='ocrx_word' id='word_1_259' title='bbox 443 1245 690 1281; x_wconf 68' lang='eng'><em>100—:</em></span> <span class='ocrx_word' id='word_1_260' title='bbox 696 1240 833 1263; x_wconf 71' lang='eng' dir='ltr'><em>Sphingobium</em></span> <span class='ocrx_word' id='word_1_261' title='bbox 841 1241 1008 1258; x_wconf 74' lang='eng' dir='ltr'><em>herbicidovorans</em></span> <span class='ocrx_word' id='word_1_262' title='bbox 1017 1240 1081 1258; x_wconf 89' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_263' title='bbox 1092 1238 1164 1258; x_wconf 82' lang='eng' dir='ltr'><em>16415T</em></span> <span class='ocrx_word' id='word_1_264' title='bbox 1173 1240 1297 1263; x_wconf 81' lang='eng' dir='ltr'>(ABO42233)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_101' title="bbox 545 1269 566 1284; baseline 0 0"><span class='ocrx_word' id='word_1_265' title='bbox 545 1269 566 1284; x_wconf 85' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_70' title="bbox 477 1266 1264 1333">
+    <p class='ocr_par' dir='ltr' id='par_1_70' title="bbox 477 1271 1263 1327">
+     <span class='ocr_line' id='line_1_102' title="bbox 675 1271 1263 1295; baseline 0 -5"><span class='ocrx_word' id='word_1_266' title='bbox 675 1273 812 1295; x_wconf 75' lang='eng' dir='ltr'><em>Sphingobium</em></span> <span class='ocrx_word' id='word_1_267' title='bbox 820 1273 1005 1295; x_wconf 83' lang='eng' dir='ltr'><em>chlorophenolicum</em></span> <span class='ocrx_word' id='word_1_268' title='bbox 1012 1273 1076 1290; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_269' title='bbox 1085 1271 1159 1290; x_wconf 80' lang='eng' dir='ltr'><em>33790T</em></span> <span class='ocrx_word' id='word_1_270' title='bbox 1168 1273 1263 1295; x_wconf 86' lang='eng' dir='ltr'>(X87161)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_103' title="bbox 477 1303 980 1327; baseline 0.002 -5"><span class='ocrx_word' id='word_1_271' title='bbox 477 1311 515 1313; x_wconf 90' lang='eng'>—</span> <span class='ocrx_word' id='word_1_272' title='bbox 522 1305 691 1327; x_wconf 77' lang='eng' dir='ltr'><em>Sphingosinicella</em></span> <span class='ocrx_word' id='word_1_273' title='bbox 700 1305 735 1323; x_wconf 85' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_274' title='bbox 743 1303 843 1323; x_wconf 79' lang='eng' dir='ltr'><em>KSL-125T</em></span> <span class='ocrx_word' id='word_1_275' title='bbox 851 1305 980 1327; x_wconf 77' lang='eng' dir='ltr'><em>(DQOB7403)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_71' title="bbox 245 1332 477 1340">
+    <p class='ocr_par' dir='ltr' id='par_1_71' title="bbox 245 1332 477 1340">
+     <span class='ocr_line' id='line_1_104' title="bbox 245 1332 477 1340; baseline 0 349"><span class='ocrx_word' id='word_1_276' title='bbox 245 1332 477 1340; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_72' title="bbox 473 1214 482 1362">
+    <p class='ocr_par' dir='ltr' id='par_1_72' title="bbox 473 1214 482 1362">
+     <span class='ocr_line' id='line_1_105' title="bbox 473 1214 482 1362; baseline 0 327"><span class='ocrx_word' id='word_1_277' title='bbox 473 1214 482 1362; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_73' title="bbox 439 1342 471 1359">
+    <p class='ocr_par' dir='ltr' id='par_1_73' title="bbox 439 1343 471 1358">
+     <span class='ocr_line' id='line_1_106' title="bbox 439 1343 471 1358; baseline 0 0"><span class='ocrx_word' id='word_1_278' title='bbox 439 1343 471 1358; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_74' title="bbox 466 1330 1083 1382">
+    <p class='ocr_par' dir='ltr' id='par_1_74' title="bbox 466 1337 1083 1382">
+     <span class='ocr_line' id='line_1_107' title="bbox 505 1337 1083 1360; baseline 0 -5"><span class='ocrx_word' id='word_1_279' title='bbox 505 1337 674 1360; x_wconf 73' lang='eng' dir='ltr'><em>Sphingosinicella</em></span> <span class='ocrx_word' id='word_1_280' title='bbox 683 1338 877 1360; x_wconf 79' lang='eng' dir='ltr'><em>microcystinivorans</em></span> <span class='ocrx_word' id='word_1_281' title='bbox 886 1338 949 1355; x_wconf 82' lang='eng' dir='ltr'>MDBZ</span> <span class='ocrx_word' id='word_1_282' title='bbox 958 1337 1083 1360; x_wconf 78' lang='eng' dir='ltr'><em>(ABZ19940)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_108' title="bbox 466 1367 488 1382; baseline 0 0"><span class='ocrx_word' id='word_1_283' title='bbox 466 1367 488 1382; x_wconf 80' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_75' title="bbox 514 1363 1086 1399">
+    <p class='ocr_par' dir='ltr' id='par_1_75' title="bbox 514 1368 1086 1392">
+     <span class='ocr_line' id='line_1_109' title="bbox 514 1368 1086 1392; baseline 0 -5"><span class='ocrx_word' id='word_1_284' title='bbox 514 1370 683 1392; x_wconf 79' lang='eng' dir='ltr'><em>Sphingosinicella</em></span> <span class='ocrx_word' id='word_1_285' title='bbox 691 1370 865 1392; x_wconf 79' lang='eng' dir='ltr'><em>xenopeptidilytica</em></span> <span class='ocrx_word' id='word_1_286' title='bbox 874 1368 953 1387; x_wconf 65' lang='eng' dir='ltr'><em>3»2W4T</em></span> <span class='ocrx_word' id='word_1_287' title='bbox 961 1370 1086 1392; x_wconf 83' lang='eng' dir='ltr'><em>(AY950663)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_76' title="bbox 279 1396 899 1433">
+    <p class='ocr_par' dir='ltr' id='par_1_76' title="bbox 279 1400 899 1425">
+     <span class='ocr_line' id='line_1_110' title="bbox 279 1400 899 1425; baseline 0 -5"><span class='ocrx_word' id='word_1_288' title='bbox 279 1408 414 1410; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_289' title='bbox 420 1402 609 1424; x_wconf 75' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_290' title='bbox 617 1407 662 1420; x_wconf 81' lang='eng' dir='ltr'><em>rose</em></span> <span class='ocrx_word' id='word_1_291' title='bbox 671 1402 710 1420; x_wconf 95' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_292' title='bbox 721 1400 793 1420; x_wconf 86' lang='eng' dir='ltr'><em>14222T</em></span> <span class='ocrx_word' id='word_1_293' title='bbox 802 1402 899 1425; x_wconf 76' lang='eng'><em>(013945)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_77' title="bbox 169 1434 530 1447">
+    <p class='ocr_par' dir='ltr' id='par_1_77' title="bbox 169 1434 530 1447">
+     <span class='ocr_line' id='line_1_111' title="bbox 169 1434 530 1447; baseline 0 242"><span class='ocrx_word' id='word_1_294' title='bbox 169 1434 530 1447; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_78' title="bbox 141 1594 215 1598">
+    <p class='ocr_par' dir='ltr' id='par_1_78' title="bbox 141 1594 215 1598">
+     <span class='ocr_line' id='line_1_112' title="bbox 141 1594 215 1598; baseline 0 91"><span class='ocrx_word' id='word_1_295' title='bbox 141 1594 215 1598; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_79' title="bbox 212 1571 214 1621">
+    <p class='ocr_par' dir='ltr' id='par_1_79' title="bbox 212 1571 214 1621">
+     <span class='ocr_line' id='line_1_113' title="bbox 212 1571 214 1621; baseline 0 68"><span class='ocrx_word' id='word_1_296' title='bbox 212 1571 214 1621; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_80' title="bbox 186 1600 208 1616">
+    <p class='ocr_par' dir='ltr' id='par_1_80' title="bbox 186 1601 208 1616">
+     <span class='ocr_line' id='line_1_114' title="bbox 186 1601 208 1616; baseline 0 0"><span class='ocrx_word' id='word_1_297' title='bbox 186 1601 208 1616; x_wconf 83' lang='eng'><em>69</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_81' title="bbox 277 1408 279 1471">
+    <p class='ocr_par' dir='ltr' id='par_1_81' title="bbox 277 1408 279 1471">
+     <span class='ocr_line' id='line_1_115' title="bbox 277 1408 279 1471; baseline 0 218"><span class='ocrx_word' id='word_1_298' title='bbox 277 1408 279 1471; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_82' title="bbox 254 1446 276 1461">
+    <p class='ocr_par' dir='ltr' id='par_1_82' title="bbox 254 1446 276 1461">
+     <span class='ocr_line' id='line_1_116' title="bbox 254 1446 276 1461; baseline 0 0"><span class='ocrx_word' id='word_1_299' title='bbox 254 1446 276 1461; x_wconf 80' lang='eng'>89</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_83' title="bbox 536 1429 1105 1463">
+    <p class='ocr_par' dir='ltr' id='par_1_83' title="bbox 536 1433 1105 1457">
+     <span class='ocr_line' id='line_1_117' title="bbox 536 1433 1105 1457; baseline 0 -5"><span class='ocrx_word' id='word_1_300' title='bbox 536 1435 725 1457; x_wconf 81' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_301' title='bbox 733 1435 853 1457; x_wconf 73' lang='eng' dir='ltr'><em>capsulatum</em></span> <span class='ocrx_word' id='word_1_302' title='bbox 862 1434 916 1452; x_wconf 91' lang='eng' dir='ltr'><em>GIFU</em></span> <span class='ocrx_word' id='word_1_303' title='bbox 927 1433 1000 1452; x_wconf 82' lang='eng' dir='ltr'><em>11526T</em></span> <span class='ocrx_word' id='word_1_304' title='bbox 1008 1435 1105 1457; x_wconf 86' lang='eng' dir='ltr'>(D16147)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_84' title="bbox 277 1467 397 1473">
+    <p class='ocr_par' dir='ltr' id='par_1_84' title="bbox 277 1467 397 1473">
+     <span class='ocr_line' id='line_1_118' title="bbox 277 1467 397 1473; baseline 0 216"><span class='ocrx_word' id='word_1_305' title='bbox 277 1467 397 1473; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_85' title="bbox 212 1619 266 1621">
+    <p class='ocr_par' dir='ltr' id='par_1_85' title="bbox 212 1619 266 1621">
+     <span class='ocr_line' id='line_1_119' title="bbox 212 1619 266 1621; baseline 0 68"><span class='ocrx_word' id='word_1_306' title='bbox 212 1619 266 1621; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_86' title="bbox 264 1603 266 1637">
+    <p class='ocr_par' dir='ltr' id='par_1_86' title="bbox 264 1603 266 1637">
+     <span class='ocr_line' id='line_1_120' title="bbox 264 1603 266 1637; baseline 0 52"><span class='ocrx_word' id='word_1_307' title='bbox 264 1603 266 1637; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_87' title="bbox 404 1473 475 1475">
+    <p class='ocr_par' dir='ltr' id='par_1_87' title="bbox 404 1473 475 1475">
+     <span class='ocr_line' id='line_1_121' title="bbox 404 1473 475 1475; baseline 0 214"><span class='ocrx_word' id='word_1_308' title='bbox 404 1473 475 1475; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_88' title="bbox 394 1441 398 1499">
+    <p class='ocr_par' dir='ltr' id='par_1_88' title="bbox 394 1441 398 1499">
+     <span class='ocr_line' id='line_1_122' title="bbox 394 1441 398 1499; baseline 0 190"><span class='ocrx_word' id='word_1_309' title='bbox 394 1441 398 1499; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_89' title="bbox 366 1460 1092 1529">
+    <p class='ocr_par' dir='ltr' id='par_1_89' title="bbox 367 1465 1091 1522">
+     <span class='ocr_line' id='line_1_123' title="bbox 367 1465 1091 1491; baseline 0 -7"><span class='ocrx_word' id='word_1_310' title='bbox 367 1476 389 1491; x_wconf 74' lang='eng'>99</span> <span class='ocrx_word' id='word_1_311' title='bbox 480 1467 669 1489; x_wconf 84' lang='eng' dir='ltr'><em>Novosphingnbium</em></span> <span class='ocrx_word' id='word_1_312' title='bbox 677 1467 822 1484; x_wconf 86' lang='eng' dir='ltr'><em>subterraneum</em></span> <span class='ocrx_word' id='word_1_313' title='bbox 831 1467 899 1484; x_wconf 84' lang='eng' dir='ltr'><em>SMCC</em></span> <span class='ocrx_word' id='word_1_314' title='bbox 909 1465 985 1484; x_wconf 74' lang='eng' dir='ltr'><em>30478T</em></span> <span class='ocrx_word' id='word_1_315' title='bbox 994 1467 1091 1489; x_wconf 82' lang='eng' dir='ltr'>(U20773)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_124' title="bbox 467 1499 1089 1522; baseline 0 -5"><span class='ocrx_word' id='word_1_316' title='bbox 467 1499 656 1522; x_wconf 84' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_317' title='bbox 664 1499 831 1517; x_wconf 76' lang='eng' dir='ltr'><em>aromatic/vorans</em></span> <span class='ocrx_word' id='word_1_318' title='bbox 839 1499 907 1517; x_wconf 87' lang='eng' dir='ltr'><em>SMCC</em></span> <span class='ocrx_word' id='word_1_319' title='bbox 916 1499 982 1517; x_wconf 82' lang='eng' dir='ltr'>B0695</span> <span class='ocrx_word' id='word_1_320' title='bbox 991 1499 1089 1522; x_wconf 85' lang='eng' dir='ltr'>(U20755)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_90' title="bbox 416 1521 1070 1562">
+    <p class='ocr_par' dir='ltr' id='par_1_90' title="bbox 416 1529 1070 1554">
+     <span class='ocr_line' id='line_1_125' title="bbox 416 1529 1070 1554; baseline 0.002 -5"><span class='ocrx_word' id='word_1_321' title='bbox 416 1529 439 1545; x_wconf 80' lang='eng'>99</span> <span class='ocrx_word' id='word_1_322' title='bbox 454 1532 642 1554; x_wconf 88' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_323' title='bbox 650 1532 818 1550; x_wconf 80' lang='eng' dir='ltr'><em>aromaticivorans</em></span> <span class='ocrx_word' id='word_1_324' title='bbox 826 1532 894 1550; x_wconf 85' lang='eng' dir='ltr'><em>SMCC</em></span> <span class='ocrx_word' id='word_1_325' title='bbox 903 1530 965 1550; x_wconf 70' lang='eng' dir='ltr'><em>F199T</em></span> <span class='ocrx_word' id='word_1_326' title='bbox 974 1532 1070 1554; x_wconf 83' lang='eng' dir='ltr'>(U20756)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_91' title="bbox 401 1473 405 1524">
+    <p class='ocr_par' dir='ltr' id='par_1_91' title="bbox 401 1473 405 1524">
+     <span class='ocr_line' id='line_1_126' title="bbox 401 1473 405 1524; baseline 0 165"><span class='ocrx_word' id='word_1_327' title='bbox 401 1473 405 1524; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_92' title="bbox 214 1558 949 1628">
+    <p class='ocr_par' dir='ltr' id='par_1_92' title="bbox 214 1563 949 1619">
+     <span class='ocr_line' id='line_1_127' title="bbox 214 1563 856 1587; baseline 0 -5"><span class='ocrx_word' id='word_1_328' title='bbox 214 1571 380 1573; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_329' title='bbox 386 1565 526 1587; x_wconf 80' lang='eng' dir='ltr'><em>Sphingopyxis</em></span> <span class='ocrx_word' id='word_1_330' title='bbox 534 1565 594 1582; x_wconf 76' lang='eng' dir='ltr'><em>terrae</em></span> <span class='ocrx_word' id='word_1_331' title='bbox 603 1564 668 1582; x_wconf 87' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_332' title='bbox 679 1563 751 1582; x_wconf 79' lang='eng' dir='ltr'><em>15098T</em></span> <span class='ocrx_word' id='word_1_333' title='bbox 760 1565 856 1587; x_wconf 88' lang='eng' dir='ltr'>(D13727)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_128' title="bbox 266 1597 949 1619; baseline 0 -5"><span class='ocrx_word' id='word_1_334' title='bbox 266 1603 441 1605; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_335' title='bbox 448 1597 587 1619; x_wconf 82' lang='eng' dir='ltr'><em>Sphingopyxis</em></span> <span class='ocrx_word' id='word_1_336' title='bbox 595 1597 756 1619; x_wconf 73' lang='eng' dir='ltr'><em>macrogoltabida</em></span> <span class='ocrx_word' id='word_1_337' title='bbox 765 1597 812 1614; x_wconf 92' lang='eng' dir='ltr'><em>EY-1</em></span> <span class='ocrx_word' id='word_1_338' title='bbox 824 1597 949 1619; x_wconf 77' lang='eng' dir='ltr'><em>(A8255383)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_93' title="bbox 609 1623 1160 1659">
+    <p class='ocr_par' dir='ltr' id='par_1_93' title="bbox 610 1627 1159 1652">
+     <span class='ocr_line' id='line_1_129' title="bbox 610 1627 1159 1652; baseline 0 -5"><span class='ocrx_word' id='word_1_339' title='bbox 610 1629 750 1652; x_wconf 71' lang='eng' dir='ltr'><em>Sphingopyxis</em></span> <span class='ocrx_word' id='word_1_340' title='bbox 757 1629 923 1652; x_wconf 82' lang='eng' dir='ltr'><em>baekryungensis</em></span> <span class='ocrx_word' id='word_1_341' title='bbox 931 1627 1025 1647; x_wconf 81' lang='eng' dir='ltr'><em>SW-150T</em></span> <span class='ocrx_word' id='word_1_342' title='bbox 1034 1629 1159 1652; x_wconf 86' lang='eng' dir='ltr'><em>(AY608604)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_94' title="bbox 324 1656 803 1689">
+    <p class='ocr_par' dir='ltr' id='par_1_94' title="bbox 324 1660 803 1684">
+     <span class='ocr_line' id='line_1_130' title="bbox 324 1660 803 1684; baseline 0 -5"><span class='ocrx_word' id='word_1_343' title='bbox 324 1662 468 1684; x_wconf 79' lang='eng' dir='ltr'><em>Erythrobacter</em></span> <span class='ocrx_word' id='word_1_344' title='bbox 474 1662 543 1684; x_wconf 82' lang='eng' dir='ltr'><em>Iongus</em></span> <span class='ocrx_word' id='word_1_345' title='bbox 551 1662 601 1679; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_346' title='bbox 610 1660 672 1679; x_wconf 78' lang='eng' dir='ltr'><em>6997T</em></span> <span class='ocrx_word' id='word_1_347' title='bbox 680 1662 803 1684; x_wconf 81' lang='eng' dir='ltr'><em>(AF465835)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000265-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000265-0-000.pbm.png
new file mode 100644
index 00000000..98860bcc
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000265-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000265-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000265-0-000.pbm.png.hocr
new file mode 100644
index 00000000..73a97d48
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000265-0-000.pbm.png.hocr
@@ -0,0 +1,114 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000265-0-000.pbm.png"; bbox 0 0 1124 662; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 402 0 1049 73">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 402 0 1049 73">
+     <span class='ocr_line' id='line_1_1' title="bbox 402 0 957 27; baseline 0.002 -6"><span class='ocrx_word' id='word_1_1' title='bbox 402 1 586 27; x_wconf 83' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 593 1 646 27; x_wconf 86' lang='eng' dir='ltr'><em>rigui</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 653 0 795 22; x_wconf 84' lang='eng' dir='ltr'><em>WPCB131T</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 804 1 957 27; x_wconf 72' lang='eng' dir='ltr'><em>(DQOBQBBQ)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 444 45 1049 73; baseline 0 -6"><span class='ocrx_word' id='word_1_5' title='bbox 444 46 628 73; x_wconf 84' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 633 46 794 73; x_wconf 84' lang='eng' dir='ltr'><em>Xinjiangensis</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 802 45 887 73; x_wconf 90' lang='eng' dir='ltr'><em>X2-1gT</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 897 46 1049 72; x_wconf 77' lang='eng' dir='ltr'>(D0888329)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 229 5 435 423">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 229 5 435 423">
+     <span class='ocr_line' id='line_1_3' title="bbox 315 5 402 40; baseline 0 622"><span class='ocrx_word' id='word_1_9' title='bbox 315 5 402 40; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 313 40 435 176; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 313 40 435 176; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 263 176 425 266; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 263 176 425 266; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 229 266 419 357; baseline 0 -45"><span class='ocrx_word' id='word_1_12' title='bbox 229 266 419 357; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 229 357 430 423; baseline 0 239"><span class='ocrx_word' id='word_1_13' title='bbox 229 357 430 423; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 128 91 1124 662">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 128 91 1124 662">
+     <span class='ocr_line' id='line_1_8' title="bbox 437 91 1044 118; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 437 91 621 118; x_wconf 82' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 627 91 840 118; x_wconf 78' lang='eng' dir='ltr'><em>gel/purpurascens</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 849 91 921 118; x_wconf 84' lang='eng' dir='ltr'><em>T&gt;&lt;g1T</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 931 91 1044 117; x_wconf 85' lang='eng' dir='ltr'>(Y18836)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 417 136 1124 163; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 417 137 601 163; x_wconf 83' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 607 137 805 163; x_wconf 85' lang='eng' dir='ltr'><em>psychrotolerans</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 813 137 890 157; x_wconf 80' lang='eng' dir='ltr'><em>Tibet—I</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 895 137 931 157; x_wconf 96' lang='eng' dir='ltr'>|U1</span> <span class='ocrx_word' id='word_1_22' title='bbox 939 136 962 157; x_wconf 92' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 972 136 1124 163; x_wconf 88' lang='eng' dir='ltr'><em>(DQ177475)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 429 181 1036 208; baseline -0.002 -5"><span class='ocrx_word' id='word_1_24' title='bbox 429 182 613 208; x_wconf 82' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 620 182 748 208; x_wconf 88' lang='eng' dir='ltr'><em>aerophilus</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 759 181 884 203; x_wconf 87' lang='eng' dir='ltr'><em>|/26—Cor1T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 894 182 1036 208; x_wconf 85' lang='eng' dir='ltr'><em>(AJ276901)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 414 226 1077 253; baseline 0 -5"><span class='ocrx_word' id='word_1_28' title='bbox 414 227 598 253; x_wconf 84' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 604 227 767 248; x_wconf 80' lang='eng' dir='ltr'><em>actinosc/erus</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 776 227 857 248; x_wconf 90' lang='eng' dir='ltr'><em>CCUG</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 867 226 954 248; x_wconf 81' lang='eng' dir='ltr'><em>39621T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 964 227 1077 253; x_wconf 86' lang='eng' dir='ltr'><em>(Y17356)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 405 272 953 299; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 405 272 589 299; x_wconf 79' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 596 272 751 293; x_wconf 83' lang='eng' dir='ltr'><em>chitinivorans</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 759 272 830 293; x_wconf 78' lang='eng' dir='ltr'><em>Tx&lt;31T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 840 272 953 298; x_wconf 90' lang='eng' dir='ltr'><em>(Y18837)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 419 317 1021 344; baseline 0 -5"><span class='ocrx_word' id='word_1_37' title='bbox 419 318 603 344; x_wconf 87' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 610 318 771 339; x_wconf 74' lang='eng' dir='ltr'><em>norwr&#39;chens/s</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 781 317 868 339; x_wconf 88' lang='eng' dir='ltr'><em>NS/50T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 878 318 1021 344; x_wconf 82' lang='eng' dir='ltr'><em>(AJ549285)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 434 362 1046 389; baseline 0 -5"><span class='ocrx_word' id='word_1_41' title='bbox 434 363 618 389; x_wconf 84' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 625 363 811 384; x_wconf 84' lang='eng' dir='ltr'><em>roseosa/ivarius</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 819 362 923 384; x_wconf 87' lang='eng' dir='ltr'><em>AA—718T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 933 363 1046 389; x_wconf 88' lang='eng' dir='ltr'>(Y18833)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 433 408 909 435; baseline 0 -6"><span class='ocrx_word' id='word_1_45' title='bbox 433 409 617 435; x_wconf 83' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 624 409 666 429; x_wconf 88' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 674 408 752 429; x_wconf 76' lang='eng' dir='ltr'><em>PB17T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 761 409 909 435; x_wconf 88' lang='eng' dir='ltr'><em>(AB251884)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 128 453 735 484; baseline 0 -10"><span class='ocrx_word' id='word_1_49' title='bbox 128 463 153 481; x_wconf 75' lang='eng'>86</span> <span class='ocrx_word' id='word_1_50' title='bbox 297 462 390 484; x_wconf 70' lang='eng'><em>&#39;—</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 400 453 477 474; x_wconf 85' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 487 453 577 474; x_wconf 79' lang='eng' dir='ltr'><em>ZLB-3T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 587 454 735 480; x_wconf 85' lang='eng' dir='ltr'><em>(EU325941)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 252 488 963 525; baseline 0.001 -6"><span class='ocrx_word' id='word_1_54' title='bbox 252 491 289 509; x_wconf 65' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 297 488 392 510; x_wconf 59' lang='eng'><strong>‘—</strong></span> <span class='ocrx_word' id='word_1_56' title='bbox 399 499 583 525; x_wconf 86' lang='eng' dir='ltr'><em>Hymenobacter</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 590 499 699 520; x_wconf 84' lang='eng' dir='ltr'><em>ocellatus</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 709 499 758 525; x_wconf 85' lang='eng' dir='ltr'><em>Myx</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 767 498 840 520; x_wconf 88' lang='eng' dir='ltr'><em>2105T</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 850 499 963 525; x_wconf 89' lang='eng' dir='ltr'>(Y18835)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 383 543 973 570; baseline 0 -5"><span class='ocrx_word' id='word_1_61' title='bbox 383 544 526 565; x_wconf 75' lang='eng' dir='ltr'><em>Pant/beater</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 532 544 660 565; x_wconf 83' lang='eng' dir='ltr'><em>actiniarum</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 671 544 732 565; x_wconf 88' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 743 543 815 565; x_wconf 84' lang='eng' dir='ltr'>6156T</span> <span class='ocrx_word' id='word_1_65' title='bbox 825 544 973 570; x_wconf 86' lang='eng' dir='ltr'><em>(AY989908)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 291 588 889 616; baseline 0 -5"><span class='ocrx_word' id='word_1_66' title='bbox 291 589 469 611; x_wconf 85' lang='eng' dir='ltr'><em>Adhaeribacter</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 475 589 594 616; x_wconf 86' lang='eng' dir='ltr'><em>aquaticus</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 604 588 736 611; x_wconf 90' lang='eng' dir='ltr'><em>MBRG1.5T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 746 589 889 616; x_wconf 87' lang='eng' dir='ltr'><em>(AJ626894)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 439 634 1044 662; baseline 0 -6"><span class='ocrx_word' id='word_1_70' title='bbox 439 635 629 656; x_wconf 79' lang='eng' dir='ltr'><em>Flavobacterium</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 639 635 735 662; x_wconf 79' lang='eng' dir='ltr'><em>aquati/e</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 744 635 819 656; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 831 634 917 656; x_wconf 82' lang='eng' dir='ltr'><em>11947T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 927 635 1044 662; x_wconf 81' lang='eng' dir='ltr'><em>(M62797)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 93 133 323 153">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 93 133 323 153">
+     <span class='ocr_line' id='line_1_21' title="bbox 93 133 323 153; baseline 0.009 -2"><span class='ocrx_word' id='word_1_75' title='bbox 93 133 138 151; x_wconf 85' lang='eng'>0.02</span> <span class='ocrx_word' id='word_1_76' title='bbox 298 135 323 153; x_wconf 82' lang='eng'><em>59</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 188 398 225 416">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 188 398 225 416">
+     <span class='ocr_line' id='line_1_22' title="bbox 188 398 225 416; baseline 0 0"><span class='ocrx_word' id='word_1_77' title='bbox 188 398 225 416; x_wconf 91' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 158 422 233 424">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 158 422 233 424">
+     <span class='ocr_line' id='line_1_23' title="bbox 158 422 233 424; baseline 0 238"><span class='ocrx_word' id='word_1_78' title='bbox 158 422 233 424; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 231 359 233 487">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 231 359 233 487">
+     <span class='ocr_line' id='line_1_24' title="bbox 231 359 233 487; baseline 0 175"><span class='ocrx_word' id='word_1_79' title='bbox 231 359 233 487; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 129 485 296 489">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 129 485 296 489">
+     <span class='ocr_line' id='line_1_25' title="bbox 129 485 296 489; baseline 0 173"><span class='ocrx_word' id='word_1_80' title='bbox 129 485 296 489; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 158 422 160 552">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 158 422 160 552">
+     <span class='ocr_line' id='line_1_26' title="bbox 158 422 160 552; baseline 0 110"><span class='ocrx_word' id='word_1_81' title='bbox 158 422 160 552; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 0 483 435 650">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 0 483 435 650">
+     <span class='ocr_line' id='line_1_27' title="bbox 0 483 133 543; baseline 0 119"><span class='ocrx_word' id='word_1_82' title='bbox 0 483 133 543; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 0 543 289 583; baseline 0 79"><span class='ocrx_word' id='word_1_83' title='bbox 0 543 289 583; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 0 583 435 650; baseline 0 0"><span class='ocrx_word' id='word_1_84' title='bbox 0 583 435 650; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000349-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000349-0-001.pbm.png
new file mode 100644
index 00000000..0bdaa1c0
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000349-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000349-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000349-0-001.pbm.png.hocr
new file mode 100644
index 00000000..276632cb
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000349-0-001.pbm.png.hocr
@@ -0,0 +1,143 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000349-0-001.pbm.png"; bbox 0 0 1598 1112; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 595 0 1242 28">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 595 0 1242 28">
+     <span class='ocr_line' id='line_1_1' title="bbox 595 0 1242 28; baseline 0.002 -5"><span class='ocrx_word' id='word_1_1' title='bbox 595 3 777 24; x_wconf 85' lang='eng' dir='ltr'><em>Anaerotruncus</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 787 3 923 24; x_wconf 84' lang='eng' dir='ltr'><em>colihominis</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 934 3 992 24; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_4' title='bbox 1005 3 1075 23; x_wconf 86' lang='eng'><strong>17241</strong></span> <span class='ocrx_word' id='word_1_5' title='bbox 1080 0 1090 13; x_wconf 78' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_6' title='bbox 1100 3 1242 28; x_wconf 82' lang='eng' dir='ltr'>(AJ315980)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 18 973 1033">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 18 973 1033">
+     <span class='ocr_line' id='line_1_2' title="bbox 123 18 701 125; baseline 0 -17"><span class='ocrx_word' id='word_1_7' title='bbox 123 18 701 125; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 114 125 701 192; baseline 0 -10"><span class='ocrx_word' id='word_1_8' title='bbox 114 125 701 192; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 114 192 701 252; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 114 192 701 252; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 114 252 536 315; baseline 0 -3"><span class='ocrx_word' id='word_1_10' title='bbox 114 252 536 315; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 75 315 666 381; baseline 0 -9"><span class='ocrx_word' id='word_1_11' title='bbox 75 315 666 381; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 75 381 719 450; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 75 381 719 450; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 80 450 825 513; baseline 0.009 -7"><span class='ocrx_word' id='word_1_13' title='bbox 80 450 825 513; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 80 513 825 579; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 80 513 825 579; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 0 579 821 645; baseline 0 0"><span class='ocrx_word' id='word_1_15' title='bbox 0 579 821 645; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 0 645 919 726; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 0 645 919 726; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 0 726 919 782; baseline 0.003 -3"><span class='ocrx_word' id='word_1_17' title='bbox 0 726 919 782; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 0 782 700 846; baseline 0 0"><span class='ocrx_word' id='word_1_18' title='bbox 0 782 700 846; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 0 846 756 909; baseline 0.009 -7"><span class='ocrx_word' id='word_1_19' title='bbox 0 846 756 909; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 0 909 756 965; baseline 0 147"><span class='ocrx_word' id='word_1_20' title='bbox 0 909 756 965; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 0 965 973 1033; baseline 0 79"><span class='ocrx_word' id='word_1_21' title='bbox 0 965 973 1033; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 155 43 1322 94">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 155 43 1322 94">
+     <span class='ocr_line' id='line_1_17' title="bbox 155 43 177 58; baseline 0 0"><span class='ocrx_word' id='word_1_22' title='bbox 155 43 177 58; x_wconf 77' lang='eng'><strong>73</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 612 66 1322 94; baseline 0 -5"><span class='ocrx_word' id='word_1_23' title='bbox 612 68 877 89; x_wconf 81' lang='eng' dir='ltr'><em>Acetanaerobacterium</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 887 68 1016 94; x_wconf 83' lang='eng' dir='ltr'><em>elongatum</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1024 68 1060 89; x_wconf 92' lang='eng' dir='ltr'><em>AS</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1073 66 1166 89; x_wconf 89' lang='eng' dir='ltr'><em>1.5012T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1176 68 1322 94; x_wconf 86' lang='eng' dir='ltr'>(AY518589)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 705 139 1570 168">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 705 139 1570 168">
+     <span class='ocr_line' id='line_1_19' title="bbox 705 139 1570 168; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 705 142 1078 168; x_wconf 83' lang='eng' dir='ltr'><em>Hydrogenoanaerobacterium</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1086 142 1301 162; x_wconf 84' lang='eng' dir='ltr'><em>saccharovorans</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1310 139 1412 162; x_wconf 88' lang='eng' dir='ltr'><em>SW512T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1422 142 1570 167; x_wconf 87' lang='eng' dir='ltr'>(EU158190)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 87 183 1520 231">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 87 183 1520 231">
+     <span class='ocr_line' id='line_1_20' title="bbox 87 183 109 199; baseline -0.045 0"><span class='ocrx_word' id='word_1_32' title='bbox 87 183 109 199; x_wconf 85' lang='eng'><em>62</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 702 205 1520 231; baseline -0.001 -5"><span class='ocrx_word' id='word_1_33' title='bbox 702 205 1075 231; x_wconf 87' lang='eng' dir='ltr'><em>Hydrogenoanaerobacterium</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1083 205 1298 226; x_wconf 84' lang='eng' dir='ltr'><em>saccharovorans</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1306 205 1362 225; x_wconf 94' lang='eng' dir='ltr'><strong>W72</strong></span> <span class='ocrx_word' id='word_1_36' title='bbox 1373 205 1520 231; x_wconf 87' lang='eng' dir='ltr'><em>(EU170433)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 540 266 1172 295">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 540 266 1172 295">
+     <span class='ocr_line' id='line_1_22' title="bbox 540 266 1172 295; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 540 268 677 289; x_wconf 86' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 687 269 890 295; x_wconf 78' lang='eng' dir='ltr'><em>methylpentosum</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 909 268 967 289; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 979 266 1050 289; x_wconf 80' lang='eng' dir='ltr'><em>5476T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 1060 269 1172 294; x_wconf 90' lang='eng' dir='ltr'><em>(Y18181)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 636 329 1598 822">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 670 329 1226 358">
+     <span class='ocr_line' id='line_1_23' title="bbox 670 329 1226 358; baseline 0 -5"><span class='ocrx_word' id='word_1_42' title='bbox 670 332 852 353; x_wconf 80' lang='eng' dir='ltr'><em>Ruminococcus</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 861 332 927 353; x_wconf 85' lang='eng' dir='ltr'><em>albus</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 935 332 1009 353; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1020 329 1107 353; x_wconf 89' lang='eng' dir='ltr'><em>27210T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1117 332 1226 358; x_wconf 85' lang='eng' dir='ltr'>(L76598)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 723 395 1359 424">
+     <span class='ocr_line' id='line_1_24' title="bbox 723 395 1359 424; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 723 398 904 418; x_wconf 81' lang='eng' dir='ltr'><em>Ruminococcus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 914 398 1060 418; x_wconf 84' lang='eng' dir='ltr'><em>ﬂavefaciens</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1068 398 1143 418; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1156 395 1241 418; x_wconf 80' lang='eng' dir='ltr'><em>19208T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 1251 398 1359 424; x_wconf 82' lang='eng' dir='ltr'><em>(L76603)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 758 464 1341 492">
+     <span class='ocr_line' id='line_1_25' title="bbox 758 464 1341 492; baseline 0 -5"><span class='ocrx_word' id='word_1_52' title='bbox 758 467 940 487; x_wconf 87' lang='eng' dir='ltr'><em>Ruminococcus</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 950 467 1041 487; x_wconf 85' lang='eng' dir='ltr'><em>cal/idus</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 1049 466 1124 487; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 1135 464 1223 487; x_wconf 88' lang='eng' dir='ltr'><em>27760T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 1232 467 1341 492; x_wconf 84' lang='eng' dir='ltr'>(L76596)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 835 527 1398 556">
+     <span class='ocr_line' id='line_1_26' title="bbox 835 527 1398 556; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 835 530 991 550; x_wconf 80' lang='eng' dir='ltr'><em>Eubaoterium</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1000 530 1098 550; x_wconf 85' lang='eng' dir='ltr'><em>siraeum</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 1106 530 1182 550; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 1192 527 1280 550; x_wconf 73' lang='eng' dir='ltr'><em>29066T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1290 530 1398 556; x_wconf 80' lang='eng' dir='ltr'><em>(L34625)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 825 593 1315 622">
+     <span class='ocr_line' id='line_1_27' title="bbox 825 593 1315 622; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 825 595 974 616; x_wconf 84' lang='eng' dir='ltr'><em>Anaerofi/um</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 984 595 1041 622; x_wconf 84' lang='eng' dir='ltr'><em>agile</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1052 595 1110 616; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_65' title='bbox 1120 593 1193 616; x_wconf 89' lang='eng' dir='ltr'><em>4272T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 1203 595 1315 622; x_wconf 85' lang='eng' dir='ltr'><em>(X98011)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 636 659 1598 822">
+     <span class='ocr_line' id='line_1_28' title="bbox 833 659 1447 688; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 833 662 982 682; x_wconf 87' lang='eng' dir='ltr'><em>Anaerofilum</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 991 662 1174 688; x_wconf 86' lang='eng' dir='ltr'><em>pentosovorans</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1185 662 1242 682; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1253 659 1325 682; x_wconf 89' lang='eng' dir='ltr'><em>7168T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 1335 662 1447 688; x_wconf 88' lang='eng' dir='ltr'>(X97852)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 923 740 1598 768; baseline -0.001 -5"><span class='ocrx_word' id='word_1_72' title='bbox 923 742 1134 763; x_wconf 75' lang='eng' dir='ltr'><em>Faeca/ibacterium</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1142 742 1270 768; x_wconf 85' lang='eng' dir='ltr'><em>prausnitzii</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 1276 742 1351 763; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 1361 740 1449 763; x_wconf 86' lang='eng' dir='ltr'><em>27768T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1457 742 1598 768; x_wconf 87' lang='eng' dir='ltr'>(AJ413954)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 636 793 1173 822; baseline 0 -6"><span class='ocrx_word' id='word_1_77' title='bbox 636 795 773 816; x_wconf 80' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 782 796 865 822; x_wconf 76' lang='eng' dir='ltr'><em>Ieptum</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 873 795 948 816; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 958 793 1046 816; x_wconf 82' lang='eng' dir='ltr'><em>29065T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 1056 796 1173 822; x_wconf 90' lang='eng' dir='ltr'>(M59095)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 701 860 1376 888">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 701 860 1376 888">
+     <span class='ocr_line' id='line_1_31' title="bbox 701 860 1376 888; baseline 0 -5"><span class='ocrx_word' id='word_1_82' title='bbox 701 862 837 883; x_wconf 67' lang='eng' dir='ltr'><em>ClostridIum</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 847 862 1069 888; x_wconf 67' lang='eng' dir='ltr'><em>sporosphaeroIdes</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 1076 862 1151 883; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1162 860 1249 883; x_wconf 89' lang='eng' dir='ltr'><em>25781T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1259 862 1332 888; x_wconf 88' lang='eng' dir='ltr'>(M591</span> <span class='ocrx_word' id='word_1_87' title='bbox 1340 862 1376 888; x_wconf 87' lang='eng'><em>16)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 757 923 1270 951">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 757 923 1270 951">
+     <span class='ocr_line' id='line_1_32' title="bbox 757 923 1270 951; baseline 0 -5"><span class='ocrx_word' id='word_1_88' title='bbox 757 925 894 946; x_wconf 78' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 904 926 1003 946; x_wconf 85' lang='eng' dir='ltr'><em>cellulosi</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1009 925 1046 946; x_wconf 89' lang='eng' dir='ltr'><em>AS</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1058 923 1152 946; x_wconf 78' lang='eng' dir='ltr'><em>1.1777T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1162 925 1270 951; x_wconf 86' lang='eng' dir='ltr'><em>(L09177)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 977 1005 1551 1034">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 977 1005 1551 1034">
+     <span class='ocr_line' id='line_1_33' title="bbox 977 1005 1551 1034; baseline 0 -6"><span class='ocrx_word' id='word_1_93' title='bbox 977 1007 1113 1028; x_wconf 79' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1123 1007 1243 1034; x_wconf 87' lang='eng' dir='ltr'><em>butyricum</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 1251 1007 1326 1028; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 1338 1005 1424 1028; x_wconf 78' lang='eng' dir='ltr'><em>19398T</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 1435 1007 1551 1033; x_wconf 84' lang='eng' dir='ltr'>(M59085)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 72 1073 110 1090">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 72 1073 110 1090">
+     <span class='ocr_line' id='line_1_34' title="bbox 72 1073 110 1090; baseline 0 0"><span class='ocrx_word' id='word_1_98' title='bbox 72 1073 110 1090; x_wconf 84' lang='eng'><em>2%</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-002.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-002.pbm.png
new file mode 100644
index 00000000..ca931e8b
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-002.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-002.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-002.pbm.png.hocr
new file mode 100644
index 00000000..324c6b15
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-002.pbm.png.hocr
@@ -0,0 +1,207 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000364-0-002.pbm.png"; bbox 0 0 1243 1187; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 10 6 484 1169">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 10 6 484 1169">
+     <span class='ocr_line' id='line_1_1' title="bbox 375 6 386 27; baseline 0 1160"><span class='ocrx_word' id='word_1_1' title='bbox 375 6 386 27; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 290 45 331 83; baseline 0 1104"><span class='ocrx_word' id='word_1_2' title='bbox 290 45 331 83; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 289 83 386 159; baseline 0 -39"><span class='ocrx_word' id='word_1_3' title='bbox 289 83 386 159; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 201 159 384 198; baseline 0 989"><span class='ocrx_word' id='word_1_4' title='bbox 201 159 384 198; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 194 198 415 274; baseline 0 -15"><span class='ocrx_word' id='word_1_5' title='bbox 194 198 415 274; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 102 274 407 353; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 102 274 407 353; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 102 353 471 416; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 102 353 471 416; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 68 429 366 505; baseline 0 -37"><span class='ocrx_word' id='word_1_8' title='bbox 68 429 366 505; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 34 505 342 568; baseline 0 -27"><span class='ocrx_word' id='word_1_9' title='bbox 34 505 342 568; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 10 568 271 621; baseline 0 -40"><span class='ocrx_word' id='word_1_10' title='bbox 10 568 271 621; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 10 621 355 658; baseline 0 529"><span class='ocrx_word' id='word_1_11' title='bbox 10 621 355 658; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 10 658 425 699; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 10 658 425 699; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 34 699 403 725; baseline 0 462"><span class='ocrx_word' id='word_1_13' title='bbox 34 699 403 725; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 34 725 484 754; baseline 0 433"><span class='ocrx_word' id='word_1_14' title='bbox 34 725 484 754; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 34 754 407 811; baseline 0 376"><span class='ocrx_word' id='word_1_15' title='bbox 34 754 407 811; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 34 811 478 833; baseline 0 354"><span class='ocrx_word' id='word_1_16' title='bbox 34 811 478 833; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 63 833 422 871; baseline 0 316"><span class='ocrx_word' id='word_1_17' title='bbox 63 833 422 871; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 63 871 384 889; baseline 0 298"><span class='ocrx_word' id='word_1_18' title='bbox 63 871 384 889; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 63 889 379 965; baseline 0 -56"><span class='ocrx_word' id='word_1_19' title='bbox 63 889 379 965; x_wconf 95' lang='eng' dir='ltr'>    </span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 99 965 340 1005; baseline 0 182"><span class='ocrx_word' id='word_1_20' title='bbox 99 965 340 1005; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 113 1005 399 1079; baseline 0 -15"><span class='ocrx_word' id='word_1_21' title='bbox 113 1005 399 1079; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 280 1079 397 1116; baseline 0 71"><span class='ocrx_word' id='word_1_22' title='bbox 280 1079 397 1116; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 330 1116 421 1169; baseline 0 0"><span class='ocrx_word' id='word_1_23' title='bbox 330 1116 421 1169; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 323 6 1136 455">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 391 6 823 32">
+     <span class='ocr_line' id='line_1_24' title="bbox 391 6 823 32; baseline 0 -5"><span class='ocrx_word' id='word_1_24' title='bbox 391 6 478 27; x_wconf 87' lang='eng' dir='ltr'>Human</span> <span class='ocrx_word' id='word_1_25' title='bbox 489 6 554 27; x_wconf 85' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_26' title='bbox 564 6 668 27; x_wconf 92' lang='eng' dir='ltr'>ADV244</span> <span class='ocrx_word' id='word_1_27' title='bbox 678 6 823 32; x_wconf 87' lang='eng' dir='ltr'>(EF468686)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 331 41 1002 107">
+     <span class='ocr_line' id='line_1_25' title="bbox 331 41 1002 69; baseline -0.003 -4"><span class='ocrx_word' id='word_1_28' title='bbox 331 49 365 65; x_wconf 82' lang='eng'>100</span> <span class='ocrx_word' id='word_1_29' title='bbox 388 43 601 69; x_wconf 85' lang='eng' dir='ltr'>Pyramidobacter</span> <span class='ocrx_word' id='word_1_30' title='bbox 607 43 736 69; x_wconf 87' lang='eng' dir='ltr'>piscolens</span> <span class='ocrx_word' id='word_1_31' title='bbox 744 41 845 64; x_wconf 89' lang='eng' dir='ltr'>W5455T</span> <span class='ocrx_word' id='word_1_32' title='bbox 854 43 1002 69; x_wconf 80' lang='eng' dir='ltr'>(EU309492)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 391 81 822 107; baseline 0.002 -6"><span class='ocrx_word' id='word_1_33' title='bbox 391 81 478 102; x_wconf 88' lang='eng' dir='ltr'>Human</span> <span class='ocrx_word' id='word_1_34' title='bbox 489 81 554 102; x_wconf 81' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_35' title='bbox 564 81 667 102; x_wconf 84' lang='eng' dir='ltr'>ADV746</span> <span class='ocrx_word' id='word_1_36' title='bbox 678 81 822 107; x_wconf 86' lang='eng' dir='ltr'>(EF468688)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 389 120 763 146">
+     <span class='ocr_line' id='line_1_27' title="bbox 389 120 763 146; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 389 120 439 140; x_wconf 88' lang='eng' dir='ltr'>Oral</span> <span class='ocrx_word' id='word_1_38' title='bbox 450 120 515 140; x_wconf 86' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_39' title='bbox 526 120 602 140; x_wconf 94' lang='eng' dir='ltr'>BA121</span> <span class='ocrx_word' id='word_1_40' title='bbox 617 120 763 146; x_wconf 89' lang='eng' dir='ltr'>(AY005444)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 385 159 1055 221">
+     <span class='ocr_line' id='line_1_28' title="bbox 385 159 1055 185; baseline -0.001 -5"><span class='ocrx_word' id='word_1_41' title='bbox 385 159 514 185; x_wconf 86' lang='eng' dir='ltr'>Orangutan</span> <span class='ocrx_word' id='word_1_42' title='bbox 524 159 597 180; x_wconf 85' lang='eng' dir='ltr'>faecal</span> <span class='ocrx_word' id='word_1_43' title='bbox 607 159 673 180; x_wconf 87' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_44' title='bbox 682 159 892 185; x_wconf 76' lang='eng' dir='ltr'>orang2_aai66011</span> <span class='ocrx_word' id='word_1_45' title='bbox 907 159 1055 185; x_wconf 85' lang='eng' dir='ltr'>(EU462629)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 386 195 899 221; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 386 195 464 221; x_wconf 87' lang='eng' dir='ltr'>Sheep</span> <span class='ocrx_word' id='word_1_47' title='bbox 475 200 550 215; x_wconf 94' lang='eng' dir='ltr'>rumen</span> <span class='ocrx_word' id='word_1_48' title='bbox 561 195 627 215; x_wconf 86' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_49' title='bbox 638 195 738 215; x_wconf 83' lang='eng' dir='ltr'>196.B09</span> <span class='ocrx_word' id='word_1_50' title='bbox 749 195 899 221; x_wconf 88' lang='eng' dir='ltr'>(DQ308572)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 419 235 934 261">
+     <span class='ocr_line' id='line_1_30' title="bbox 419 235 934 261; baseline 0.002 -6"><span class='ocrx_word' id='word_1_51' title='bbox 419 235 501 256; x_wconf 89' lang='eng' dir='ltr'>Bovine</span> <span class='ocrx_word' id='word_1_52' title='bbox 512 240 587 256; x_wconf 89' lang='eng' dir='ltr'>rumen</span> <span class='ocrx_word' id='word_1_53' title='bbox 598 235 663 256; x_wconf 86' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_54' title='bbox 675 235 775 261; x_wconf 90' lang='eng' dir='ltr'>P5_M14</span> <span class='ocrx_word' id='word_1_55' title='bbox 786 235 934 261; x_wconf 87' lang='eng' dir='ltr'>(EU382030)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 385 272 1136 380">
+     <span class='ocr_line' id='line_1_31' title="bbox 406 272 1136 298; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 406 272 484 293; x_wconf 88' lang='eng' dir='ltr'>Naked</span> <span class='ocrx_word' id='word_1_57' title='bbox 495 272 597 293; x_wconf 89' lang='eng' dir='ltr'>mole—rat</span> <span class='ocrx_word' id='word_1_58' title='bbox 605 272 678 293; x_wconf 86' lang='eng' dir='ltr'>faecal</span> <span class='ocrx_word' id='word_1_59' title='bbox 688 272 753 293; x_wconf 88' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_60' title='bbox 764 272 977 298; x_wconf 87' lang='eng' dir='ltr'>molerat_aai69f04</span> <span class='ocrx_word' id='word_1_61' title='bbox 988 272 1136 298; x_wconf 87' lang='eng' dir='ltr'>(EU463081)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 411 313 1005 340; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 411 313 485 334; x_wconf 88' lang='eng' dir='ltr'>Swine</span> <span class='ocrx_word' id='word_1_63' title='bbox 496 314 597 334; x_wconf 86' lang='eng' dir='ltr'>intestine</span> <span class='ocrx_word' id='word_1_64' title='bbox 607 314 673 334; x_wconf 87' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_65' title='bbox 683 314 850 340; x_wconf 83' lang='eng' dir='ltr'>p—4292-4Wa3</span> <span class='ocrx_word' id='word_1_66' title='bbox 861 314 1005 340; x_wconf 84' lang='eng' dir='ltr'>(AF371930)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 385 354 816 380; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 385 354 472 374; x_wconf 83' lang='eng' dir='ltr'>Human</span> <span class='ocrx_word' id='word_1_68' title='bbox 483 354 548 374; x_wconf 81' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_69' title='bbox 558 354 661 374; x_wconf 81' lang='eng' dir='ltr'>ADV403</span> <span class='ocrx_word' id='word_1_70' title='bbox 672 354 816 380; x_wconf 85' lang='eng' dir='ltr'>(EF468687)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 323 390 955 455">
+     <span class='ocr_line' id='line_1_34' title="bbox 474 390 955 416; baseline 0 -5"><span class='ocrx_word' id='word_1_71' title='bbox 474 390 560 411; x_wconf 85' lang='eng' dir='ltr'>Human</span> <span class='ocrx_word' id='word_1_72' title='bbox 571 390 637 411; x_wconf 85' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_73' title='bbox 649 390 709 411; x_wconf 91' lang='eng' dir='ltr'>RMA</span> <span class='ocrx_word' id='word_1_74' title='bbox 720 390 789 411; x_wconf 89' lang='eng'>14551</span> <span class='ocrx_word' id='word_1_75' title='bbox 804 390 955 416; x_wconf 91' lang='eng' dir='ltr'>(DQ412722)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 323 429 898 455; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 323 429 449 449; x_wconf 87' lang='eng' dir='ltr'>Anaerobic</span> <span class='ocrx_word' id='word_1_77' title='bbox 458 429 557 455; x_wconf 84' lang='eng' dir='ltr'>digestor</span> <span class='ocrx_word' id='word_1_78' title='bbox 566 429 631 449; x_wconf 87' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_79' title='bbox 640 429 773 449; x_wconf 88' lang='eng' dir='ltr'>vadinBBO2</span> <span class='ocrx_word' id='word_1_80' title='bbox 784 429 898 455; x_wconf 86' lang='eng' dir='ltr'>(U81658)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 298 465 929 528">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 298 465 929 528">
+     <span class='ocr_line' id='line_1_36' title="bbox 370 465 929 492; baseline 0 -6"><span class='ocrx_word' id='word_1_81' title='bbox 370 466 462 486; x_wconf 87' lang='eng' dir='ltr'>Hoatzin</span> <span class='ocrx_word' id='word_1_82' title='bbox 472 471 525 492; x_wconf 87' lang='eng' dir='ltr'>crop</span> <span class='ocrx_word' id='word_1_83' title='bbox 535 466 599 486; x_wconf 91' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_84' title='bbox 610 465 766 492; x_wconf 88' lang='eng' dir='ltr'>hoa61_11f11</span> <span class='ocrx_word' id='word_1_85' title='bbox 781 466 929 492; x_wconf 85' lang='eng' dir='ltr'>(EU344711)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 298 501 730 528; baseline -0.002 -6"><span class='ocrx_word' id='word_1_86' title='bbox 298 511 333 528; x_wconf 74' lang='eng'>100</span> <span class='ocrx_word' id='word_1_87' title='bbox 358 501 408 522; x_wconf 87' lang='eng' dir='ltr'>Oral</span> <span class='ocrx_word' id='word_1_88' title='bbox 419 501 485 522; x_wconf 84' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_89' title='bbox 497 501 574 527; x_wconf 86' lang='eng' dir='ltr'>E3_33</span> <span class='ocrx_word' id='word_1_90' title='bbox 585 501 730 527; x_wconf 85' lang='eng' dir='ltr'>(AF481216)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 271 538 1241 1030">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 346 538 883 567">
+     <span class='ocr_line' id='line_1_38' title="bbox 346 538 883 567; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 346 541 487 567; x_wconf 83' lang='eng' dir='ltr'>Jonquete/la</span> <span class='ocrx_word' id='word_1_92' title='bbox 497 541 598 567; x_wconf 80' lang='eng' dir='ltr'>anthropi</span> <span class='ocrx_word' id='word_1_93' title='bbox 605 541 663 561; x_wconf 93' lang='eng' dir='ltr'>ADV</span> <span class='ocrx_word' id='word_1_94' title='bbox 674 538 729 561; x_wconf 88' lang='eng' dir='ltr'>126T</span> <span class='ocrx_word' id='word_1_95' title='bbox 738 541 883 567; x_wconf 85' lang='eng' dir='ltr'>(EF436500)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 271 581 1037 685">
+     <span class='ocr_line' id='line_1_39' title="bbox 271 581 976 608; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 271 586 305 603; x_wconf 83' lang='eng'>100</span> <span class='ocrx_word' id='word_1_97' title='bbox 333 581 539 602; x_wconf 80' lang='eng' dir='ltr'>Dethiosu/fovibrio</span> <span class='ocrx_word' id='word_1_98' title='bbox 548 581 667 602; x_wconf 84' lang='eng' dir='ltr'>russensis</span> <span class='ocrx_word' id='word_1_99' title='bbox 677 581 734 602; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_100' title='bbox 747 581 821 602; x_wconf 90' lang='eng'>12577</span> <span class='ocrx_word' id='word_1_101' title='bbox 832 581 976 608; x_wconf 86' lang='eng' dir='ltr'>(AF234543)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 355 616 1037 644; baseline -0.001 -5"><span class='ocrx_word' id='word_1_102' title='bbox 355 618 561 639; x_wconf 82' lang='eng' dir='ltr'>Dethiosulfovibrio</span> <span class='ocrx_word' id='word_1_103' title='bbox 569 618 745 644; x_wconf 85' lang='eng' dir='ltr'>peptidovorans</span> <span class='ocrx_word' id='word_1_104' title='bbox 755 618 813 639; x_wconf 85' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_105' title='bbox 826 616 913 639; x_wconf 90' lang='eng' dir='ltr'>11002T</span> <span class='ocrx_word' id='word_1_106' title='bbox 923 618 1037 644; x_wconf 88' lang='eng' dir='ltr'>(U52817)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 430 657 962 685; baseline 0 -5"><span class='ocrx_word' id='word_1_107' title='bbox 430 659 574 685; x_wconf 80' lang='eng' dir='ltr'>Synergistes</span> <span class='ocrx_word' id='word_1_108' title='bbox 579 659 663 685; x_wconf 84' lang='eng' dir='ltr'>jonesii</span> <span class='ocrx_word' id='word_1_109' title='bbox 670 659 745 680; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_110' title='bbox 754 657 843 680; x_wconf 85' lang='eng' dir='ltr'>49833T</span> <span class='ocrx_word' id='word_1_111' title='bbox 853 659 962 685; x_wconf 85' lang='eng' dir='ltr'>(L08066)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 403 694 1183 797">
+     <span class='ocr_line' id='line_1_42' title="bbox 403 694 1101 722; baseline -0.001 -5"><span class='ocrx_word' id='word_1_112' title='bbox 403 701 438 717; x_wconf 85' lang='eng'>100</span> <span class='ocrx_word' id='word_1_113' title='bbox 495 696 691 717; x_wconf 85' lang='eng' dir='ltr'>Anaerobaculum</span> <span class='ocrx_word' id='word_1_114' title='bbox 701 696 781 717; x_wconf 88' lang='eng' dir='ltr'>mobile</span> <span class='ocrx_word' id='word_1_115' title='bbox 792 696 851 717; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_116' title='bbox 864 694 950 717; x_wconf 79' lang='eng' dir='ltr'>13181T</span> <span class='ocrx_word' id='word_1_117' title='bbox 960 696 1101 722; x_wconf 86' lang='eng' dir='ltr'>(AJ243189)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 488 730 1183 759; baseline 0 -6"><span class='ocrx_word' id='word_1_118' title='bbox 488 733 683 753; x_wconf 83' lang='eng' dir='ltr'>Anaerobacu/um</span> <span class='ocrx_word' id='word_1_119' title='bbox 694 733 892 753; x_wconf 80' lang='eng' dir='ltr'>thermoterrenum</span> <span class='ocrx_word' id='word_1_120' title='bbox 902 732 961 753; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_121' title='bbox 973 730 1060 753; x_wconf 78' lang='eng' dir='ltr'>13490T</span> <span class='ocrx_word' id='word_1_122' title='bbox 1070 733 1183 759; x_wconf 91' lang='eng' dir='ltr'>(U50711)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 407 768 934 797; baseline 0 -6"><span class='ocrx_word' id='word_1_123' title='bbox 407 771 561 797; x_wconf 85' lang='eng' dir='ltr'>Thermovirga</span> <span class='ocrx_word' id='word_1_124' title='bbox 570 771 627 791; x_wconf 68' lang='eng' dir='ltr'>lien/&#39;1&#39;</span> <span class='ocrx_word' id='word_1_125' title='bbox 635 768 773 791; x_wconf 79' lang='eng' dir='ltr'>Ca560314T</span> <span class='ocrx_word' id='word_1_126' title='bbox 783 770 934 797; x_wconf 88' lang='eng' dir='ltr'>(DQ071273)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 366 808 1241 951">
+     <span class='ocr_line' id='line_1_45' title="bbox 482 808 1241 836; baseline 0 -6"><span class='ocrx_word' id='word_1_127' title='bbox 482 810 714 831; x_wconf 84' lang='eng' dir='ltr'>Thermanaerovibrio</span> <span class='ocrx_word' id='word_1_128' title='bbox 723 810 935 831; x_wconf 80' lang='eng' dir='ltr'>acidaminovorans</span> <span class='ocrx_word' id='word_1_129' title='bbox 944 810 1002 831; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_130' title='bbox 1013 808 1087 831; x_wconf 78' lang='eng' dir='ltr'>6589T</span> <span class='ocrx_word' id='word_1_131' title='bbox 1096 810 1241 836; x_wconf 92' lang='eng' dir='ltr'>(AF071414)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 427 847 1102 875; baseline 0 -5"><span class='ocrx_word' id='word_1_132' title='bbox 427 849 591 870; x_wconf 86' lang='eng' dir='ltr'>Aminomonas</span> <span class='ocrx_word' id='word_1_133' title='bbox 599 849 780 875; x_wconf 84' lang='eng' dir='ltr'>paucivovorans</span> <span class='ocrx_word' id='word_1_134' title='bbox 790 849 848 870; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_135' title='bbox 862 847 948 870; x_wconf 80' lang='eng' dir='ltr'>12260T</span> <span class='ocrx_word' id='word_1_136' title='bbox 957 849 1102 875; x_wconf 88' lang='eng' dir='ltr'>(AFO72581)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 384 885 1075 914; baseline -0.001 -5"><span class='ocrx_word' id='word_1_137' title='bbox 384 888 586 909; x_wconf 84' lang='eng' dir='ltr'>Aminobacterium</span> <span class='ocrx_word' id='word_1_138' title='bbox 595 888 751 909; x_wconf 85' lang='eng' dir='ltr'>colombiense</span> <span class='ocrx_word' id='word_1_139' title='bbox 762 887 821 909; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_140' title='bbox 834 885 920 909; x_wconf 80' lang='eng' dir='ltr'>12261T</span> <span class='ocrx_word' id='word_1_141' title='bbox 930 888 1075 914; x_wconf 83' lang='eng' dir='ltr'>(AF069287)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 366 923 982 951; baseline -0.002 -5"><span class='ocrx_word' id='word_1_142' title='bbox 366 925 569 946; x_wconf 79' lang='eng' dir='ltr'>Aminobacterium</span> <span class='ocrx_word' id='word_1_143' title='bbox 578 925 659 946; x_wconf 85' lang='eng' dir='ltr'>mobile</span> <span class='ocrx_word' id='word_1_144' title='bbox 670 925 728 946; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_145' title='bbox 741 923 827 946; x_wconf 81' lang='eng' dir='ltr'>12262T</span> <span class='ocrx_word' id='word_1_146' title='bbox 838 925 982 951; x_wconf 88' lang='eng' dir='ltr'>(AFO73521)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 340 966 768 992">
+     <span class='ocr_line' id='line_1_49' title="bbox 340 966 768 992; baseline 0 -5"><span class='ocrx_word' id='word_1_147' title='bbox 340 971 375 987; x_wconf 87' lang='eng'>100</span> <span class='ocrx_word' id='word_1_148' title='bbox 406 966 456 987; x_wconf 92' lang='eng' dir='ltr'>Oral</span> <span class='ocrx_word' id='word_1_149' title='bbox 467 966 532 987; x_wconf 85' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_150' title='bbox 541 966 612 987; x_wconf 91' lang='eng' dir='ltr'>W028</span> <span class='ocrx_word' id='word_1_151' title='bbox 624 966 768 992; x_wconf 90' lang='eng' dir='ltr'>(AF125202)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 403 1003 832 1030">
+     <span class='ocr_line' id='line_1_50' title="bbox 403 1003 832 1030; baseline 0 -6"><span class='ocrx_word' id='word_1_152' title='bbox 403 1003 453 1024; x_wconf 91' lang='eng' dir='ltr'>Oral</span> <span class='ocrx_word' id='word_1_153' title='bbox 464 1004 529 1024; x_wconf 86' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_154' title='bbox 539 1003 677 1030; x_wconf 88' lang='eng' dir='ltr'>MCE3_120</span> <span class='ocrx_word' id='word_1_155' title='bbox 687 1004 832 1030; x_wconf 89' lang='eng' dir='ltr'>(AF481215)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 397 1040 774 1103">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 397 1040 774 1103">
+     <span class='ocr_line' id='line_1_51' title="bbox 405 1040 761 1066; baseline 0 -5"><span class='ocrx_word' id='word_1_156' title='bbox 405 1040 455 1061; x_wconf 93' lang='eng' dir='ltr'>Oral</span> <span class='ocrx_word' id='word_1_157' title='bbox 466 1040 531 1061; x_wconf 85' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_158' title='bbox 542 1040 605 1061; x_wconf 90' lang='eng' dir='ltr'>D084</span> <span class='ocrx_word' id='word_1_159' title='bbox 616 1040 761 1066; x_wconf 88' lang='eng' dir='ltr'>(AF125200)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 397 1077 774 1103; baseline -0.003 -5"><span class='ocrx_word' id='word_1_160' title='bbox 397 1077 448 1098; x_wconf 91' lang='eng' dir='ltr'>Oral</span> <span class='ocrx_word' id='word_1_161' title='bbox 459 1077 523 1098; x_wconf 85' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_162' title='bbox 535 1077 617 1098; x_wconf 90' lang='eng' dir='ltr'>BH007</span> <span class='ocrx_word' id='word_1_163' title='bbox 628 1077 774 1103; x_wconf 91' lang='eng' dir='ltr'>(AY005447)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 333 1115 809 1183">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 333 1115 809 1183">
+     <span class='ocr_line' id='line_1_53' title="bbox 411 1115 809 1142; baseline 0 -6"><span class='ocrx_word' id='word_1_164' title='bbox 411 1115 462 1136; x_wconf 91' lang='eng' dir='ltr'>Oral</span> <span class='ocrx_word' id='word_1_165' title='bbox 472 1116 537 1136; x_wconf 87' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_166' title='bbox 548 1115 654 1142; x_wconf 89' lang='eng' dir='ltr'>MCE7_5</span> <span class='ocrx_word' id='word_1_167' title='bbox 665 1116 809 1142; x_wconf 85' lang='eng' dir='ltr'>(AF481214)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 333 1156 803 1183; baseline -0.002 -5"><span class='ocrx_word' id='word_1_168' title='bbox 333 1156 355 1173; x_wconf 78' lang='eng'>92</span> <span class='ocrx_word' id='word_1_169' title='bbox 429 1157 479 1178; x_wconf 91' lang='eng' dir='ltr'>Oral</span> <span class='ocrx_word' id='word_1_170' title='bbox 489 1157 554 1178; x_wconf 89' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_171' title='bbox 565 1157 646 1178; x_wconf 80' lang='eng'>33062</span> <span class='ocrx_word' id='word_1_172' title='bbox 657 1157 803 1183; x_wconf 88' lang='eng' dir='ltr'>(AY005445)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 254 139 288 156">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 254 139 288 156">
+     <span class='ocr_line' id='line_1_55' title="bbox 254 139 288 156; baseline 0.029 -1"><span class='ocrx_word' id='word_1_173' title='bbox 254 139 288 156; x_wconf 86' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 177 246 200 262">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 177 246 200 262">
+     <span class='ocr_line' id='line_1_56' title="bbox 177 246 200 262; baseline -0.043 0"><span class='ocrx_word' id='word_1_174' title='bbox 177 246 200 262; x_wconf 91' lang='eng'>57</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 438 699 491 725">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 438 699 491 725">
+     <span class='ocr_line' id='line_1_57' title="bbox 438 699 491 725; baseline 0 -9"><span class='ocrx_word' id='word_1_175' title='bbox 438 699 491 725; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 7 1111 328 1159">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 7 1111 328 1159">
+     <span class='ocr_line' id='line_1_58' title="bbox 7 1111 328 1135; baseline 0 0"><span class='ocrx_word' id='word_1_176' title='bbox 7 1111 201 1127; x_wconf 81' lang='eng'>&#39;—&#39;</span> <span class='ocrx_word' id='word_1_177' title='bbox 294 1119 328 1135; x_wconf 86' lang='eng'>100</span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 75 1138 127 1159; baseline 0 0"><span class='ocrx_word' id='word_1_178' title='bbox 75 1138 127 1159; x_wconf 91' lang='eng'>0.05</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-004.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-004.pbm.png
new file mode 100644
index 00000000..db9336d3
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-004.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-004.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-004.pbm.png.hocr
new file mode 100644
index 00000000..2f8d37ae
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000364-0-004.pbm.png.hocr
@@ -0,0 +1,150 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000364-0-004.pbm.png"; bbox 0 0 1243 1035; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 6 21 31 39">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 6 21 31 39">
+     <span class='ocr_line' id='line_1_1' title="bbox 6 21 31 39; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 6 21 31 39; x_wconf 81' lang='eng'><em>68</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 37 87 62 105">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 37 87 62 105">
+     <span class='ocr_line' id='line_1_2' title="bbox 37 87 62 105; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 37 87 62 105; x_wconf 88' lang='eng'><em>83</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 116 230 243 275">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 116 230 243 275">
+     <span class='ocr_line' id='line_1_3' title="bbox 205 230 243 248; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 205 230 243 248; x_wconf 91' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 116 258 153 275; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 116 258 153 275; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 77 290 102 308">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 77 290 102 308">
+     <span class='ocr_line' id='line_1_5' title="bbox 77 290 102 308; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 77 290 102 308; x_wconf 82' lang='eng'>96</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 93 413 293 458">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 93 413 293 458">
+     <span class='ocr_line' id='line_1_6' title="bbox 256 413 293 431; baseline 0.027 -1"><span class='ocrx_word' id='word_1_6' title='bbox 256 413 293 431; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 93 440 117 458; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 93 440 117 458; x_wconf 84' lang='eng'><em>98</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 70 560 131 613">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 70 560 131 613">
+     <span class='ocr_line' id='line_1_8' title="bbox 70 560 95 577; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 70 560 95 577; x_wconf 95' lang='eng'>77</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 106 595 131 613; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 106 595 131 613; x_wconf 78' lang='eng'><em>99</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 94 704 177 749">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 94 704 177 749">
+     <span class='ocr_line' id='line_1_10' title="bbox 140 704 177 722; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 140 704 177 722; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 94 731 120 749; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 94 731 120 749; x_wconf 84' lang='eng'><em>97</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 54 813 160 848">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 54 813 160 848">
+     <span class='ocr_line' id='line_1_12' title="bbox 54 813 160 848; baseline 0 -17"><span class='ocrx_word' id='word_1_12' title='bbox 54 831 75 848; x_wconf 66' lang='eng'>71</span> <span class='ocrx_word' id='word_1_13' title='bbox 136 813 160 831; x_wconf 83' lang='eng'><em>98</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 95 892 132 910">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 95 892 132 910">
+     <span class='ocr_line' id='line_1_13' title="bbox 95 892 132 910; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 95 892 132 910; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 145 934 223 979">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 145 934 223 979">
+     <span class='ocr_line' id='line_1_14' title="bbox 145 934 169 951; baseline 0 0"><span class='ocrx_word' id='word_1_15' title='bbox 145 934 169 951; x_wconf 83' lang='eng'><em>99</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 185 961 223 979; baseline 0.026 -1"><span class='ocrx_word' id='word_1_16' title='bbox 185 961 223 979; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 113 1013 142 1031">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 113 1013 142 1031">
+     <span class='ocr_line' id='line_1_16' title="bbox 113 1013 142 1031; baseline 0 0"><span class='ocrx_word' id='word_1_17' title='bbox 113 1013 142 1031; x_wconf 87' lang='eng'>0.1</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 346 6 1239 983">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 346 6 1239 983">
+     <span class='ocr_line' id='line_1_17' title="bbox 346 6 1009 37; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 346 9 576 37; x_wconf 79' lang='eng' dir='ltr'><em>Pyramidobacter</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 581 9 720 37; x_wconf 90' lang='eng' dir='ltr'><em>piscolens</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 729 6 837 31; x_wconf 91' lang='eng' dir='ltr'><em>W5455T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 847 9 1009 37; x_wconf 89' lang='eng' dir='ltr'><em>(DU723069)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 380 45 849 73; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 380 45 482 73; x_wconf 86' lang='eng' dir='ltr'><em>‘Aquifex</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 493 45 607 67; x_wconf 79' lang='eng' dir='ltr'><em>aeolicus’</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 621 45 675 67; x_wconf 93' lang='eng' dir='ltr'>VF5</span> <span class='ocrx_word' id='word_1_25' title='bbox 686 45 849 73; x_wconf 84' lang='eng' dir='ltr'><em>(AACO7677)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 405 79 965 109; baseline 0.002 -6"><span class='ocrx_word' id='word_1_26' title='bbox 405 81 563 109; x_wconf 85' lang='eng' dir='ltr'><em>Thermotoga</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 573 81 687 104; x_wconf 81' lang='eng' dir='ltr'><em>maritime</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 699 79 792 104; x_wconf 89' lang='eng' dir='ltr'><em>MSB8T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 802 81 965 109; x_wconf 85' lang='eng' dir='ltr'><em>(AAD36645)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 400 115 1081 146; baseline 0 -6"><span class='ocrx_word' id='word_1_30' title='bbox 400 117 609 146; x_wconf 83' lang='eng' dir='ltr'><em>Synechocoocus</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 618 118 748 146; x_wconf 81' lang='eng' dir='ltr'><em>elongatus</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 758 117 819 140; x_wconf 90' lang='eng' dir='ltr'><em>PCC</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 830 115 908 140; x_wconf 75' lang='eng' dir='ltr'><em>6301T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 919 118 1081 146; x_wconf 87' lang='eng' dir='ltr'>(BAD79413)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 475 152 1017 182; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 475 154 666 182; x_wconf 87' lang='eng' dir='ltr'><em>Rhodopirellula</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 677 154 762 176; x_wconf 78' lang='eng' dir='ltr'><em>baltica</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 773 152 843 176; x_wconf 88' lang='eng' dir='ltr'><em>SH1T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 853 154 1017 182; x_wconf 84' lang='eng' dir='ltr'><em>(CAD79269)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 359 190 963 218; baseline 0.002 -6"><span class='ocrx_word' id='word_1_39' title='bbox 359 190 532 213; x_wconf 87' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 542 190 718 213; x_wconf 87' lang='eng' dir='ltr'><em>desulfuricans</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 737 190 791 213; x_wconf 88' lang='eng' dir='ltr'><em>G20</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 802 190 963 218; x_wconf 83' lang='eng' dir='ltr'><em>(ABB37883)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 431 226 1036 255; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 431 227 604 249; x_wconf 78' lang='eng' dir='ltr'><em>Lactobacillus</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 614 227 739 249; x_wconf 87' lang='eng' dir='ltr'><em>salivarius</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 749 226 862 249; x_wconf 89' lang='eng' dir='ltr'><em>UCC118</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 874 227 1036 255; x_wconf 84' lang='eng' dir='ltr'><em>(ABD99994)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 476 263 1051 291; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 476 263 665 291; x_wconf 76' lang='eng' dir='ltr'><em>Streptococcus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 674 263 782 291; x_wconf 85' lang='eng' dir='ltr'><em>gordonii</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 790 263 879 285; x_wconf 88' lang='eng' dir='ltr'><em>Challis</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 890 263 970 291; x_wconf 92' lang='eng' dir='ltr'>(ABV1</span> <span class='ocrx_word' id='word_1_51' title='bbox 979 263 1051 291; x_wconf 85' lang='eng'>1046)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 437 299 872 328; baseline 0 -6"><span class='ocrx_word' id='word_1_52' title='bbox 437 299 539 322; x_wconf 81' lang='eng' dir='ltr'><em>Bacillus</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 548 299 640 322; x_wconf 83' lang='eng' dir='ltr'><em>subtilis</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 652 299 697 322; x_wconf 86' lang='eng'><em>168</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 709 299 872 328; x_wconf 89' lang='eng' dir='ltr'><em>(CAB15547)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 425 336 1021 364; baseline 0.002 -6"><span class='ocrx_word' id='word_1_56' title='bbox 425 336 562 364; x_wconf 85' lang='eng' dir='ltr'><em>Finegoldia</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 573 342 663 364; x_wconf 84' lang='eng' dir='ltr'><em>magna</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 672 336 754 359; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 764 336 846 359; x_wconf 87' lang='eng'>29328</span> <span class='ocrx_word' id='word_1_60' title='bbox 857 336 1021 364; x_wconf 83' lang='eng' dir='ltr'><em>(BAG08949)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 443 372 1026 401; baseline 0 -6"><span class='ocrx_word' id='word_1_61' title='bbox 443 372 608 395; x_wconf 87' lang='eng' dir='ltr'><em>Chloroﬂexus</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 617 373 772 395; x_wconf 83' lang='eng' dir='ltr'><em>aurantiacus</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 782 372 853 395; x_wconf 88' lang='eng' dir='ltr'>J-10fl</span> <span class='ocrx_word' id='word_1_64' title='bbox 865 373 1026 401; x_wconf 85' lang='eng' dir='ltr'><em>(ABY33776)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 498 409 1087 437; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 498 409 709 437; x_wconf 86' lang='eng' dir='ltr'><em>Porphyromonas</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 718 409 842 437; x_wconf 83' lang='eng' dir='ltr'><em>gingivalis</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 851 409 912 431; x_wconf 87' lang='eng' dir='ltr'><em>W83</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 923 409 1087 437; x_wconf 88' lang='eng' dir='ltr'><em>(AAQ65708)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 502 443 1111 473; baseline -0.002 -5"><span class='ocrx_word' id='word_1_69' title='bbox 502 445 659 468; x_wconf 80' lang='eng' dir='ltr'><em>Bacteroides</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 670 445 756 473; x_wconf 83' lang='eng' dir='ltr'><em>fragilis</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 766 445 847 468; x_wconf 92' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 858 443 936 468; x_wconf 81' lang='eng' dir='ltr'><em>9343T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 947 445 1111 473; x_wconf 86' lang='eng' dir='ltr'><em>(CAH06724)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 458 479 979 510; baseline 0 -6"><span class='ocrx_word' id='word_1_74' title='bbox 458 481 609 504; x_wconf 86' lang='eng' dir='ltr'><em>Chlorobium</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 620 482 725 510; x_wconf 82' lang='eng' dir='ltr'><em>tepidum</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 735 479 802 504; x_wconf 89' lang='eng' dir='ltr'><em>TLST</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 812 482 979 510; x_wconf 86' lang='eng' dir='ltr'><em>(AAM72469)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 402 516 1112 546; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 402 518 599 540; x_wconf 81' lang='eng' dir='ltr'><em>Fusobacterium</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 610 518 748 540; x_wconf 74' lang='eng' dir='ltr'><em>nucleatum</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 757 518 838 540; x_wconf 94' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 849 516 944 540; x_wconf 81' lang='eng' dir='ltr'><em>25586T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 954 518 1112 546; x_wconf 83' lang='eng' dir='ltr'><em>(AAL93833)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 462 554 1090 583; baseline -0.002 -6"><span class='ocrx_word' id='word_1_83' title='bbox 462 554 668 577; x_wconf 78' lang='eng' dir='ltr'><em>Bifidobacterium</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 677 555 775 583; x_wconf 89' lang='eng' dir='ltr'><em>Iongum</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 786 554 916 577; x_wconf 88' lang='eng' dir='ltr'><em>NCC2705</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 927 555 1090 583; x_wconf 88' lang='eng' dir='ltr'><em>(AAN25218)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 594 591 1239 619; baseline 0.002 -6"><span class='ocrx_word' id='word_1_87' title='bbox 594 591 733 619; x_wconf 80' lang='eng' dir='ltr'><em>Chlamydia</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 744 591 899 614; x_wconf 81' lang='eng' dir='ltr'><em>trachomatis</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 910 591 1066 614; x_wconf 92' lang='eng' dir='ltr'><em>D/UW—3/CX</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1076 591 1239 619; x_wconf 87' lang='eng' dir='ltr'><em>(AAC68296)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 496 627 975 656; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 496 627 605 656; x_wconf 81' lang='eng' dir='ltr'><em>Opitutus</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 615 628 692 650; x_wconf 75' lang='eng' dir='ltr'><em>terrae</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 704 628 796 650; x_wconf 81' lang='eng' dir='ltr'>PBQO-1</span> <span class='ocrx_word' id='word_1_94' title='bbox 812 627 975 656; x_wconf 86' lang='eng' dir='ltr'><em>(ACB74961)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 493 662 1140 692; baseline 0 -6"><span class='ocrx_word' id='word_1_95' title='bbox 493 664 643 692; x_wconf 84' lang='eng' dir='ltr'><em>Treponema</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 654 664 772 686; x_wconf 82' lang='eng' dir='ltr'><em>dent/cola</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 781 664 863 686; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 874 662 969 686; x_wconf 80' lang='eng' dir='ltr'><em>35405T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 979 664 1140 692; x_wconf 87' lang='eng' dir='ltr'><em>(AAS12412)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 459 700 1029 728; baseline 0 -5"><span class='ocrx_word' id='word_1_100' title='bbox 459 700 622 723; x_wconf 85' lang='eng' dir='ltr'><em>Caulobacter</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 629 701 774 723; x_wconf 85' lang='eng' dir='ltr'><em>crescentus</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 784 700 857 723; x_wconf 92' lang='eng' dir='ltr'>CB15</span> <span class='ocrx_word' id='word_1_103' title='bbox 868 700 1029 728; x_wconf 89' lang='eng' dir='ltr'>(AAK25030)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 446 734 1119 765; baseline 0 -6"><span class='ocrx_word' id='word_1_104' title='bbox 446 736 634 759; x_wconf 84' lang='eng' dir='ltr'><em>Ochrobactrum</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 644 737 754 765; x_wconf 85' lang='eng' dir='ltr'><em>anthropi</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 760 736 842 759; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 852 734 948 759; x_wconf 79' lang='eng' dir='ltr'><em>49188T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 958 736 1119 765; x_wconf 86' lang='eng' dir='ltr'><em>(ABS13742)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 464 771 1060 801; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 464 773 578 795; x_wconf 80' lang='eng' dir='ltr'><em>Ehrlichia</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 588 773 740 795; x_wconf 84' lang='eng' dir='ltr'><em>chaffeensis</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 748 771 887 795; x_wconf 84' lang='eng' dir='ltr'><em>ArkansasT</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 898 773 1060 801; x_wconf 91' lang='eng' dir='ltr'>(ABD45253)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 429 809 1002 838; baseline 0 -6"><span class='ocrx_word' id='word_1_113' title='bbox 429 810 562 832; x_wconf 80' lang='eng' dir='ltr'><em>Bordetella</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 571 810 693 838; x_wconf 79' lang='eng' dir='ltr'><em>pertussis</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 702 810 811 832; x_wconf 88' lang='eng' dir='ltr'><em>Tohama</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 823 810 826 831; x_wconf 99' lang='eng'><strong><em>|</em></strong></span> <span class='ocrx_word' id='word_1_117' title='bbox 839 809 1002 838; x_wconf 87' lang='eng' dir='ltr'><em>(CAE43285)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 429 846 1035 874; baseline 0 -6"><span class='ocrx_word' id='word_1_118' title='bbox 429 846 553 868; x_wconf 85' lang='eng' dir='ltr'><em>Neisseria</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 563 846 733 874; x_wconf 86' lang='eng' dir='ltr'><em>gonorrhoeae</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 744 846 780 868; x_wconf 95' lang='eng' dir='ltr'>FA</span> <span class='ocrx_word' id='word_1_121' title='bbox 792 846 855 868; x_wconf 82' lang='eng'>1090</span> <span class='ocrx_word' id='word_1_122' title='bbox 866 846 1035 874; x_wconf 84' lang='eng' dir='ltr'><em>(AAW89680)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 429 882 1034 911; baseline 0 -6"><span class='ocrx_word' id='word_1_123' title='bbox 429 882 619 905; x_wconf 85' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 629 882 776 911; x_wconf 86' lang='eng' dir='ltr'><em>aeruginosa</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 788 882 854 905; x_wconf 90' lang='eng' dir='ltr'>PA01</span> <span class='ocrx_word' id='word_1_126' title='bbox 870 882 1034 911; x_wconf 87' lang='eng' dir='ltr'><em>(AAGO7791)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 458 919 1050 947; baseline 0 -6"><span class='ocrx_word' id='word_1_127' title='bbox 458 919 633 947; x_wconf 82' lang='eng' dir='ltr'><em>Haemophilus</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 642 919 778 941; x_wconf 83' lang='eng' dir='ltr'><em>influenzae</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 789 919 875 941; x_wconf 82' lang='eng' dir='ltr'><em>PittGG</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 887 919 1050 947; x_wconf 91' lang='eng' dir='ltr'><em>(ABROO457)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 422 955 1064 983; baseline 0 -6"><span class='ocrx_word' id='word_1_131' title='bbox 422 955 576 978; x_wconf 85' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 587 955 633 978; x_wconf 90' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 641 955 759 978; x_wconf 88' lang='eng' dir='ltr'><em>O157:H7</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 771 955 876 978; x_wconf 86' lang='eng' dir='ltr'><em>EDL933</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 888 955 1064 983; x_wconf 86' lang='eng' dir='ltr'><em>(NP_285794)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000406-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000406-0-000.pbm.png
new file mode 100644
index 00000000..57a52686
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000406-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000406-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000406-0-000.pbm.png.hocr
new file mode 100644
index 00000000..341f632a
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000406-0-000.pbm.png.hocr
@@ -0,0 +1,322 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000406-0-000.pbm.png"; bbox 0 0 1302 1004; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 165 582 190 600">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 165 582 190 600">
+     <span class='ocr_line' id='line_1_1' title="bbox 165 582 190 600; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 165 582 190 600; x_wconf 87' lang='eng'><em>78</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 229 5 280 127">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 229 5 280 127">
+     <span class='ocr_line' id='line_1_2' title="bbox 255 5 280 22; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 255 5 280 22; x_wconf 83' lang='eng'>67</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 255 57 280 75; baseline -0.04 0"><span class='ocrx_word' id='word_1_3' title='bbox 255 57 280 75; x_wconf 84' lang='eng'><em>54</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 229 109 254 127; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 229 109 254 127; x_wconf 86' lang='eng'><em>89</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 318 21 320 85">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 318 21 320 85">
+     <span class='ocr_line' id='line_1_5' title="bbox 318 21 320 85; baseline 0 919"><span class='ocrx_word' id='word_1_5' title='bbox 318 21 320 85; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 263 157 290 158">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 263 157 290 158">
+     <span class='ocr_line' id='line_1_6' title="bbox 263 157 290 158; baseline 0 846"><span class='ocrx_word' id='word_1_6' title='bbox 263 157 290 158; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 226 265 251 283">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 226 265 251 283">
+     <span class='ocr_line' id='line_1_7' title="bbox 226 265 251 283; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 226 265 251 283; x_wconf 83' lang='eng'><em>89</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 225 294 264 295">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 225 294 264 295">
+     <span class='ocr_line' id='line_1_8' title="bbox 225 294 264 295; baseline 0 709"><span class='ocrx_word' id='word_1_8' title='bbox 225 294 264 295; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 263 157 264 432">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 263 157 264 432">
+     <span class='ocr_line' id='line_1_9' title="bbox 263 157 264 432; baseline 0 572"><span class='ocrx_word' id='word_1_9' title='bbox 263 157 264 432; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 288 102 290 214">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 288 102 290 214">
+     <span class='ocr_line' id='line_1_10' title="bbox 288 102 290 214; baseline 0 790"><span class='ocrx_word' id='word_1_10' title='bbox 288 102 290 214; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 312 281 336 299">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 312 281 336 299">
+     <span class='ocr_line' id='line_1_11' title="bbox 312 281 336 299; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 312 281 336 299; x_wconf 93' lang='eng'>77</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 325 310 345 311">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 325 310 345 311">
+     <span class='ocr_line' id='line_1_12' title="bbox 325 310 345 311; baseline 0 693"><span class='ocrx_word' id='word_1_12' title='bbox 325 310 345 311; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 293 329 318 347">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 293 329 318 347">
+     <span class='ocr_line' id='line_1_13' title="bbox 293 329 318 347; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 293 329 318 347; x_wconf 82' lang='eng'>68</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 295 358 326 359">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 295 358 326 359">
+     <span class='ocr_line' id='line_1_14' title="bbox 295 358 326 359; baseline 0 645"><span class='ocrx_word' id='word_1_14' title='bbox 295 358 326 359; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 325 310 326 408">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 325 310 326 408">
+     <span class='ocr_line' id='line_1_15' title="bbox 325 310 326 408; baseline 0 596"><span class='ocrx_word' id='word_1_15' title='bbox 325 310 326 408; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 263 431 296 432">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 263 431 296 432">
+     <span class='ocr_line' id='line_1_16' title="bbox 263 431 296 432; baseline 0 572"><span class='ocrx_word' id='word_1_16' title='bbox 263 431 296 432; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 205 462 226 463">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 205 462 226 463">
+     <span class='ocr_line' id='line_1_17' title="bbox 205 462 226 463; baseline 0 541"><span class='ocrx_word' id='word_1_17' title='bbox 205 462 226 463; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 156 611 206 612">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 156 611 206 612">
+     <span class='ocr_line' id='line_1_18' title="bbox 156 611 206 612; baseline 0 392"><span class='ocrx_word' id='word_1_18' title='bbox 156 611 206 612; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 7 749 157 751">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 7 749 157 751">
+     <span class='ocr_line' id='line_1_19' title="bbox 7 749 157 751; baseline 0 253"><span class='ocrx_word' id='word_1_19' title='bbox 7 749 157 751; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 7 749 8 987">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 7 749 8 987">
+     <span class='ocr_line' id='line_1_20' title="bbox 7 749 8 987; baseline 0 17"><span class='ocrx_word' id='word_1_20' title='bbox 7 749 8 987; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 156 611 157 889">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 156 611 157 889">
+     <span class='ocr_line' id='line_1_21' title="bbox 156 611 157 889; baseline 0 115"><span class='ocrx_word' id='word_1_21' title='bbox 156 611 157 889; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 205 462 206 760">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 205 462 206 760">
+     <span class='ocr_line' id='line_1_22' title="bbox 205 462 206 760; baseline 0 244"><span class='ocrx_word' id='word_1_22' title='bbox 205 462 206 760; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 255 448 280 466">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 255 448 280 466">
+     <span class='ocr_line' id='line_1_23' title="bbox 255 448 280 466; baseline 0 0"><span class='ocrx_word' id='word_1_23' title='bbox 255 448 280 466; x_wconf 92' lang='eng'><strong>77</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 225 294 226 632">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 225 294 226 632">
+     <span class='ocr_line' id='line_1_24' title="bbox 225 294 226 632; baseline 0 372"><span class='ocrx_word' id='word_1_24' title='bbox 225 294 226 632; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 228 640 264 658">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 228 640 264 658">
+     <span class='ocr_line' id='line_1_25' title="bbox 228 640 264 658; baseline 0 0"><span class='ocrx_word' id='word_1_25' title='bbox 228 640 264 658; x_wconf 91' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 295 357 296 503">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 295 357 296 503">
+     <span class='ocr_line' id='line_1_26' title="bbox 295 357 296 503; baseline 0 501"><span class='ocrx_word' id='word_1_26' title='bbox 295 357 296 503; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 344 278 345 343">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 344 278 345 343">
+     <span class='ocr_line' id='line_1_27' title="bbox 344 278 345 343; baseline 0 661"><span class='ocrx_word' id='word_1_27' title='bbox 344 278 345 343; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 320 9 1110 39">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 320 9 1110 39">
+     <span class='ocr_line' id='line_1_28' title="bbox 320 9 1110 39; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 320 21 430 22; x_wconf 42' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 437 11 606 33; x_wconf 85' lang='eng' dir='ltr'><em>Paenibaci/Ius</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 615 11 797 38; x_wconf 78' lang='eng' dir='ltr'><em>agar/devorans</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 807 11 867 33; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 880 9 953 33; x_wconf 90' lang='eng' dir='ltr'><em>1355T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 963 11 1110 39; x_wconf 85' lang='eng' dir='ltr'><em>(AJ345023)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 290 52 683 167">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 290 52 683 167">
+     <span class='ocr_line' id='line_1_29' title="bbox 290 52 683 167; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 290 52 419 151; x_wconf 59' lang='eng' dir='ltr'>L</span> <span class='ocrx_word' id='word_1_35' title='bbox 426 137 519 161; x_wconf 79' lang='eng' dir='ltr'><em>33-4AT</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 529 139 683 167; x_wconf 82' lang='eng' dir='ltr'><em>(A3265205)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 466 74 725 104">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 466 74 725 104">
+     <span class='ocr_line' id='line_1_30' title="bbox 466 74 725 104; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 466 74 561 98; x_wconf 70' lang='eng' dir='ltr'><em>MX2-3T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 570 76 725 104; x_wconf 79' lang='eng' dir='ltr'><em>(ABZGSZOG)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 489 202 1176 425">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 499 202 1057 232">
+     <span class='ocr_line' id='line_1_31' title="bbox 499 202 1057 232; baseline 0 -6"><span class='ocrx_word' id='word_1_39' title='bbox 499 205 668 226; x_wconf 84' lang='eng' dir='ltr'><em>Paenibacil/us</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 677 205 826 232; x_wconf 86' lang='eng' dir='ltr'><em>granivorans</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 835 202 898 226; x_wconf 81' lang='eng' dir='ltr'><em>A30T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 908 205 1057 232; x_wconf 86' lang='eng' dir='ltr'><em>(AF237682)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 489 266 1176 361">
+     <span class='ocr_line' id='line_1_32' title="bbox 489 266 1153 296; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 489 269 657 290; x_wconf 87' lang='eng' dir='ltr'><em>Paenibaci/Ius</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 666 269 832 296; x_wconf 86' lang='eng' dir='ltr'><em>agarexedens</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 850 268 911 290; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 924 266 996 290; x_wconf 89' lang='eng' dir='ltr'><em>1327T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1006 268 1153 296; x_wconf 88' lang='eng' dir='ltr'><em>(AJ345020)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 516 331 1176 361; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 516 334 685 355; x_wconf 84' lang='eng' dir='ltr'><em>Paenibaci/Ius</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 694 334 833 355; x_wconf 85' lang='eng' dir='ltr'><em>alkaliterrae</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 852 334 913 355; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 926 331 1015 355; x_wconf 91' lang='eng' dir='ltr'><em>17040T</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 1024 334 1176 361; x_wconf 87' lang='eng' dir='ltr'><em>(AY960748)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 495 395 1089 425">
+     <span class='ocr_line' id='line_1_34' title="bbox 495 395 1089 425; baseline 0.002 -7"><span class='ocrx_word' id='word_1_53' title='bbox 495 397 664 419; x_wconf 86' lang='eng' dir='ltr'><em>Paenibacil/us</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 673 397 841 424; x_wconf 86' lang='eng' dir='ltr'><em>glycanilyticus</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 852 395 927 419; x_wconf 89' lang='eng' dir='ltr'><em>DS-1T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 937 397 1089 425; x_wconf 84' lang='eng' dir='ltr'><em>(ABO42938)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 424 460 1145 490">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 424 460 1145 490">
+     <span class='ocr_line' id='line_1_35' title="bbox 424 460 1145 490; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 424 470 511 471; x_wconf 41' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 521 463 689 484; x_wconf 87' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 698 463 811 484; x_wconf 89' lang='eng' dir='ltr'><em>kobensis</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 821 462 882 484; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 895 460 983 484; x_wconf 89' lang='eng' dir='ltr'><em>10249T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 993 462 1145 490; x_wconf 85' lang='eng' dir='ltr'><em>(ABO73363)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 295 502 424 503">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 295 502 424 503">
+     <span class='ocr_line' id='line_1_36' title="bbox 295 502 424 503; baseline 0 501"><span class='ocrx_word' id='word_1_63' title='bbox 295 502 424 503; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 298 511 335 529">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 298 511 335 529">
+     <span class='ocr_line' id='line_1_37' title="bbox 298 511 335 529; baseline 0.027 -1"><span class='ocrx_word' id='word_1_64' title='bbox 298 511 335 529; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 422 470 425 537">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 422 470 425 537">
+     <span class='ocr_line' id='line_1_38' title="bbox 422 470 425 537; baseline 0 467"><span class='ocrx_word' id='word_1_65' title='bbox 422 470 425 537; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 424 523 1247 618">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 424 523 1247 618">
+     <span class='ocr_line' id='line_1_39' title="bbox 424 523 1247 553; baseline 0 -6"><span class='ocrx_word' id='word_1_66' title='bbox 424 535 539 537; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_67' title='bbox 546 526 715 547; x_wconf 86' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 725 526 914 553; x_wconf 82' lang='eng' dir='ltr'><em>curd/anoiyticus</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 924 526 984 547; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 997 523 1086 547; x_wconf 89' lang='eng' dir='ltr'><em>10247T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 1096 526 1247 553; x_wconf 89' lang='eng' dir='ltr'><em>(AB073202)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 470 588 1057 618; baseline -0.002 -5"><span class='ocrx_word' id='word_1_72' title='bbox 470 591 638 613; x_wconf 86' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 647 591 778 618; x_wconf 87' lang='eng' dir='ltr'><em>favisporus</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 787 588 896 613; x_wconf 92' lang='eng' dir='ltr'><em>GMP01T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 906 591 1057 618; x_wconf 90' lang='eng' dir='ltr'><em>(AY208751)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 476 652 1156 682">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 476 652 1156 682">
+     <span class='ocr_line' id='line_1_41' title="bbox 476 652 1156 682; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 476 655 644 676; x_wconf 84' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 653 655 834 682; x_wconf 86' lang='eng' dir='ltr'><em>rhizosphaerae</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 852 652 995 676; x_wconf 90' lang='eng' dir='ltr'><em>CECAP06T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1005 654 1156 682; x_wconf 87' lang='eng' dir='ltr'><em>(AY751754)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 381 728 484 729">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 381 728 484 729">
+     <span class='ocr_line' id='line_1_42' title="bbox 381 728 484 729; baseline 0 275"><span class='ocrx_word' id='word_1_80' title='bbox 381 728 484 729; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 491 715 1163 745">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 491 715 1163 745">
+     <span class='ocr_line' id='line_1_43' title="bbox 491 715 1163 745; baseline -0.001 -5"><span class='ocrx_word' id='word_1_81' title='bbox 491 718 659 740; x_wconf 85' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 668 718 816 740; x_wconf 86' lang='eng' dir='ltr'><em>lentimorbus</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 825 718 902 740; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 915 715 1003 740; x_wconf 92' lang='eng' dir='ltr'><em>14707T</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1013 718 1149 745; x_wconf 85' lang='eng' dir='ltr'><em>(AFO71861</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1157 718 1163 745; x_wconf 91' lang='eng'>)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 205 759 381 761">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 205 759 381 761">
+     <span class='ocr_line' id='line_1_44' title="bbox 205 759 381 761; baseline 0 243"><span class='ocrx_word' id='word_1_87' title='bbox 205 759 381 761; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 208 768 245 786">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 208 768 245 786">
+     <span class='ocr_line' id='line_1_45' title="bbox 208 768 245 786; baseline 0 0"><span class='ocrx_word' id='word_1_88' title='bbox 208 768 245 786; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 380 728 381 794">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 380 728 381 794">
+     <span class='ocr_line' id='line_1_46' title="bbox 380 728 381 794; baseline 0 210"><span class='ocrx_word' id='word_1_89' title='bbox 380 728 381 794; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 523 781 1168 811">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 523 781 1168 811">
+     <span class='ocr_line' id='line_1_47' title="bbox 523 781 1168 811; baseline 0 -6"><span class='ocrx_word' id='word_1_90' title='bbox 523 784 691 805; x_wconf 89' lang='eng' dir='ltr'><em>Paenibacil/us</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 701 784 889 811; x_wconf 78' lang='eng' dir='ltr'><em>thiaminolyﬂcus</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 898 783 955 805; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 965 781 1040 805; x_wconf 80' lang='eng' dir='ltr'><em>8360T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1050 783 1168 811; x_wconf 88' lang='eng' dir='ltr'><em>(D78475)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 356 856 458 857">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 356 856 458 857">
+     <span class='ocr_line' id='line_1_48' title="bbox 356 856 458 857; baseline 0 147"><span class='ocrx_word' id='word_1_95' title='bbox 356 856 458 857; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 465 844 1044 874">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 465 844 1044 874">
+     <span class='ocr_line' id='line_1_49' title="bbox 465 844 1044 874; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 465 847 633 868; x_wconf 86' lang='eng' dir='ltr'><em>Paenibacil/us</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 644 847 732 868; x_wconf 87' lang='eng' dir='ltr'><em>validus</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 740 846 797 868; x_wconf 87' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 808 844 883 868; x_wconf 89' lang='eng' dir='ltr'><em>9077T</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 893 846 1044 874; x_wconf 87' lang='eng' dir='ltr'><em>(ABO73203)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 156 888 356 889">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 156 888 356 889">
+     <span class='ocr_line' id='line_1_50' title="bbox 156 888 356 889; baseline 0 115"><span class='ocrx_word' id='word_1_101' title='bbox 156 888 356 889; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 159 897 196 915">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 159 897 196 915">
+     <span class='ocr_line' id='line_1_51' title="bbox 159 897 196 915; baseline 0 0"><span class='ocrx_word' id='word_1_102' title='bbox 159 897 196 915; x_wconf 92' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 354 856 356 923">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 354 856 356 923">
+     <span class='ocr_line' id='line_1_52' title="bbox 354 856 356 923; baseline 0 81"><span class='ocrx_word' id='word_1_103' title='bbox 354 856 356 923; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 538 910 1300 940">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 538 910 1300 940">
+     <span class='ocr_line' id='line_1_53' title="bbox 538 910 1300 940; baseline 0 -6"><span class='ocrx_word' id='word_1_104' title='bbox 538 913 706 934; x_wconf 86' lang='eng' dir='ltr'><em>Paenibacil/us</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 715 913 959 939; x_wconf 85' lang='eng' dir='ltr'><em>naphtha/enovorans</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 978 912 1038 934; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 1051 910 1140 934; x_wconf 90' lang='eng' dir='ltr'><em>14203T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1150 912 1300 940; x_wconf 83' lang='eng' dir='ltr'><em>(AF353681)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 496 973 1171 1003">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 496 973 1171 1003">
+     <span class='ocr_line' id='line_1_54' title="bbox 496 973 1171 1003; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 496 976 698 997; x_wconf 83' lang='eng' dir='ltr'><em>Aneur/nibaci/Ius</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 707 976 888 1003; x_wconf 85' lang='eng' dir='ltr'><em>aneurin/Iyticus</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 899 975 959 997; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 970 973 1045 997; x_wconf 90' lang='eng' dir='ltr'><em>5562T</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 1055 975 1171 1003; x_wconf 86' lang='eng' dir='ltr'><em>(X94194)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000489-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000489-0-000.pbm.png
new file mode 100644
index 00000000..8d3ef98d
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000489-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000489-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000489-0-000.pbm.png.hocr
new file mode 100644
index 00000000..a08d2358
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000489-0-000.pbm.png.hocr
@@ -0,0 +1,91 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000489-0-000.pbm.png"; bbox 0 0 888 372; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 214 2 886 370">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 302 2 779 29">
+     <span class='ocr_line' id='line_1_1' title="bbox 302 2 779 29; baseline -0.004 -4"><span class='ocrx_word' id='word_1_1' title='bbox 302 7 339 25; x_wconf 90' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 372 2 397 24; x_wconf 91' lang='eng' dir='ltr'><em>G.</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 409 3 536 29; x_wconf 87' lang='eng' dir='ltr'><em>agarilytica</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 547 2 614 24; x_wconf 90' lang='eng' dir='ltr'><em>N02T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 624 2 779 29; x_wconf 89' lang='eng' dir='ltr'><em>(DQ784575)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 357 39 831 67">
+     <span class='ocr_line' id='line_1_2' title="bbox 357 39 831 67; baseline 0 -6"><span class='ocrx_word' id='word_1_6' title='bbox 357 40 382 61; x_wconf 94' lang='eng' dir='ltr'><em>G.</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 394 40 569 61; x_wconf 82' lang='eng' dir='ltr'><em>chathamensis</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 578 39 674 61; x_wconf 87' lang='eng' dir='ltr'><em>S18K6T</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 681 40 831 67; x_wconf 79' lang='eng' dir='ltr'><em>(ABZ47623)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 378 77 818 105">
+     <span class='ocr_line' id='line_1_3' title="bbox 378 77 818 105; baseline 0 -6"><span class='ocrx_word' id='word_1_10' title='bbox 378 78 402 99; x_wconf 92' lang='eng' dir='ltr'><em>G.</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 413 78 497 104; x_wconf 86' lang='eng' dir='ltr'><em>polaris</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 507 78 566 99; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 576 77 665 99; x_wconf 82' lang='eng' dir='ltr'><em>21857T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 673 78 818 105; x_wconf 81' lang='eng' dir='ltr'><em>(AJ293820)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 324 115 784 142">
+     <span class='ocr_line' id='line_1_4' title="bbox 324 115 784 142; baseline 0 -5"><span class='ocrx_word' id='word_1_15' title='bbox 324 115 349 137; x_wconf 93' lang='eng' dir='ltr'><em>G.</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 361 116 490 142; x_wconf 87' lang='eng' dir='ltr'><em>mesophi/a</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 500 116 563 137; x_wconf 92' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 573 115 631 137; x_wconf 91' lang='eng' dir='ltr'><em>241T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 638 115 784 142; x_wconf 90' lang='eng' dir='ltr'><em>(AJ488501)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 391 153 818 218">
+     <span class='ocr_line' id='line_1_5' title="bbox 391 153 818 180; baseline 0 -5"><span class='ocrx_word' id='word_1_20' title='bbox 391 153 415 175; x_wconf 91' lang='eng' dir='ltr'><em>G.</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 426 154 586 180; x_wconf 87' lang='eng' dir='ltr'><em>psychrophi/a</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 598 153 653 175; x_wconf 91' lang='eng' dir='ltr'><em>170T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 663 153 818 180; x_wconf 85' lang='eng' dir='ltr'><em>(DQOO7436)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 439 190 734 218; baseline 0.003 -6"><span class='ocrx_word' id='word_1_24' title='bbox 439 191 518 213; x_wconf 89' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 529 190 573 213; x_wconf 90' lang='eng' dir='ltr'><em>E3T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 583 191 734 218; x_wconf 86' lang='eng' dir='ltr'><em>(EU183316)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 214 228 886 370">
+     <span class='ocr_line' id='line_1_7' title="bbox 470 228 886 256; baseline 0 -6"><span class='ocrx_word' id='word_1_27' title='bbox 470 229 494 250; x_wconf 91' lang='eng' dir='ltr'><strong><em>G.</em></strong></span> <span class='ocrx_word' id='word_1_28' title='bbox 505 229 604 256; x_wconf 86' lang='eng' dir='ltr'><em>punicea</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 613 229 694 250; x_wconf 88' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 705 228 886 256; x_wconf 78' lang='eng' dir='ltr'><em>611T(U85853)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 347 266 850 294; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 347 267 372 288; x_wconf 94' lang='eng' dir='ltr'><em>G.</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 383 267 570 288; x_wconf 81' lang='eng' dir='ltr'><em>nitratireducens</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 580 266 691 288; x_wconf 80' lang='eng' dir='ltr'><em>FR1064T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 701 267 850 294; x_wconf 89' lang='eng' dir='ltr'><em>(AY787042)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 214 304 824 332; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 214 304 251 322; x_wconf 83' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 400 305 424 326; x_wconf 90' lang='eng' dir='ltr'><em>G.</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 435 305 539 332; x_wconf 83' lang='eng' dir='ltr'><em>pallidu/a</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 548 305 629 326; x_wconf 94' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 640 304 698 326; x_wconf 82' lang='eng' dir='ltr'><em>615T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 708 305 824 332; x_wconf 88' lang='eng' dir='ltr'><em>(U85854)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 232 342 801 370; baseline 0 -6"><span class='ocrx_word' id='word_1_41' title='bbox 232 343 393 364; x_wconf 86' lang='eng' dir='ltr'><em>Alteromonas</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 402 343 524 364; x_wconf 82' lang='eng' dir='ltr'><em>mac/eodii</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 533 343 579 364; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 592 342 679 364; x_wconf 77' lang='eng' dir='ltr'><em>12920T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 687 343 801 370; x_wconf 89' lang='eng' dir='ltr'><em>(X82145)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 11 465 331">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 0 11 465 331">
+     <span class='ocr_line' id='line_1_11' title="bbox 266 11 302 42; baseline 0 330"><span class='ocrx_word' id='word_1_46' title='bbox 266 11 302 42; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 209 42 377 119; baseline 0 -17"><span class='ocrx_word' id='word_1_47' title='bbox 209 42 377 119; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 128 119 324 155; baseline 0 217"><span class='ocrx_word' id='word_1_48' title='bbox 128 119 324 155; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 108 155 391 193; baseline 0 179"><span class='ocrx_word' id='word_1_49' title='bbox 108 155 391 193; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 0 193 439 232; baseline 0 140"><span class='ocrx_word' id='word_1_50' title='bbox 0 193 439 232; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 0 232 465 252; baseline 0 120"><span class='ocrx_word' id='word_1_51' title='bbox 0 232 465 252; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 0 252 347 308; baseline 0 0"><span class='ocrx_word' id='word_1_52' title='bbox 0 252 347 308; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_53' title='bbox 251 295 347 308; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 0 308 9 331; baseline 0 41"><span class='ocrx_word' id='word_1_54' title='bbox 0 308 9 331; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 57 55 202 120">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 57 55 202 120">
+     <span class='ocr_line' id='line_1_19' title="bbox 57 55 99 73; baseline 0 0"><span class='ocrx_word' id='word_1_55' title='bbox 57 55 99 73; x_wconf 91' lang='eng'><em>0.01</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 180 102 202 120; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 180 102 202 120; x_wconf 84' lang='eng'><em>91</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 0 308 397 355">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 0 308 397 355">
+     <span class='ocr_line' id='line_1_21' title="bbox 255 308 397 328; baseline 0 44"><span class='ocrx_word' id='word_1_57' title='bbox 255 308 397 328; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 0 331 229 355; baseline 0 17"><span class='ocrx_word' id='word_1_58' title='bbox 0 331 229 355; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000497-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000497-0-001.pbm.png
new file mode 100644
index 00000000..15261991
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000497-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000497-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000497-0-001.pbm.png.hocr
new file mode 100644
index 00000000..9c74ceab
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000497-0-001.pbm.png.hocr
@@ -0,0 +1,202 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000497-0-001.pbm.png"; bbox 0 0 1243 1021; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 56 771 58 855">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 56 771 58 855">
+     <span class='ocr_line' id='line_1_1' title="bbox 56 771 58 855; baseline 0 166"><span class='ocrx_word' id='word_1_1' title='bbox 56 771 58 855; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 73 517 106 534">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 73 517 106 534">
+     <span class='ocr_line' id='line_1_2' title="bbox 73 517 106 534; baseline -0.03 0"><span class='ocrx_word' id='word_1_2' title='bbox 73 517 106 534; x_wconf 57' lang='eng'><em>94*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 219 371 241 387">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 219 371 241 387">
+     <span class='ocr_line' id='line_1_3' title="bbox 219 371 241 387; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 219 371 241 387; x_wconf 89' lang='eng'><em>52</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 185 441 218 458">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 185 441 218 458">
+     <span class='ocr_line' id='line_1_4' title="bbox 185 441 218 458; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 185 441 218 458; x_wconf 77' lang='eng'><em>97*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 211 640 235 656">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 211 640 235 656">
+     <span class='ocr_line' id='line_1_5' title="bbox 211 640 235 656; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 211 640 235 656; x_wconf 86' lang='eng'>90</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 162 995 224 1014">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 162 995 224 1014">
+     <span class='ocr_line' id='line_1_6' title="bbox 162 995 224 1014; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 162 995 224 1014; x_wconf 91' lang='eng'>0.005</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 227 397 229 538">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 227 397 229 538">
+     <span class='ocr_line' id='line_1_7' title="bbox 227 397 229 538; baseline 0 483"><span class='ocrx_word' id='word_1_7' title='bbox 227 397 229 538; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 248 583 250 668">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 248 583 250 668">
+     <span class='ocr_line' id='line_1_8' title="bbox 248 583 250 668; baseline 0 353"><span class='ocrx_word' id='word_1_8' title='bbox 248 583 250 668; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 284 170 286 444">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 284 170 286 444">
+     <span class='ocr_line' id='line_1_9' title="bbox 284 170 286 444; baseline 0 577"><span class='ocrx_word' id='word_1_9' title='bbox 284 170 286 444; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 360 20 381 37">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 360 20 381 37">
+     <span class='ocr_line' id='line_1_10' title="bbox 360 20 381 37; baseline -0.048 0"><span class='ocrx_word' id='word_1_10' title='bbox 360 20 381 37; x_wconf 86' lang='eng'><em>61</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 342 178 365 194">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 342 178 365 194">
+     <span class='ocr_line' id='line_1_11' title="bbox 342 178 365 194; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 342 178 365 194; x_wconf 87' lang='eng'><em>54</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 372 113 374 292">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 372 113 374 292">
+     <span class='ocr_line' id='line_1_12' title="bbox 372 113 374 292; baseline 0 729"><span class='ocrx_word' id='word_1_12' title='bbox 372 113 374 292; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 395 6 1087 128">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 395 6 1087 128">
+     <span class='ocr_line' id='line_1_13' title="bbox 395 6 1087 33; baseline 0 -5"><span class='ocrx_word' id='word_1_13' title='bbox 395 19 461 21; x_wconf 97' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_14' title='bbox 469 6 490 28; x_wconf 90' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 502 7 594 33; x_wconf 83' lang='eng' dir='ltr'><em>griseus</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 603 7 683 33; x_wconf 84' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 694 7 786 33; x_wconf 86' lang='eng' dir='ltr'><em>griseus</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 796 6 840 28; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 853 7 927 28; x_wconf 87' lang='eng'>13550</span> <span class='ocrx_word' id='word_1_20' title='bbox 938 7 1087 33; x_wconf 87' lang='eng' dir='ltr'><em>(ABO45866)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 549 48 988 82; baseline 0 -6"><span class='ocrx_word' id='word_1_21' title='bbox 549 55 570 76; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 583 55 664 82; x_wconf 84' lang='eng' dir='ltr'><em>fragil/s</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 674 55 749 76; x_wconf 88' lang='eng' dir='ltr'><em>NRRL</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 758 48 988 82; x_wconf 60' lang='eng' dir='ltr'><em>2424T(AY999917)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 553 101 983 128; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 553 101 581 122; x_wconf 79' lang='eng'><em>‘8.</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 595 101 700 122; x_wconf 76' lang='eng' dir='ltr'><em>vel/osus’</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 713 101 787 122; x_wconf 90' lang='eng' dir='ltr'><em>NRRL</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 797 101 858 122; x_wconf 85' lang='eng'><em>8037</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 869 101 983 128; x_wconf 90' lang='eng' dir='ltr'>(X99942)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 502 141 1045 213">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 502 141 1045 213">
+     <span class='ocr_line' id='line_1_16' title="bbox 502 141 1045 175; baseline 0 -6"><span class='ocrx_word' id='word_1_30' title='bbox 502 148 523 169; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_31' title='bbox 536 148 688 175; x_wconf 79' lang='eng' dir='ltr'><em>champavatii</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 697 148 772 169; x_wconf 89' lang='eng' dir='ltr'><em>NRRL</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 783 141 883 169; x_wconf 77' lang='eng' dir='ltr'><em>B-5682T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 891 148 1045 175; x_wconf 84' lang='eng' dir='ltr'><em>(DQ026642)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 503 180 974 213; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 503 186 524 207; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 537 187 666 213; x_wconf 84' lang='eng' dir='ltr'><em>sampsonii</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 673 186 749 207; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 759 180 849 207; x_wconf 75' lang='eng' dir='ltr'><em>25495T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 859 187 974 213; x_wconf 84' lang='eng' dir='ltr'><em>(D63871)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 393 19 395 68">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 393 19 395 68">
+     <span class='ocr_line' id='line_1_18' title="bbox 393 19 395 68; baseline 0 953"><span class='ocrx_word' id='word_1_40' title='bbox 393 19 395 68; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 448 157 480 173">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 448 157 480 173">
+     <span class='ocr_line' id='line_1_19' title="bbox 448 157 480 173; baseline 0 0"><span class='ocrx_word' id='word_1_41' title='bbox 448 157 480 173; x_wconf 76' lang='eng'><em>71*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 370 160 581 354">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 370 160 581 354">
+     <span class='ocr_line' id='line_1_20' title="bbox 370 160 502 286; baseline 0 0"><span class='ocrx_word' id='word_1_42' title='bbox 370 160 502 286; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 370 286 581 354; baseline 0 0"><span class='ocrx_word' id='word_1_43' title='bbox 370 286 581 354; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 451 204 474 220">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 451 204 474 220">
+     <span class='ocr_line' id='line_1_22' title="bbox 451 204 474 220; baseline 0 0"><span class='ocrx_word' id='word_1_44' title='bbox 451 204 474 220; x_wconf 91' lang='eng'><em>57</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 504 246 955 316">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 504 246 955 316">
+     <span class='ocr_line' id='line_1_23' title="bbox 504 246 938 273; baseline 0 -6"><span class='ocrx_word' id='word_1_45' title='bbox 504 246 533 267; x_wconf 75' lang='eng' dir='ltr'><em>‘S.</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 546 246 697 273; x_wconf 75' lang='eng' dir='ltr'><em>fungicidicus’</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 708 246 778 267; x_wconf 92' lang='eng' dir='ltr'><em>YHO4</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 788 246 938 273; x_wconf 71' lang='eng' dir='ltr'><em>(AW-336155)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 509 289 955 316; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 509 289 530 310; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 542 289 692 310; x_wconf 84' lang='eng' dir='ltr'><em>albidoﬂavus</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 703 289 797 310; x_wconf 84' lang='eng' dir='ltr'><em>HD-109</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 808 289 955 316; x_wconf 82' lang='eng' dir='ltr'><em>(EF620361)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 392 332 1239 647">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 392 332 1239 647">
+     <span class='ocr_line' id='line_1_25' title="bbox 587 332 1055 366; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 587 339 608 360; x_wconf 86' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 621 339 778 366; x_wconf 85' lang='eng' dir='ltr'><em>koyangensis</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 787 332 896 360; x_wconf 71' lang='eng' dir='ltr'><em>VK-AESOT</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 906 339 1055 366; x_wconf 85' lang='eng' dir='ltr'><em>(AY079156)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 417 376 977 409; baseline 0 -5"><span class='ocrx_word' id='word_1_57' title='bbox 417 383 437 404; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 450 383 657 409; x_wconf 78' lang='eng' dir='ltr'><em>spinoverrucosus</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 668 383 726 404; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 735 376 825 404; x_wconf 89' lang='eng' dir='ltr'><em>20321T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 833 383 977 409; x_wconf 83' lang='eng' dir='ltr'><em>(AJ781376)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 579 424 1144 458; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 579 431 600 452; x_wconf 86' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 613 432 836 452; x_wconf 77' lang='eng' dir='ltr'><em>thermodiastaticus</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 845 431 900 452; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 911 424 985 452; x_wconf 82' lang='eng' dir='ltr'><em>4840T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 995 432 1144 458; x_wconf 82' lang='eng' dir='ltr'><em>(ABO18096)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 447 471 998 504; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 447 478 468 499; x_wconf 11' lang='eng' dir='ltr'>S9</span> <span class='ocrx_word' id='word_1_68' title='bbox 481 478 647 504; x_wconf 85' lang='eng' dir='ltr'><em>albogriseo/us</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 658 478 732 499; x_wconf 89' lang='eng' dir='ltr'><em>NRRL</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 743 471 844 499; x_wconf 85' lang='eng' dir='ltr'><em>B-1305T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 854 478 998 504; x_wconf 84' lang='eng' dir='ltr'><em>(AJ494865)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 392 517 876 551; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 392 524 413 545; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 427 524 556 551; x_wconf 76' lang='eng' dir='ltr'><em>variegatus</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 566 524 625 545; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 635 517 724 545; x_wconf 84' lang='eng' dir='ltr'><em>20315T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 732 524 876 551; x_wconf 85' lang='eng' dir='ltr'><em>(AJ781371)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 471 564 950 597; baseline 0 -5"><span class='ocrx_word' id='word_1_77' title='bbox 471 571 492 592; x_wconf 84' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_78' title='bbox 505 571 656 592; x_wconf 86' lang='eng' dir='ltr'><em>mashuensis</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 666 571 725 592; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 735 564 825 592; x_wconf 79' lang='eng' dir='ltr'><em>40221T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 836 571 950 597; x_wconf 85' lang='eng' dir='ltr'><em>(X79323)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 677 613 1239 647; baseline 0 -6"><span class='ocrx_word' id='word_1_82' title='bbox 677 620 698 641; x_wconf 86' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 710 620 868 646; x_wconf 85' lang='eng' dir='ltr'><em>kasugaensis</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 878 620 953 641; x_wconf 89' lang='eng' dir='ltr'><em>NRRL</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 964 613 1081 641; x_wconf 77' lang='eng' dir='ltr'><em>B-24288T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1091 620 1239 647; x_wconf 86' lang='eng' dir='ltr'>(AY999920)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 248 666 410 668">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 248 666 410 668">
+     <span class='ocr_line' id='line_1_32' title="bbox 248 666 410 668; baseline 0 353"><span class='ocrx_word' id='word_1_87' title='bbox 248 666 410 668; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 227 868 260 885">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 227 868 260 885">
+     <span class='ocr_line' id='line_1_33' title="bbox 227 868 260 885; baseline 0 0"><span class='ocrx_word' id='word_1_88' title='bbox 227 868 260 885; x_wconf 64' lang='eng'>98‘</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 408 630 410 702">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 408 630 410 702">
+     <span class='ocr_line' id='line_1_34' title="bbox 408 630 410 702; baseline 0 319"><span class='ocrx_word' id='word_1_89' title='bbox 408 630 410 702; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 364 661 1024 726">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 364 661 1024 694">
+     <span class='ocr_line' id='line_1_35' title="bbox 364 661 1024 694; baseline 0 -5"><span class='ocrx_word' id='word_1_90' title='bbox 364 673 397 690; x_wconf 68' lang='eng'>99*</span> <span class='ocrx_word' id='word_1_91' title='bbox 496 668 517 689; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 530 668 702 689; x_wconf 87' lang='eng' dir='ltr'><em>morookaense</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 712 668 770 689; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 780 661 870 689; x_wconf 91' lang='eng' dir='ltr'><em>20074T</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 880 668 1024 694; x_wconf 85' lang='eng' dir='ltr'><em>(AJ781349)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 390 708 1173 926">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 390 708 1173 926">
+     <span class='ocr_line' id='line_1_36' title="bbox 558 708 1156 741; baseline 0 -5"><span class='ocrx_word' id='word_1_96' title='bbox 558 715 579 736; x_wconf 89' lang='eng' dir='ltr'><em>s.</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 592 715 796 741; x_wconf 85' lang='eng' dir='ltr'><em>lavenduligriseus</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 806 715 881 735; x_wconf 90' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_99' title='bbox 892 708 992 736; x_wconf 77' lang='eng' dir='ltr'><em>3—3173T</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 1002 715 1156 741; x_wconf 85' lang='eng' dir='ltr'><em>(DQ442515)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 390 755 873 788; baseline 0.002 -6"><span class='ocrx_word' id='word_1_101' title='bbox 390 761 412 783; x_wconf 86' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 425 762 557 788; x_wconf 81' lang='eng' dir='ltr'><em>sodiiphilus</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 565 762 613 782; x_wconf 91' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 625 755 714 783; x_wconf 79' lang='eng' dir='ltr'><em>80305T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 724 762 873 788; x_wconf 82' lang='eng' dir='ltr'><em>(AY236339)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 581 800 1173 833; baseline 0 -6"><span class='ocrx_word' id='word_1_106' title='bbox 581 806 605 827; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_107' title='bbox 614 807 786 827; x_wconf 87' lang='eng' dir='ltr'><em>xiamenensis</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 796 806 879 827; x_wconf 88' lang='eng' dir='ltr'><em>MCCC</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 890 800 1015 827; x_wconf 93' lang='eng' dir='ltr'><em>1A01550T</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 1024 807 1173 833; x_wconf 83' lang='eng' dir='ltr'><em>(EFO12099)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 618 847 1157 880; baseline 0 -5"><span class='ocrx_word' id='word_1_111' title='bbox 618 854 639 875; x_wconf 90' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 652 854 781 880; x_wconf 81' lang='eng' dir='ltr'><em>carpaticus</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 791 854 866 875; x_wconf 89' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_114' title='bbox 877 847 994 875; x_wconf 60' lang='eng' dir='ltr'><em>846359T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1004 854 1157 880; x_wconf 85' lang='eng' dir='ltr'>(DQ442494)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 414 893 1163 926; baseline 0 -5"><span class='ocrx_word' id='word_1_116' title='bbox 414 904 447 921; x_wconf 77' lang='eng'><em>98&quot;</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 461 912 667 914; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_118' title='bbox 676 899 697 921; x_wconf 87' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_119' title='bbox 710 900 885 921; x_wconf 78' lang='eng' dir='ltr'><em>cheonanens/s</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 893 893 1004 921; x_wconf 84' lang='eng' dir='ltr'><em>VC-A46T</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 1014 900 1163 926; x_wconf 87' lang='eng' dir='ltr'><em>(AY822606)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 459 865 461 914">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 459 865 461 914">
+     <span class='ocr_line' id='line_1_41' title="bbox 459 865 461 914; baseline 0 107"><span class='ocrx_word' id='word_1_122' title='bbox 459 865 461 914; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000521-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000521-0-000.pbm.png
new file mode 100644
index 00000000..00515e4e
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000521-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000521-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000521-0-000.pbm.png.hocr
new file mode 100644
index 00000000..dc80939d
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000521-0-000.pbm.png.hocr
@@ -0,0 +1,144 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000521-0-000.pbm.png"; bbox 0 0 1242 1099; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 65 0 1242 1099">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 65 0 1242 1099">
+     <span class='ocr_line' id='line_1_1' title="bbox 65 0 1113 28; baseline 0 -5"><span class='ocrx_word' id='word_1_1' title='bbox 65 4 108 23; x_wconf 88' lang='eng'><em>0.01</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 269 2 295 21; x_wconf 87' lang='eng'>53</span> <span class='ocrx_word' id='word_1_3' title='bbox 585 2 715 23; x_wconf 78' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 725 2 827 23; x_wconf 85' lang='eng' dir='ltr'><em>undico/a</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 838 2 894 23; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 907 0 993 23; x_wconf 84' lang='eng' dir='ltr'><em>11875T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1002 2 1113 28; x_wconf 94' lang='eng' dir='ltr'>(Y17047)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 739 37 1193 65; baseline 0.002 -6"><span class='ocrx_word' id='word_1_8' title='bbox 739 39 868 60; x_wconf 83' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 879 39 925 60; x_wconf 81' lang='eng' dir='ltr'><em>vitis</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 935 39 991 60; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1002 37 1075 60; x_wconf 90' lang='eng' dir='ltr'><em>8750T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1082 39 1193 65; x_wconf 89' lang='eng' dir='ltr'><em>(X67225)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 561 74 1003 102; baseline 0 -6"><span class='ocrx_word' id='word_1_13' title='bbox 561 76 691 96; x_wconf 83' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 700 76 797 102; x_wconf 85' lang='eng' dir='ltr'><em>giardinii</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 806 74 882 96; x_wconf 91' lang='eng' dir='ltr'><em>H152T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 890 76 1003 102; x_wconf 86' lang='eng' dir='ltr'>(U86344)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 611 110 1242 139; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 611 113 741 133; x_wconf 87' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 751 113 908 139; x_wconf 85' lang='eng' dir='ltr'><em>daejeonense</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 919 112 991 133; x_wconf 88' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1004 110 1089 133; x_wconf 88' lang='eng' dir='ltr'><em>12121T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1097 113 1242 139; x_wconf 86' lang='eng' dir='ltr'>(AY341343)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 663 148 1100 176; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 663 150 793 170; x_wconf 85' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 802 150 849 170; x_wconf 87' lang='eng' dir='ltr'><em>rubi</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 858 150 914 170; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 927 148 982 170; x_wconf 92' lang='eng' dir='ltr'><em>156T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 989 150 1100 176; x_wconf 89' lang='eng' dir='ltr'><em>(X67228)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 611 184 1218 213; baseline 0 -6"><span class='ocrx_word' id='word_1_27' title='bbox 611 187 741 207; x_wconf 85' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 751 187 891 207; x_wconf 80' lang='eng' dir='ltr'><em>radiobacter</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 897 186 971 207; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 984 184 1070 207; x_wconf 80' lang='eng' dir='ltr'>19358T</span> <span class='ocrx_word' id='word_1_31' title='bbox 1078 187 1218 213; x_wconf 81' lang='eng' dir='ltr'>(AJ389904)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 649 221 1154 249; baseline 0 -5"><span class='ocrx_word' id='word_1_32' title='bbox 649 223 778 244; x_wconf 84' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 788 223 928 249; x_wconf 83' lang='eng' dir='ltr'><em>lanymoorei</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 935 223 991 244; x_wconf 24' lang='eng' dir='ltr'><em>AF3‘</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 997 223 1004 244; x_wconf 94' lang='eng'>1</span> <span class='ocrx_word' id='word_1_36' title='bbox 1011 221 1037 244; x_wconf 93' lang='eng' dir='ltr'><em>0T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1044 223 1154 249; x_wconf 85' lang='eng'>(230542)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 549 258 1160 286; baseline 0 -5"><span class='ocrx_word' id='word_1_38' title='bbox 549 261 679 281; x_wconf 84' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 689 261 865 286; x_wconf 75' lang='eng' dir='ltr'><em>cellulosi/yticus</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 873 258 1002 281; x_wconf 83' lang='eng' dir='ltr'><em>ALA1OBZT</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 1010 260 1160 286; x_wconf 87' lang='eng' dir='ltr'><em>(DQ855276)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 416 295 955 323; baseline 0 -5"><span class='ocrx_word' id='word_1_42' title='bbox 416 297 546 318; x_wconf 80' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 555 297 653 323; x_wconf 82' lang='eng' dir='ltr'><em>ga/egae</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 661 297 736 318; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 746 295 955 323; x_wconf 80' lang='eng' dir='ltr'>43677T(D11343)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 359 332 860 360; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 359 334 489 354; x_wconf 85' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 498 334 632 354; x_wconf 76' lang='eng' dir='ltr'><em>huautlense</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 642 332 708 354; x_wconf 82' lang='eng' dir='ltr'><em>802T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 716 334 860 360; x_wconf 87' lang='eng' dir='ltr'>(AF025852)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 369 369 989 397; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 369 371 499 392; x_wconf 80' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 508 371 631 392; x_wconf 82' lang='eng' dir='ltr'><em>loessense</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 641 371 736 392; x_wconf 93' lang='eng' dir='ltr'><em>CCBAU</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 747 369 838 392; x_wconf 75' lang='eng' dir='ltr'><em>7190BT</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 846 371 989 397; x_wconf 83' lang='eng' dir='ltr'>(AF364069)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 289 408 769 434; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 289 408 430 428; x_wconf 91' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 439 408 519 428; x_wconf 87' lang='eng' dir='ltr'><em>alamii</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 526 408 613 428; x_wconf 81' lang='eng' dir='ltr'>YA834</span> <span class='ocrx_word' id='word_1_58' title='bbox 622 408 769 434; x_wconf 88' lang='eng' dir='ltr'>(AF239242)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 267 443 782 471; baseline 0.002 -6"><span class='ocrx_word' id='word_1_59' title='bbox 267 445 408 466; x_wconf 91' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 417 445 496 466; x_wconf 87' lang='eng' dir='ltr'><em>alamii</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 504 443 622 466; x_wconf 90' lang='eng' dir='ltr'><em>GBV016T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 629 445 782 471; x_wconf 84' lang='eng' dir='ltr'>(AM931436)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 243 482 752 508; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 243 482 384 502; x_wconf 89' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 394 482 473 502; x_wconf 86' lang='eng' dir='ltr'><em>alamii</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 482 482 558 502; x_wconf 89' lang='eng' dir='ltr'><em>USDA</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 569 482 628 502; x_wconf 89' lang='eng'><em>1920</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 638 482 752 508; x_wconf 87' lang='eng' dir='ltr'>(U89823)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 269 516 691 544; baseline 0 -5"><span class='ocrx_word' id='word_1_68' title='bbox 269 519 399 539; x_wconf 84' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 409 519 480 539; x_wconf 85' lang='eng' dir='ltr'><em>sul/ae</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 491 516 573 539; x_wconf 80' lang='eng' dir='ltr'><em>|S123T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 580 519 691 544; x_wconf 92' lang='eng' dir='ltr'>(Y10170)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 309 553 939 582; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 309 556 439 576; x_wconf 84' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 448 555 584 582; x_wconf 85' lang='eng' dir='ltr'><em>indigoferae</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 594 555 688 576; x_wconf 91' lang='eng' dir='ltr'><em>CCBAU</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 700 556 724 576; x_wconf 94' lang='eng'>71</span> <span class='ocrx_word' id='word_1_76' title='bbox 731 553 788 576; x_wconf 92' lang='eng' dir='ltr'><em>O42T</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 795 556 939 582; x_wconf 86' lang='eng' dir='ltr'>(AF364068)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 325 590 922 618; baseline 0.002 -6"><span class='ocrx_word' id='word_1_78' title='bbox 325 592 455 613; x_wconf 85' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 463 592 626 618; x_wconf 87' lang='eng' dir='ltr'><em>yang/ingense</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 636 592 671 613; x_wconf 88' lang='eng' dir='ltr'><em>SH</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 682 590 771 613; x_wconf 83' lang='eng' dir='ltr'><em>22623T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 778 592 922 618; x_wconf 87' lang='eng' dir='ltr'>(AF003375)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 295 627 772 656; baseline 0 -6"><span class='ocrx_word' id='word_1_83' title='bbox 295 630 425 650; x_wconf 83' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 434 630 536 656; x_wconf 73' lang='eng' dir='ltr'><em>gall/Cum</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 546 627 652 656; x_wconf 81' lang='eng' dir='ltr'><em>R6025pT</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 659 630 772 656; x_wconf 85' lang='eng' dir='ltr'>(U86343)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 291 664 869 692; baseline 0 -5"><span class='ocrx_word' id='word_1_87' title='bbox 291 666 421 687; x_wconf 71' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 431 666 581 692; x_wconf 87' lang='eng' dir='ltr'><em>mongolense</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 592 666 666 687; x_wconf 91' lang='eng' dir='ltr'><em>USDA</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 678 664 869 692; x_wconf 80' lang='eng' dir='ltr'>1844T(U89817)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 390 701 851 729; baseline 0.002 -6"><span class='ocrx_word' id='word_1_91' title='bbox 390 703 520 724; x_wconf 86' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 530 703 672 724; x_wconf 83' lang='eng' dir='ltr'><em>hainanense</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 683 701 731 724; x_wconf 82' lang='eng' dir='ltr'><em>I66T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 738 703 851 729; x_wconf 90' lang='eng' dir='ltr'>(U71078)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 315 738 726 766; baseline 0 -5"><span class='ocrx_word' id='word_1_95' title='bbox 315 740 445 761; x_wconf 85' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 454 740 490 761; x_wconf 78' lang='eng' dir='ltr'><em>etli</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 498 740 552 761; x_wconf 89' lang='eng' dir='ltr'><em>CFN</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 563 738 605 761; x_wconf 92' lang='eng' dir='ltr'><em>42T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 613 740 726 766; x_wconf 85' lang='eng' dir='ltr'>(U28916)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 422 775 1039 803; baseline 0 -6"><span class='ocrx_word' id='word_1_100' title='bbox 422 777 552 797; x_wconf 85' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 561 777 751 803; x_wconf 81' lang='eng' dir='ltr'><em>legummosarum</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 762 777 837 797; x_wconf 90' lang='eng' dir='ltr'><em>USDA</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 845 775 918 797; x_wconf 84' lang='eng' dir='ltr'><em>2370T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 926 777 1039 803; x_wconf 84' lang='eng' dir='ltr'>(U29386)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 609 812 1080 840; baseline 0.002 -6"><span class='ocrx_word' id='word_1_105' title='bbox 609 814 739 835; x_wconf 83' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 749 814 823 840; x_wconf 87' lang='eng' dir='ltr'><em>tropici</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 831 814 893 835; x_wconf 94' lang='eng' dir='ltr'><em>CIAT</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 903 812 960 835; x_wconf 79' lang='eng' dir='ltr'><em>899T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 967 814 1080 840; x_wconf 85' lang='eng' dir='ltr'>(U89832)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 502 849 991 877; baseline 0 -6"><span class='ocrx_word' id='word_1_110' title='bbox 502 851 632 871; x_wconf 83' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 641 851 759 871; x_wconf 78' lang='eng' dir='ltr'><em>lusitanum</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 770 851 796 871; x_wconf 92' lang='eng' dir='ltr'>P1</span> <span class='ocrx_word' id='word_1_113' title='bbox 803 849 838 871; x_wconf 92' lang='eng' dir='ltr'><em>-7T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 845 851 991 877; x_wconf 87' lang='eng' dir='ltr'>(AY738130)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 502 885 1110 914; baseline 0 -6"><span class='ocrx_word' id='word_1_115' title='bbox 502 888 632 908; x_wconf 84' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 641 888 777 914; x_wconf 86' lang='eng' dir='ltr'><em>rhizogenes</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 784 887 859 908; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 871 888 878 908; x_wconf 96' lang='eng'>1</span> <span class='ocrx_word' id='word_1_119' title='bbox 887 885 957 908; x_wconf 90' lang='eng' dir='ltr'><em>1325T</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 965 888 1110 913; x_wconf 87' lang='eng' dir='ltr'>(AY945955)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 433 922 971 951; baseline 0 -6"><span class='ocrx_word' id='word_1_121' title='bbox 433 924 520 945; x_wconf 86' lang='eng' dir='ltr'><em>Ensifer</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 527 925 648 945; x_wconf 79' lang='eng' dir='ltr'><em>kostiensis</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 658 924 715 945; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 727 922 813 945; x_wconf 77' lang='eng' dir='ltr'><em>19227T</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 821 925 971 951; x_wconf 88' lang='eng' dir='ltr'>(AM181748)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 426 959 1047 987; baseline 0 -5"><span class='ocrx_word' id='word_1_126' title='bbox 426 961 514 982; x_wconf 84' lang='eng' dir='ltr'><em>Ensifer</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 520 962 693 982; x_wconf 87' lang='eng' dir='ltr'><em>kummerowiae</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 703 961 797 982; x_wconf 88' lang='eng' dir='ltr'>CCBAU</span> <span class='ocrx_word' id='word_1_129' title='bbox 809 959 896 982; x_wconf 92' lang='eng' dir='ltr'><em>71714T</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 904 962 1047 987; x_wconf 86' lang='eng' dir='ltr'>(AF364067)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 489 996 1134 1024; baseline 0 -5"><span class='ocrx_word' id='word_1_131' title='bbox 489 998 662 1019; x_wconf 86' lang='eng' dir='ltr'><em>Sinorhizobium</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 672 998 824 1019; x_wconf 83' lang='eng' dir='ltr'><em>americanum</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 834 998 914 1019; x_wconf 93' lang='eng' dir='ltr'><em>CFNEI</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 927 996 982 1019; x_wconf 81' lang='eng' dir='ltr'><em>156T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 990 998 1134 1024; x_wconf 81' lang='eng' dir='ltr'>(AF506513)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 414 1033 836 1061; baseline 0 -6"><span class='ocrx_word' id='word_1_136' title='bbox 414 1035 502 1056; x_wconf 85' lang='eng' dir='ltr'><em>Ensifer</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 509 1035 569 1056; x_wconf 85' lang='eng' dir='ltr'><em>fredii</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 578 1035 635 1056; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 645 1033 718 1056; x_wconf 77' lang='eng' dir='ltr'><em>6217T</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 725 1035 836 1061; x_wconf 88' lang='eng' dir='ltr'>(X67231)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 481 1070 1102 1099; baseline 0 -6"><span class='ocrx_word' id='word_1_141' title='bbox 481 1072 655 1093; x_wconf 79' lang='eng' dir='ltr'><em>Ochrobaotrum</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 664 1072 765 1099; x_wconf 80' lang='eng' dir='ltr'><em>anthropi</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 772 1072 847 1093; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 856 1070 945 1093; x_wconf 78' lang='eng' dir='ltr'><em>49188T</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 955 1072 1102 1099; x_wconf 92' lang='eng' dir='ltr'>(CP000758)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 8 734 1088">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 8 734 1075">
+     <span class='ocr_line' id='line_1_31' title="bbox 191 8 585 42; baseline 0 1057"><span class='ocrx_word' id='word_1_146' title='bbox 191 8 585 42; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 133 42 734 60; baseline 0 1039"><span class='ocrx_word' id='word_1_147' title='bbox 133 42 734 60; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 16 60 561 116; baseline 0 983"><span class='ocrx_word' id='word_1_148' title='bbox 16 60 561 116; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 16 116 547 281; baseline 0 -37"><span class='ocrx_word' id='word_1_149' title='bbox 16 116 547 281; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 17 281 416 300; baseline 0 799"><span class='ocrx_word' id='word_1_150' title='bbox 17 281 416 300; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 17 300 414 318; baseline 0 781"><span class='ocrx_word' id='word_1_151' title='bbox 17 300 414 318; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 17 318 359 337; baseline 0 762"><span class='ocrx_word' id='word_1_152' title='bbox 17 318 359 337; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 16 337 359 374; baseline 0 725"><span class='ocrx_word' id='word_1_153' title='bbox 16 337 359 374; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 16 374 366 411; baseline 0 0"><span class='ocrx_word' id='word_1_154' title='bbox 16 374 366 411; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 0 411 287 485; baseline 0 -56"><span class='ocrx_word' id='word_1_155' title='bbox 0 411 287 485; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 0 485 243 521; baseline 0 578"><span class='ocrx_word' id='word_1_156' title='bbox 0 485 243 521; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 0 521 269 558; baseline 0 541"><span class='ocrx_word' id='word_1_157' title='bbox 0 521 269 558; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 0 558 322 613; baseline 0 0"><span class='ocrx_word' id='word_1_158' title='bbox 0 558 322 613; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 0 613 295 632; baseline 0 467"><span class='ocrx_word' id='word_1_159' title='bbox 0 613 295 632; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 0 632 289 670; baseline 0 429"><span class='ocrx_word' id='word_1_160' title='bbox 0 632 289 670; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 0 670 386 724; baseline 0 0"><span class='ocrx_word' id='word_1_161' title='bbox 0 670 386 724; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 0 724 315 743; baseline 0 356"><span class='ocrx_word' id='word_1_162' title='bbox 0 724 315 743; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 0 743 315 780; baseline 0 319"><span class='ocrx_word' id='word_1_163' title='bbox 0 743 315 780; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 0 780 422 817; baseline 0 282"><span class='ocrx_word' id='word_1_164' title='bbox 0 780 422 817; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 0 817 607 835; baseline 0 264"><span class='ocrx_word' id='word_1_165' title='bbox 0 817 607 835; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 0 835 502 871; baseline 0 228"><span class='ocrx_word' id='word_1_166' title='bbox 0 835 502 871; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 0 871 497 908; baseline 0 0"><span class='ocrx_word' id='word_1_167' title='bbox 0 871 497 908; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 0 908 433 945; baseline 0 154"><span class='ocrx_word' id='word_1_168' title='bbox 0 908 433 945; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 0 945 426 965; baseline 0 134"><span class='ocrx_word' id='word_1_169' title='bbox 0 945 426 965; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 0 965 426 1001; baseline 0 98"><span class='ocrx_word' id='word_1_170' title='bbox 0 965 426 1001; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 0 1001 485 1019; baseline 0 80"><span class='ocrx_word' id='word_1_171' title='bbox 0 1001 485 1019; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 0 1019 414 1075; baseline 0 24"><span class='ocrx_word' id='word_1_172' title='bbox 0 1019 414 1075; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 263 86 265 167">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 263 86 265 167">
+     <span class='ocr_line' id='line_1_58' title="bbox 263 86 265 167; baseline 0 932"><span class='ocrx_word' id='word_1_173' title='bbox 263 86 265 167; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000547-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000547-0-000.pbm.png
new file mode 100644
index 00000000..1b4f1d33
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000547-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000547-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000547-0-000.pbm.png.hocr
new file mode 100644
index 00000000..0ef94788
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000547-0-000.pbm.png.hocr
@@ -0,0 +1,285 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000547-0-000.pbm.png"; bbox 0 0 993 1233; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 31 22 70 39">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 31 22 70 39">
+     <span class='ocr_line' id='line_1_1' title="bbox 31 22 70 39; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 31 22 70 39; x_wconf 87' lang='eng'>0.01</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 840 504 1221">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 840 504 1221">
+     <span class='ocr_line' id='line_1_2' title="bbox 0 840 91 885; baseline 0 348"><span class='ocrx_word' id='word_1_2' title='bbox 0 840 91 885; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 0 885 91 965; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 0 885 91 965; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 0 965 7 1004; baseline 0 229"><span class='ocrx_word' id='word_1_4' title='bbox 0 965 7 1004; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 0 1004 7 1045; baseline 0 188"><span class='ocrx_word' id='word_1_5' title='bbox 0 1004 7 1045; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 0 1045 7 1085; baseline 0 148"><span class='ocrx_word' id='word_1_6' title='bbox 0 1045 7 1085; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 0 1085 7 1125; baseline 0 108"><span class='ocrx_word' id='word_1_7' title='bbox 0 1085 7 1125; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 0 1125 504 1221; baseline 0 -22"><span class='ocrx_word' id='word_1_8' title='bbox 0 1125 504 1221; x_wconf 95' lang='eng' dir='ltr'>    </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 87 537 91 1155">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 87 537 91 1155">
+     <span class='ocr_line' id='line_1_9' title="bbox 87 537 91 1155; baseline 0 78"><span class='ocrx_word' id='word_1_9' title='bbox 87 537 91 1155; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 88 1135 205 1178">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 88 1135 205 1178">
+     <span class='ocr_line' id='line_1_10' title="bbox 88 1135 205 1178; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 88 1135 205 1178; x_wconf 83' lang='eng' dir='ltr'>-l_—</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 80 1161 593 1192">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 80 1162 593 1191">
+     <span class='ocr_line' id='line_1_11' title="bbox 80 1162 593 1191; baseline 0 -5"><span class='ocrx_word' id='word_1_11' title='bbox 80 1162 103 1179; x_wconf 72' lang='eng'>50</span> <span class='ocrx_word' id='word_1_12' title='bbox 170 1166 192 1186; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_13' title='bbox 204 1166 292 1186; x_wconf 78' lang='eng' dir='ltr'>stutzeri</span> <span class='ocrx_word' id='word_1_14' title='bbox 300 1166 378 1186; x_wconf 91' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_15' title='bbox 390 1164 473 1186; x_wconf 81' lang='eng' dir='ltr'>11256T</span> <span class='ocrx_word' id='word_1_16' title='bbox 483 1166 593 1191; x_wconf 86' lang='eng' dir='ltr'>(U26262)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 240 2 275 19">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 240 2 275 19">
+     <span class='ocr_line' id='line_1_12' title="bbox 240 2 275 19; baseline 0 0"><span class='ocrx_word' id='word_1_17' title='bbox 240 2 275 19; x_wconf 88' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 167 1 945 1153">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 291 1 746 30">
+     <span class='ocr_line' id='line_1_13' title="bbox 291 1 746 30; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 291 4 327 24; x_wconf 95' lang='eng' dir='ltr'><strong><em>-P.</em></strong></span> <span class='ocrx_word' id='word_1_19' title='bbox 337 4 530 30; x_wconf 84' lang='eng' dir='ltr'>psychrotolerans</span> <span class='ocrx_word' id='word_1_20' title='bbox 540 1 599 24; x_wconf 79' lang='eng' dir='ltr'>C36T</span> <span class='ocrx_word' id='word_1_21' title='bbox 609 4 746 29; x_wconf 85' lang='eng' dir='ltr'>(AJ575816)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 291 41 747 69">
+     <span class='ocr_line' id='line_1_14' title="bbox 291 41 747 69; baseline 0 -5"><span class='ocrx_word' id='word_1_22' title='bbox 291 53 318 56; x_wconf 96' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_23' title='bbox 326 44 348 64; x_wconf 90' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_24' title='bbox 360 44 492 64; x_wconf 81' lang='eng' dir='ltr'>oleovorans</span> <span class='ocrx_word' id='word_1_25' title='bbox 502 44 547 64; x_wconf 94' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_26' title='bbox 559 41 628 64; x_wconf 79' lang='eng' dir='ltr'>1508T</span> <span class='ocrx_word' id='word_1_27' title='bbox 637 44 747 69; x_wconf 90' lang='eng' dir='ltr'>(D84018)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 289 82 761 109">
+     <span class='ocr_line' id='line_1_15' title="bbox 289 82 761 109; baseline 0 -5"><span class='ocrx_word' id='word_1_28' title='bbox 289 84 311 104; x_wconf 96' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_29' title='bbox 323 84 501 104; x_wconf 86' lang='eng' dir='ltr'>tuomuerensis</span> <span class='ocrx_word' id='word_1_30' title='bbox 510 82 604 104; x_wconf 81' lang='eng' dir='ltr'>78-123T</span> <span class='ocrx_word' id='word_1_31' title='bbox 613 84 761 109; x_wconf 85' lang='eng' dir='ltr'>(D0868767)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 167 121 637 149">
+     <span class='ocr_line' id='line_1_16' title="bbox 167 121 637 149; baseline 0 -5"><span class='ocrx_word' id='word_1_32' title='bbox 167 132 190 148; x_wconf 82' lang='eng'>93</span> <span class='ocrx_word' id='word_1_33' title='bbox 211 124 233 144; x_wconf 92' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_34' title='bbox 245 124 363 149; x_wconf 78' lang='eng' dir='ltr'>alcaliphila</span> <span class='ocrx_word' id='word_1_35' title='bbox 371 121 637 149; x_wconf 60' lang='eng' dir='ltr'>AL15—21T(ABO30583)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 234 162 699 190">
+     <span class='ocr_line' id='line_1_17' title="bbox 234 162 699 190; baseline 0 -6"><span class='ocrx_word' id='word_1_36' title='bbox 234 164 255 184; x_wconf 86' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_37' title='bbox 267 164 399 185; x_wconf 80' lang='eng' dir='ltr'>mendocina</span> <span class='ocrx_word' id='word_1_38' title='bbox 407 164 480 185; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_39' title='bbox 490 162 576 185; x_wconf 90' lang='eng' dir='ltr'>25411T</span> <span class='ocrx_word' id='word_1_40' title='bbox 586 164 699 190; x_wconf 84' lang='eng' dir='ltr'>(M59154)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 198 202 751 230">
+     <span class='ocr_line' id='line_1_18' title="bbox 198 202 751 230; baseline 0 -6"><span class='ocrx_word' id='word_1_41' title='bbox 198 204 220 224; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_42' title='bbox 231 204 456 230; x_wconf 82' lang='eng' dir='ltr'>pseudoalcaligenes</span> <span class='ocrx_word' id='word_1_43' title='bbox 465 204 519 224; x_wconf 89' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_44' title='bbox 529 202 599 224; x_wconf 80' lang='eng' dir='ltr'>5968T</span> <span class='ocrx_word' id='word_1_45' title='bbox 609 204 751 229; x_wconf 82' lang='eng' dir='ltr'>(AB021379)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 268 242 652 270">
+     <span class='ocr_line' id='line_1_19' title="bbox 268 242 652 270; baseline -0.003 -5"><span class='ocrx_word' id='word_1_46' title='bbox 268 244 289 264; x_wconf 92' lang='eng' dir='ltr'><strong><em>P.</em></strong></span> <span class='ocrx_word' id='word_1_47' title='bbox 301 244 387 270; x_wconf 82' lang='eng' dir='ltr'>segetis</span> <span class='ocrx_word' id='word_1_48' title='bbox 396 242 502 265; x_wconf 82' lang='eng' dir='ltr'>FR1439T</span> <span class='ocrx_word' id='word_1_49' title='bbox 509 244 652 270; x_wconf 86' lang='eng' dir='ltr'>(AY770691)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 261 282 655 310">
+     <span class='ocr_line' id='line_1_20' title="bbox 261 282 655 310; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 261 284 283 304; x_wconf 94' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_51' title='bbox 294 284 380 305; x_wconf 85' lang='eng' dir='ltr'>borbari</span> <span class='ocrx_word' id='word_1_52' title='bbox 388 282 655 310; x_wconf 69' lang='eng' dir='ltr'>R—20821T(AM114527)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 321 322 844 350">
+     <span class='ocr_line' id='line_1_21' title="bbox 321 322 844 350; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 321 325 343 344; x_wconf 95' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_54' title='bbox 355 325 524 350; x_wconf 86' lang='eng' dir='ltr'>anguilliseptica</span> <span class='ocrx_word' id='word_1_55' title='bbox 534 324 612 345; x_wconf 88' lang='eng' dir='ltr'>NCMB</span> <span class='ocrx_word' id='word_1_56' title='bbox 623 322 692 345; x_wconf 78' lang='eng' dir='ltr'>1949T</span> <span class='ocrx_word' id='word_1_57' title='bbox 702 325 844 350; x_wconf 79' lang='eng' dir='ltr'>(ABOZ1376)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 340 362 772 390">
+     <span class='ocr_line' id='line_1_22' title="bbox 340 362 772 390; baseline 0 -6"><span class='ocrx_word' id='word_1_58' title='bbox 340 364 362 384; x_wconf 97' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_59' title='bbox 373 365 454 390; x_wconf 89' lang='eng' dir='ltr'><em>guinea</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 464 364 519 385; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_61' title='bbox 530 362 615 385; x_wconf 91' lang='eng' dir='ltr'>24017T</span> <span class='ocrx_word' id='word_1_62' title='bbox 625 364 772 390; x_wconf 86' lang='eng' dir='ltr'>(AM491811)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 249 402 686 430">
+     <span class='ocr_line' id='line_1_23' title="bbox 249 402 686 430; baseline -0.002 -5"><span class='ocrx_word' id='word_1_63' title='bbox 249 403 272 420; x_wconf 82' lang='eng'>99</span> <span class='ocrx_word' id='word_1_64' title='bbox 332 405 354 425; x_wconf 92' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_65' title='bbox 364 405 408 430; x_wconf 80' lang='eng' dir='ltr'><em>peli</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 417 402 530 425; x_wconf 74' lang='eng' dir='ltr'>R-20805T</span> <span class='ocrx_word' id='word_1_67' title='bbox 540 405 686 430; x_wconf 86' lang='eng' dir='ltr'>(AM114534)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 256 442 604 470">
+     <span class='ocr_line' id='line_1_24' title="bbox 256 442 604 470; baseline 0.003 -6"><span class='ocrx_word' id='word_1_68' title='bbox 256 445 277 464; x_wconf 90' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_69' title='bbox 289 445 417 465; x_wconf 84' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_70' title='bbox 427 442 484 465; x_wconf 81' lang='eng' dir='ltr'>B62T</span> <span class='ocrx_word' id='word_1_71' title='bbox 494 445 604 470; x_wconf 82' lang='eng' dir='ltr'>(U01916)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 315 482 723 510">
+     <span class='ocr_line' id='line_1_25' title="bbox 315 482 723 510; baseline 0 -5"><span class='ocrx_word' id='word_1_72' title='bbox 315 485 336 505; x_wconf 95' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_73' title='bbox 348 485 467 505; x_wconf 84' lang='eng' dir='ltr'>straminea</span> <span class='ocrx_word' id='word_1_74' title='bbox 477 485 522 505; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_75' title='bbox 534 482 603 505; x_wconf 81' lang='eng' dir='ltr'>1598T</span> <span class='ocrx_word' id='word_1_76' title='bbox 612 485 723 510; x_wconf 84' lang='eng' dir='ltr'>(D84023)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 232 521 716 550">
+     <span class='ocr_line' id='line_1_26' title="bbox 232 521 716 550; baseline 0 -5"><span class='ocrx_word' id='word_1_77' title='bbox 232 521 255 538; x_wconf 79' lang='eng'>99</span> <span class='ocrx_word' id='word_1_78' title='bbox 281 525 303 545; x_wconf 91' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_79' title='bbox 315 525 476 550; x_wconf 80' lang='eng' dir='ltr'>argentinensis</span> <span class='ocrx_word' id='word_1_80' title='bbox 485 522 564 545; x_wconf 78' lang='eng' dir='ltr'>CH01T</span> <span class='ocrx_word' id='word_1_81' title='bbox 574 525 716 550; x_wconf 87' lang='eng' dir='ltr'>(AY691188)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 292 562 848 591">
+     <span class='ocr_line' id='line_1_27' title="bbox 292 562 848 591; baseline -0.004 -4"><span class='ocrx_word' id='word_1_82' title='bbox 292 571 315 587; x_wconf 83' lang='eng'>99</span> <span class='ocrx_word' id='word_1_83' title='bbox 434 565 456 585; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_84' title='bbox 468 565 597 591; x_wconf 78' lang='eng' dir='ltr'>azotiﬁgens</span> <span class='ocrx_word' id='word_1_85' title='bbox 606 562 696 585; x_wconf 81' lang='eng' dir='ltr'>6H33bT</span> <span class='ocrx_word' id='word_1_86' title='bbox 706 565 848 590; x_wconf 86' lang='eng' dir='ltr'>(AB189452)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 468 602 816 630">
+     <span class='ocr_line' id='line_1_28' title="bbox 468 602 816 630; baseline 0 -5"><span class='ocrx_word' id='word_1_87' title='bbox 468 605 490 625; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_88' title='bbox 502 605 571 625; x_wconf 84' lang='eng' dir='ltr'>ind/ca</span> <span class='ocrx_word' id='word_1_89' title='bbox 582 602 816 630; x_wconf 61' lang='eng' dir='ltr'>|MT37T(AF302795)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 508 643 944 670">
+     <span class='ocr_line' id='line_1_29' title="bbox 508 643 944 670; baseline 0 -5"><span class='ocrx_word' id='word_1_90' title='bbox 508 645 530 665; x_wconf 92' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_91' title='bbox 542 645 723 665; x_wconf 80' lang='eng' dir='ltr'>thermotolerans</span> <span class='ocrx_word' id='word_1_92' title='bbox 732 643 799 665; x_wconf 78' lang='eng' dir='ltr'>CM3T</span> <span class='ocrx_word' id='word_1_93' title='bbox 806 645 871 670; x_wconf 81' lang='eng' dir='ltr'>(AJ31</span> <span class='ocrx_word' id='word_1_94' title='bbox 879 645 944 670; x_wconf 85' lang='eng'>1980)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 368 683 747 710">
+     <span class='ocr_line' id='line_1_30' title="bbox 368 683 747 710; baseline 0 -5"><span class='ocrx_word' id='word_1_95' title='bbox 368 685 390 705; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_96' title='bbox 402 685 511 705; x_wconf 80' lang='eng' dir='ltr'>ba/earica</span> <span class='ocrx_word' id='word_1_97' title='bbox 520 683 627 705; x_wconf 78' lang='eng' dir='ltr'>SP1402T</span> <span class='ocrx_word' id='word_1_98' title='bbox 637 685 747 710; x_wconf 88' lang='eng' dir='ltr'>(U26418)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 295 723 812 751">
+     <span class='ocr_line' id='line_1_31' title="bbox 295 723 812 751; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 295 725 316 745; x_wconf 90' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_100' title='bbox 328 725 484 746; x_wconf 84' lang='eng' dir='ltr'>resinovorans</span> <span class='ocrx_word' id='word_1_101' title='bbox 491 725 564 746; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_102' title='bbox 576 723 660 745; x_wconf 75' lang='eng' dir='ltr'>14235T</span> <span class='ocrx_word' id='word_1_103' title='bbox 670 725 812 751; x_wconf 82' lang='eng' dir='ltr'>(ABOZ1373)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 275 763 705 791">
+     <span class='ocr_line' id='line_1_32' title="bbox 275 763 705 791; baseline 0 -6"><span class='ocrx_word' id='word_1_104' title='bbox 275 766 296 785; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_105' title='bbox 308 766 441 791; x_wconf 86' lang='eng' dir='ltr'><em>aeruginosa</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 452 765 507 785; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_107' title='bbox 520 763 588 785; x_wconf 87' lang='eng' dir='ltr'>1242T</span> <span class='ocrx_word' id='word_1_108' title='bbox 598 766 705 791; x_wconf 91' lang='eng' dir='ltr'>(Z76651)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 255 803 673 831">
+     <span class='ocr_line' id='line_1_33' title="bbox 255 803 673 831; baseline 0 -5"><span class='ocrx_word' id='word_1_109' title='bbox 255 806 276 826; x_wconf 64' lang='eng' dir='ltr'><strong><em>P,</em></strong></span> <span class='ocrx_word' id='word_1_110' title='bbox 288 806 364 826; x_wconf 79' lang='eng' dir='ltr'>otitidis</span> <span class='ocrx_word' id='word_1_111' title='bbox 374 803 521 826; x_wconf 77' lang='eng' dir='ltr'>MCC10330T</span> <span class='ocrx_word' id='word_1_112' title='bbox 530 806 673 831; x_wconf 83' lang='eng' dir='ltr'>(AY953147)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 237 843 677 871">
+     <span class='ocr_line' id='line_1_34' title="bbox 237 843 677 871; baseline 0 -5"><span class='ocrx_word' id='word_1_113' title='bbox 237 846 259 865; x_wconf 94' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_114' title='bbox 271 846 406 871; x_wconf 86' lang='eng' dir='ltr'>alcaligenes</span> <span class='ocrx_word' id='word_1_115' title='bbox 416 846 461 866; x_wconf 92' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_116' title='bbox 474 843 557 866; x_wconf 91' lang='eng' dir='ltr'>12411T</span> <span class='ocrx_word' id='word_1_117' title='bbox 566 846 677 871; x_wconf 85' lang='eng' dir='ltr'>(D84006)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 282 883 809 911">
+     <span class='ocr_line' id='line_1_35' title="bbox 282 883 809 911; baseline 0 -6"><span class='ocrx_word' id='word_1_118' title='bbox 282 891 305 908; x_wconf 78' lang='eng'>78</span> <span class='ocrx_word' id='word_1_119' title='bbox 359 886 380 905; x_wconf 89' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_120' title='bbox 392 886 556 906; x_wconf 86' lang='eng' dir='ltr'>nitroreducens</span> <span class='ocrx_word' id='word_1_121' title='bbox 567 886 611 905; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_122' title='bbox 623 883 809 911; x_wconf 78' lang='eng' dir='ltr'>1439T(D84021)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 359 923 906 951">
+     <span class='ocr_line' id='line_1_36' title="bbox 359 923 906 951; baseline 0 -5"><span class='ocrx_word' id='word_1_123' title='bbox 359 926 381 946; x_wconf 91' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_124' title='bbox 392 926 596 946; x_wconf 83' lang='eng' dir='ltr'>multiresinivorans</span> <span class='ocrx_word' id='word_1_125' title='bbox 604 925 677 946; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_126' title='bbox 687 923 788 946; x_wconf 79' lang='eng' dir='ltr'>700690T</span> <span class='ocrx_word' id='word_1_127' title='bbox 797 926 906 951; x_wconf 87' lang='eng' dir='ltr'>(X96787)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 390 964 787 991">
+     <span class='ocr_line' id='line_1_37' title="bbox 390 964 787 991; baseline 0 -5"><span class='ocrx_word' id='word_1_128' title='bbox 390 966 412 986; x_wconf 92' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_129' title='bbox 419 966 534 991; x_wconf 79' lang='eng' dir='ltr'>jinjuensis</span> <span class='ocrx_word' id='word_1_130' title='bbox 544 966 587 986; x_wconf 88' lang='eng' dir='ltr'>Pss</span> <span class='ocrx_word' id='word_1_131' title='bbox 597 964 637 986; x_wconf 76' lang='eng' dir='ltr'>26T</span> <span class='ocrx_word' id='word_1_132' title='bbox 646 966 787 991; x_wconf 87' lang='eng' dir='ltr'>(AF468448)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 353 1003 749 1031">
+     <span class='ocr_line' id='line_1_38' title="bbox 353 1003 749 1031; baseline 0 -5"><span class='ocrx_word' id='word_1_133' title='bbox 353 1006 375 1026; x_wconf 72' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_134' title='bbox 386 1006 536 1026; x_wconf 83' lang='eng' dir='ltr'>knackmussii</span> <span class='ocrx_word' id='word_1_135' title='bbox 544 1003 601 1026; x_wconf 80' lang='eng' dir='ltr'>B13T</span> <span class='ocrx_word' id='word_1_136' title='bbox 609 1006 749 1031; x_wconf 82' lang='eng' dir='ltr'>(AF039489)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 319 1043 860 1111">
+     <span class='ocr_line' id='line_1_39' title="bbox 368 1043 860 1071; baseline 0 -5"><span class='ocrx_word' id='word_1_137' title='bbox 368 1046 389 1066; x_wconf 91' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_138' title='bbox 401 1046 535 1066; x_wconf 83' lang='eng' dir='ltr'>citrone/lolis</span> <span class='ocrx_word' id='word_1_139' title='bbox 543 1046 616 1066; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_140' title='bbox 628 1043 711 1066; x_wconf 83' lang='eng' dir='ltr'>13674T</span> <span class='ocrx_word' id='word_1_141' title='bbox 719 1046 860 1071; x_wconf 83' lang='eng' dir='ltr'>(ABOZ1396)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 319 1083 793 1111; baseline 0 -5"><span class='ocrx_word' id='word_1_142' title='bbox 319 1084 342 1100; x_wconf 78' lang='eng'>93</span> <span class='ocrx_word' id='word_1_143' title='bbox 389 1086 410 1106; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_144' title='bbox 422 1086 542 1106; x_wconf 88' lang='eng' dir='ltr'>delhiensis</span> <span class='ocrx_word' id='word_1_145' title='bbox 552 1083 793 1111; x_wconf 78' lang='eng' dir='ltr'>RLD—1T(DQ339153)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 216 1124 716 1152">
+     <span class='ocr_line' id='line_1_41' title="bbox 216 1124 716 1152; baseline 0 -6"><span class='ocrx_word' id='word_1_146' title='bbox 216 1126 237 1146; x_wconf 91' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_147' title='bbox 248 1127 413 1147; x_wconf 86' lang='eng' dir='ltr'>xanthoman&#39;na</span> <span class='ocrx_word' id='word_1_148' title='bbox 424 1126 483 1146; x_wconf 92' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_149' title='bbox 496 1124 564 1146; x_wconf 90' lang='eng' dir='ltr'>1447T</span> <span class='ocrx_word' id='word_1_150' title='bbox 574 1126 716 1152; x_wconf 84' lang='eng' dir='ltr'>(AB176954)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 289 13 291 56">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 289 13 291 56">
+     <span class='ocr_line' id='line_1_42' title="bbox 289 13 291 56; baseline 0 1177"><span class='ocrx_word' id='word_1_151' title='bbox 289 13 291 56; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 104 40 127 56">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 104 40 127 56">
+     <span class='ocr_line' id='line_1_43' title="bbox 104 40 127 56; baseline 0 0"><span class='ocrx_word' id='word_1_152' title='bbox 104 40 127 56; x_wconf 91' lang='eng'>42</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 107 33 336 536">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 108 33 336 536">
+     <span class='ocr_line' id='line_1_44' title="bbox 115 33 289 83; baseline 0 0"><span class='ocrx_word' id='word_1_153' title='bbox 115 33 289 83; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 115 83 284 122; baseline 0 0"><span class='ocrx_word' id='word_1_154' title='bbox 115 83 284 122; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 108 122 231 204; baseline 0 0"><span class='ocrx_word' id='word_1_155' title='bbox 108 122 231 204; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 108 204 198 244; baseline 0 989"><span class='ocrx_word' id='word_1_156' title='bbox 108 204 198 244; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 108 244 261 324; baseline 0 0"><span class='ocrx_word' id='word_1_157' title='bbox 108 244 261 324; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 115 324 336 428; baseline 0 0"><span class='ocrx_word' id='word_1_158' title='bbox 115 324 336 428; x_wconf 95' lang='eng' dir='ltr'>    </span> <span class='ocrx_word' id='word_1_159' title='bbox 272 395 324 428; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 128 428 310 507; baseline 0 0"><span class='ocrx_word' id='word_1_160' title='bbox 128 428 310 507; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 128 507 232 536; baseline 0 697"><span class='ocrx_word' id='word_1_161' title='bbox 128 507 232 536; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 110 574 504 1097">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 111 574 504 1097">
+     <span class='ocr_line' id='line_1_52' title="bbox 229 574 434 605; baseline 0 -10"><span class='ocrx_word' id='word_1_162' title='bbox 229 574 434 605; x_wconf 95' lang='eng' dir='ltr'>  </span> <span class='ocrx_word' id='word_1_163' title='bbox 315 574 426 595; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 189 605 468 644; baseline 0 589"><span class='ocrx_word' id='word_1_164' title='bbox 189 605 468 644; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 147 644 504 670; baseline 0 563"><span class='ocrx_word' id='word_1_165' title='bbox 147 644 504 670; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 130 670 368 723; baseline 0 -14"><span class='ocrx_word' id='word_1_166' title='bbox 130 670 368 723; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 130 723 293 749; baseline 0 484"><span class='ocrx_word' id='word_1_167' title='bbox 130 723 293 749; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 130 749 275 805; baseline 0 -16"><span class='ocrx_word' id='word_1_168' title='bbox 130 749 275 805; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 130 805 245 829; baseline 0 404"><span class='ocrx_word' id='word_1_169' title='bbox 130 805 245 829; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 111 829 237 845; baseline 0 388"><span class='ocrx_word' id='word_1_170' title='bbox 111 829 237 845; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 111 845 233 885; baseline 0 348"><span class='ocrx_word' id='word_1_171' title='bbox 111 845 233 885; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 111 885 351 925; baseline 0 -9"><span class='ocrx_word' id='word_1_172' title='bbox 111 885 351 925; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 130 925 387 989; baseline 0 0"><span class='ocrx_word' id='word_1_173' title='bbox 130 925 387 989; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 278 1045 388 1097; baseline 0 0"><span class='ocrx_word' id='word_1_174' title='bbox 278 1045 363 1085; x_wconf 95' lang='eng' dir='ltr'>  </span> <span class='ocrx_word' id='word_1_175' title='bbox 342 1076 388 1097; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 111 218 115 853">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 111 218 115 853">
+     <span class='ocr_line' id='line_1_64' title="bbox 111 218 115 853; baseline 0 380"><span class='ocrx_word' id='word_1_176' title='bbox 111 218 115 853; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 262 1018 285 1035">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 262 1018 285 1035">
+     <span class='ocr_line' id='line_1_65' title="bbox 262 1018 285 1035; baseline 0 0"><span class='ocrx_word' id='word_1_177' title='bbox 262 1018 285 1035; x_wconf 80' lang='eng'>37</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 507 1203 993 1232">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 507 1204 993 1232">
+     <span class='ocr_line' id='line_1_66' title="bbox 507 1204 993 1232; baseline 0 -6"><span class='ocrx_word' id='word_1_178' title='bbox 507 1206 529 1226; x_wconf 90' lang='eng' dir='ltr'><strong><em>C.</em></strong></span> <span class='ocrx_word' id='word_1_179' title='bbox 541 1206 684 1226; x_wconf 74' lang='eng' dir='ltr'>ostraviensis</span> <span class='ocrx_word' id='word_1_180' title='bbox 694 1206 750 1226; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_181' title='bbox 762 1204 845 1226; x_wconf 75' lang='eng' dir='ltr'>19434T</span> <span class='ocrx_word' id='word_1_182' title='bbox 855 1206 993 1232; x_wconf 83' lang='eng' dir='ltr'>(AJ493583)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000588-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000588-0-000.pbm.png
new file mode 100644
index 00000000..ffd956aa
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000588-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000588-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000588-0-000.pbm.png.hocr
new file mode 100644
index 00000000..993f084c
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000588-0-000.pbm.png.hocr
@@ -0,0 +1,200 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000588-0-000.pbm.png"; bbox 0 0 1302 603; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 17 3 467">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 0 17 3 467">
+     <span class='ocr_line' id='line_1_1' title="bbox 0 17 3 467; baseline 0 136"><span class='ocrx_word' id='word_1_1' title='bbox 0 17 3 467; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 244 327 268 344">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 244 327 268 344">
+     <span class='ocr_line' id='line_1_2' title="bbox 244 327 268 344; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 244 327 268 344; x_wconf 86' lang='eng'>76</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 347 136 349 214">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 347 136 349 214">
+     <span class='ocr_line' id='line_1_3' title="bbox 347 136 349 214; baseline 0 389"><span class='ocrx_word' id='word_1_3' title='bbox 347 136 349 214; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 272 236 310 238">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 272 236 310 238">
+     <span class='ocr_line' id='line_1_4' title="bbox 272 236 310 238; baseline 0 365"><span class='ocrx_word' id='word_1_4' title='bbox 272 236 310 238; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 308 176 310 292">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 308 176 310 292">
+     <span class='ocr_line' id='line_1_5' title="bbox 308 176 310 292; baseline 0 311"><span class='ocrx_word' id='word_1_5' title='bbox 308 176 310 292; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 363 0 840 25">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 363 0 840 25">
+     <span class='ocr_line' id='line_1_6' title="bbox 363 0 840 25; baseline 0 -5"><span class='ocrx_word' id='word_1_6' title='bbox 363 3 511 20; x_wconf 84' lang='eng' dir='ltr'><em>Thermomonas</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 519 2 573 20; x_wconf 84' lang='eng' dir='ltr'><em>fusca</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 582 2 630 20; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 639 0 713 20; x_wconf 77' lang='eng' dir='ltr'><em>21737T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 721 3 840 25; x_wconf 78' lang='eng' dir='ltr'><em>(AJ519986)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 382 113 406 130">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 382 113 406 130">
+     <span class='ocr_line' id='line_1_7' title="bbox 382 113 406 130; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 382 113 406 130; x_wconf 83' lang='eng'><em>83</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 409 101 411 172">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 409 101 411 172">
+     <span class='ocr_line' id='line_1_8' title="bbox 409 101 411 172; baseline 0 431"><span class='ocrx_word' id='word_1_12' title='bbox 409 101 411 172; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 504 30 1088 136">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 504 30 1088 136">
+     <span class='ocr_line' id='line_1_9' title="bbox 524 30 1088 54; baseline 0 -5"><span class='ocrx_word' id='word_1_13' title='bbox 524 32 535 49; x_wconf 90' lang='eng'><strong>5</strong></span> <span class='ocrx_word' id='word_1_14' title='bbox 569 32 685 54; x_wconf 82' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 690 37 805 54; x_wconf 86' lang='eng' dir='ltr'><em>gummosus</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 811 32 874 50; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 883 30 956 50; x_wconf 77' lang='eng' dir='ltr'><em>29489T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 965 32 1088 54; x_wconf 83' lang='eng' dir='ltr'><em>(AB161361)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 504 72 1087 96; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 504 79 540 96; x_wconf 81' lang='eng'>100</span> <span class='ocrx_word' id='word_1_20' title='bbox 591 74 706 96; x_wconf 79' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 712 74 828 91; x_wconf 81' lang='eng' dir='ltr'><em>antibioticus</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 837 74 886 91; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 895 72 955 91; x_wconf 88' lang='eng' dir='ltr'><em>2044T</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 964 74 1087 96; x_wconf 82' lang='eng' dir='ltr'><em>(ABO19582)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 591 112 1014 136; baseline 0 -5"><span class='ocrx_word' id='word_1_25' title='bbox 591 114 707 136; x_wconf 78' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 713 114 784 136; x_wconf 85' lang='eng' dir='ltr'><em>capsici</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 791 112 884 131; x_wconf 72' lang='eng' dir='ltr'><em>YCS194T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 893 114 1014 136; x_wconf 85' lang='eng' dir='ltr'><em>(EF488749)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 524 155 1094 219">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 524 155 1094 219">
+     <span class='ocr_line' id='line_1_12' title="bbox 572 155 1094 179; baseline -0.002 -4"><span class='ocrx_word' id='word_1_29' title='bbox 572 157 583 174; x_wconf 92' lang='eng' dir='ltr'><strong><em>L</em></strong></span> <span class='ocrx_word' id='word_1_30' title='bbox 584 157 688 179; x_wconf 82' lang='eng' dir='ltr'><em>ysobacter</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 694 162 839 179; x_wconf 85' lang='eng' dir='ltr'><em>enzymogenes</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 847 157 897 175; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 906 155 966 175; x_wconf 76' lang='eng' dir='ltr'><em>2043T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 975 157 1082 179; x_wconf 82' lang='eng' dir='ltr'><em>(AJ298291</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1089 157 1094 179; x_wconf 90' lang='eng'><em>)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 524 195 983 219; baseline -0.002 -4"><span class='ocrx_word' id='word_1_36' title='bbox 524 197 535 214; x_wconf 92' lang='eng' dir='ltr'><strong><em>L</em></strong></span> <span class='ocrx_word' id='word_1_37' title='bbox 536 197 640 219; x_wconf 74' lang='eng' dir='ltr'><em>ysobacrer</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 646 197 750 215; x_wconf 83' lang='eng' dir='ltr'><em>niastensis</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 757 195 847 215; x_wconf 89' lang='eng' dir='ltr'><em>GH41-7T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 856 197 983 219; x_wconf 85' lang='eng' dir='ltr'>(DQ462462)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 620 239 1154 263">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 620 239 1154 263">
+     <span class='ocr_line' id='line_1_14' title="bbox 620 239 1154 263; baseline 0 -5"><span class='ocrx_word' id='word_1_41' title='bbox 620 241 631 258; x_wconf 92' lang='eng' dir='ltr'><strong><em>L</em></strong></span> <span class='ocrx_word' id='word_1_42' title='bbox 632 241 736 263; x_wconf 78' lang='eng' dir='ltr'><em>ysobacler</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 742 241 879 263; x_wconf 82' lang='eng' dir='ltr'><em>daejeonensis</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 888 241 937 258; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 947 239 1019 258; x_wconf 73' lang='eng' dir='ltr'><em>17634T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1027 241 1104 263; x_wconf 85' lang='eng' dir='ltr'><em>(DQ191</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1111 241 1154 263; x_wconf 88' lang='eng'>178)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 308 290 423 292">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 308 290 423 292">
+     <span class='ocr_line' id='line_1_15' title="bbox 308 290 423 292; baseline 0 311"><span class='ocrx_word' id='word_1_48' title='bbox 308 290 423 292; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 168 348 274 350">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 168 348 274 350">
+     <span class='ocr_line' id='line_1_16' title="bbox 168 348 274 350; baseline 0 253"><span class='ocrx_word' id='word_1_49' title='bbox 168 348 274 350; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 0 465 171 467">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 0 465 171 467">
+     <span class='ocr_line' id='line_1_17' title="bbox 0 465 171 467; baseline 0 136"><span class='ocrx_word' id='word_1_50' title='bbox 0 465 171 467; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 54 554 95 571">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 54 554 95 571">
+     <span class='ocr_line' id='line_1_18' title="bbox 54 554 95 571; baseline 0 0"><span class='ocrx_word' id='word_1_51' title='bbox 54 554 95 571; x_wconf 90' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 168 348 170 589">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 168 348 170 589">
+     <span class='ocr_line' id='line_1_19' title="bbox 168 348 170 589; baseline 0 14"><span class='ocrx_word' id='word_1_52' title='bbox 168 348 170 589; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 272 236 274 459">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 272 236 274 459">
+     <span class='ocr_line' id='line_1_20' title="bbox 272 236 274 459; baseline 0 144"><span class='ocrx_word' id='word_1_53' title='bbox 272 236 274 459; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 322 422 324 495">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 322 422 324 495">
+     <span class='ocr_line' id='line_1_21' title="bbox 322 422 324 495; baseline 0 108"><span class='ocrx_word' id='word_1_54' title='bbox 322 422 324 495; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 394 298 415 316">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 394 298 415 316">
+     <span class='ocr_line' id='line_1_22' title="bbox 394 298 415 316; baseline 0 0"><span class='ocrx_word' id='word_1_55' title='bbox 394 298 415 316; x_wconf 84' lang='eng'>91</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 421 255 423 328">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 421 255 423 328">
+     <span class='ocr_line' id='line_1_23' title="bbox 421 255 423 328; baseline 0 275"><span class='ocrx_word' id='word_1_56' title='bbox 421 255 423 328; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 485 280 1302 471">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 485 280 1165 355">
+     <span class='ocr_line' id='line_1_24' title="bbox 510 280 1134 328; baseline 0 -29"><span class='ocrx_word' id='word_1_57' title='bbox 510 297 678 328; x_wconf 17' lang='eng' dir='ltr'>ﬂ</span> <span class='ocrx_word' id='word_1_58' title='bbox 686 282 802 305; x_wconf 76' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 807 282 932 299; x_wconf 80' lang='eng' dir='ltr'><em>concretionis</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 940 280 1002 299; x_wconf 78' lang='eng' dir='ltr'><em>K007T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1011 282 1134 305; x_wconf 86' lang='eng' dir='ltr'><em>(AB161359)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 485 321 1165 355; baseline 0 -15"><span class='ocrx_word' id='word_1_62' title='bbox 485 338 509 355; x_wconf 70' lang='eng'><em>95</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 680 323 795 345; x_wconf 83' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 801 323 917 345; x_wconf 73' lang='eng' dir='ltr'><em>spongiicola</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 926 323 977 340; x_wconf 86' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_66' title='bbox 986 321 1033 340; x_wconf 77' lang='eng' dir='ltr'><em>329T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 1042 323 1165 345; x_wconf 79' lang='eng' dir='ltr'><em>(A8299978)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 510 338 1302 429">
+     <span class='ocr_line' id='line_1_26' title="bbox 510 338 1302 388; baseline 0 -5"><span class='ocrx_word' id='word_1_68' title='bbox 510 367 534 384; x_wconf 87' lang='eng'>66</span> <span class='ocrx_word' id='word_1_69' title='bbox 539 338 806 381; x_wconf 63' lang='eng'>;</span> <span class='ocrx_word' id='word_1_70' title='bbox 815 366 931 388; x_wconf 76' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 936 365 1009 383; x_wconf 74' lang='eng' dir='ltr'><em>def/uvii</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1017 366 1082 383; x_wconf 92' lang='eng' dir='ltr'><em>IMMIB</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1090 364 1166 383; x_wconf 73' lang='eng' dir='ltr'><em>APB-9T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 1175 365 1302 388; x_wconf 86' lang='eng' dir='ltr'>(AM283465)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 602 405 1107 429; baseline 0 -4"><span class='ocrx_word' id='word_1_75' title='bbox 602 408 613 425; x_wconf 97' lang='eng' dir='ltr'><strong><em>L</em></strong></span> <span class='ocrx_word' id='word_1_76' title='bbox 614 408 718 429; x_wconf 82' lang='eng' dir='ltr'><em>ysobacter</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 724 408 823 425; x_wconf 82' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 831 407 893 425; x_wconf 86' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 903 405 975 425; x_wconf 90' lang='eng' dir='ltr'><em>12204T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 984 407 1107 429; x_wconf 86' lang='eng' dir='ltr'><em>(AB166878)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 630 447 1083 471">
+     <span class='ocr_line' id='line_1_28' title="bbox 630 447 1083 471; baseline 0 -5"><span class='ocrx_word' id='word_1_81' title='bbox 630 449 746 471; x_wconf 85' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 752 449 850 466; x_wconf 83' lang='eng' dir='ltr'><em>niabensis</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 858 447 948 466; x_wconf 82' lang='eng' dir='ltr'><em>GH34-4T</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 957 449 1083 471; x_wconf 88' lang='eng' dir='ltr'><em>(DQ462461)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 423 327 506 328">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 423 327 506 328">
+     <span class='ocr_line' id='line_1_29' title="bbox 423 327 506 328; baseline 0 275"><span class='ocrx_word' id='word_1_85' title='bbox 423 327 506 328; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 322 493 445 495">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 322 493 445 495">
+     <span class='ocr_line' id='line_1_30' title="bbox 322 493 445 495; baseline 0 108"><span class='ocrx_word' id='word_1_86' title='bbox 322 493 445 495; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 634 489 1212 514">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 634 489 1212 514">
+     <span class='ocr_line' id='line_1_31' title="bbox 634 489 1212 514; baseline 0 -5"><span class='ocrx_word' id='word_1_87' title='bbox 634 492 750 514; x_wconf 81' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 755 492 937 514; x_wconf 84' lang='eng' dir='ltr'><em>yangpyeongensis</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 946 491 994 509; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1005 489 1077 509; x_wconf 79' lang='eng' dir='ltr'><em>17635T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1086 491 1212 514; x_wconf 84' lang='eng' dir='ltr'><em>(DQ191179)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 418 501 997 554">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 418 501 997 554">
+     <span class='ocr_line' id='line_1_32' title="bbox 418 501 626 547; baseline 0 -29"><span class='ocrx_word' id='word_1_92' title='bbox 418 501 440 518; x_wconf 81' lang='eng'>91</span> <span class='ocrx_word' id='word_1_93' title='bbox 505 505 626 547; x_wconf 47' lang='eng' dir='ltr'>i</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 483 530 997 554; baseline 0 -5"><span class='ocrx_word' id='word_1_94' title='bbox 483 532 507 549; x_wconf 83' lang='eng'>89</span> <span class='ocrx_word' id='word_1_95' title='bbox 559 532 685 554; x_wconf 83' lang='eng' dir='ltr'><em>Lysabacter</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 691 537 764 554; x_wconf 87' lang='eng' dir='ltr'><em>oryzae</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 771 530 865 549; x_wconf 75' lang='eng' dir='ltr'><em>YC6269T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 873 532 997 554; x_wconf 80' lang='eng' dir='ltr'><em>(EU376963)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 437 578 962 603">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 437 578 962 603">
+     <span class='ocr_line' id='line_1_34' title="bbox 437 578 962 603; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 437 580 448 597; x_wconf 92' lang='eng' dir='ltr'><strong><em>L</em></strong></span> <span class='ocrx_word' id='word_1_100' title='bbox 449 580 553 603; x_wconf 82' lang='eng' dir='ltr'><em>ysobacter</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 559 580 679 597; x_wconf 81' lang='eng' dir='ltr'><em>brunescens</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 686 580 749 597; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 757 578 831 597; x_wconf 73' lang='eng' dir='ltr'><em>29482T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 839 580 962 603; x_wconf 83' lang='eng' dir='ltr'><em>(AB161360)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 444 464 445 525">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 444 464 445 525">
+     <span class='ocr_line' id='line_1_35' title="bbox 444 464 445 525; baseline 0 78"><span class='ocrx_word' id='word_1_105' title='bbox 444 464 445 525; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000620-0-002.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000620-0-002.pbm.png
new file mode 100644
index 00000000..943ce2ea
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000620-0-002.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000620-0-002.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000620-0-002.pbm.png.hocr
new file mode 100644
index 00000000..0862fbc5
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000620-0-002.pbm.png.hocr
@@ -0,0 +1,133 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000620-0-002.pbm.png"; bbox 0 0 994 517; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 95 6 983 432">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 95 6 773 71">
+     <span class='ocr_line' id='line_1_1' title="bbox 95 6 773 36; baseline 0.001 -11"><span class='ocrx_word' id='word_1_1' title='bbox 95 13 177 36; x_wconf 76' lang='eng'><em>99_—</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 185 6 402 31; x_wconf 85' lang='eng' dir='ltr'><em>Desulfosporosinus</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 411 6 495 26; x_wconf 74' lang='eng' dir='ltr'><em>orientis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 505 6 560 26; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 571 6 627 26; x_wconf 84' lang='eng'><em>7493</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 637 6 773 31; x_wconf 82' lang='eng' dir='ltr'><em>(AJ493052)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 208 44 745 71; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 208 46 426 65; x_wconf 78' lang='eng' dir='ltr'><em>Desu/ﬂtobacterium</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 436 46 532 71; x_wconf 82' lang='eng' dir='ltr'><em>frappien&#39;</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 540 44 627 65; x_wconf 85' lang='eng' dir='ltr'><em>PCP—1T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 637 46 745 71; x_wconf 88' lang='eng' dir='ltr'><em>(U40078)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 204 84 723 111">
+     <span class='ocr_line' id='line_1_3' title="bbox 204 84 723 111; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 204 86 363 105; x_wconf 81' lang='eng' dir='ltr'><em>Dehalobacter</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 369 86 476 105; x_wconf 77' lang='eng' dir='ltr'><em>restrictus</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 486 84 605 105; x_wconf 79' lang='eng' dir='ltr'><em>PER—K23T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 615 86 723 111; x_wconf 83' lang='eng' dir='ltr'><em>(U84497)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 188 124 821 151">
+     <span class='ocr_line' id='line_1_4' title="bbox 188 124 821 151; baseline -0.002 -5"><span class='ocrx_word' id='word_1_15' title='bbox 188 126 406 146; x_wconf 83' lang='eng' dir='ltr'><em>Desulfotomaculum</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 415 126 534 151; x_wconf 81' lang='eng' dir='ltr'><em>nigriﬁcans</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 543 126 626 146; x_wconf 90' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 635 124 704 146; x_wconf 78' lang='eng' dir='ltr'><em>8395T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 713 126 821 151; x_wconf 84' lang='eng' dir='ltr'><em>(X62176)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 260 164 753 191">
+     <span class='ocr_line' id='line_1_5' title="bbox 260 164 753 191; baseline -0.002 -5"><span class='ocrx_word' id='word_1_20' title='bbox 260 166 410 191; x_wconf 82' lang='eng' dir='ltr'><em>Peptococcus</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 419 166 480 191; x_wconf 89' lang='eng' dir='ltr'><em>niger</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 487 166 542 186; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 552 164 636 186; x_wconf 89' lang='eng' dir='ltr'><em>20475T</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 646 166 753 191; x_wconf 86' lang='eng' dir='ltr'><em>(X55797)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 192 204 792 231">
+     <span class='ocr_line' id='line_1_6' title="bbox 192 204 792 231; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 192 206 372 231; x_wconf 81' lang='eng' dir='ltr'><em>Carboxydocella</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 382 206 594 231; x_wconf 78' lang='eng' dir='ltr'><em>the/mautotrophica</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 603 204 643 225; x_wconf 75' lang='eng' dir='ltr'><em>4‘1T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 652 206 792 231; x_wconf 86' lang='eng' dir='ltr'><em>(AYO61974)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 158 244 704 271">
+     <span class='ocr_line' id='line_1_7' title="bbox 158 244 704 271; baseline 0 -6"><span class='ocrx_word' id='word_1_29' title='bbox 158 246 300 265; x_wconf 83' lang='eng' dir='ltr'><em>Thermincola</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 310 246 477 271; x_wconf 81' lang='eng' dir='ltr'><em>carboxydiphi/a</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 487 244 556 265; x_wconf 89' lang='eng' dir='ltr'><em>2204T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 565 246 704 271; x_wconf 83' lang='eng' dir='ltr'><em>(AY603000)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 210 284 507 311">
+     <span class='ocr_line' id='line_1_8' title="bbox 210 284 507 311; baseline 0 -5"><span class='ocrx_word' id='word_1_33' title='bbox 210 286 283 306; x_wconf 84' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 294 284 507 311; x_wconf 80' lang='eng' dir='ltr'><em>1315T(EF542810)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 232 324 876 351">
+     <span class='ocr_line' id='line_1_9' title="bbox 232 324 876 351; baseline 0 -5"><span class='ocrx_word' id='word_1_35' title='bbox 232 327 455 351; x_wconf 84' lang='eng' dir='ltr'><em>Carboxydothermus</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 463 327 617 346; x_wconf 83' lang='eng' dir='ltr'><em>ferrireducens</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 626 324 759 346; x_wconf 76' lang='eng' dir='ltr'><em>.JW/AS—Y7T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 768 327 876 351; x_wconf 82' lang='eng' dir='ltr'><em>(U76363)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 206 364 983 391">
+     <span class='ocr_line' id='line_1_10' title="bbox 206 364 983 391; baseline 0 -5"><span class='ocrx_word' id='word_1_39' title='bbox 206 366 429 391; x_wconf 78' lang='eng' dir='ltr'><em>Carboxydothermus</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 437 366 658 391; x_wconf 79' lang='eng' dir='ltr'><em>hydrogenofonnans</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 666 364 761 386; x_wconf 79' lang='eng' dir='ltr'><em>2-2901T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 770 367 816 386; x_wconf 86' lang='eng' dir='ltr'><em>rrsA</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 827 366 983 391; x_wconf 34' lang='eng' dir='ltr'><em>(NC7007503)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 170 404 983 432">
+     <span class='ocr_line' id='line_1_11' title="bbox 170 404 983 432; baseline 0 -6"><span class='ocrx_word' id='word_1_44' title='bbox 170 417 190 432; x_wconf 70' lang='eng'><em>95</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 206 406 429 431; x_wconf 85' lang='eng' dir='ltr'><em>Carboxydothermus</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 437 406 658 431; x_wconf 76' lang='eng' dir='ltr'><em>hydrogenofonnans</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 666 404 761 426; x_wconf 77' lang='eng' dir='ltr'><em>2-2901T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 770 407 817 426; x_wconf 89' lang='eng' dir='ltr'><em>rrsB</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 827 406 983 431; x_wconf 34' lang='eng' dir='ltr'><em>(NC7007503)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 122 13 124 55">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 122 13 124 55">
+     <span class='ocr_line' id='line_1_12' title="bbox 122 13 124 55; baseline 0 462"><span class='ocrx_word' id='word_1_50' title='bbox 122 13 124 55; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 124 53 200 55">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 124 53 200 55">
+     <span class='ocr_line' id='line_1_13' title="bbox 124 53 200 55; baseline 0 462"><span class='ocrx_word' id='word_1_51' title='bbox 124 53 200 55; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 43 64 104 66">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 43 64 104 66">
+     <span class='ocr_line' id='line_1_14' title="bbox 43 64 104 66; baseline 0 451"><span class='ocrx_word' id='word_1_52' title='bbox 43 64 104 66; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 102 34 104 96">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 102 34 104 96">
+     <span class='ocr_line' id='line_1_15' title="bbox 102 34 104 96; baseline 0 421"><span class='ocrx_word' id='word_1_53' title='bbox 102 34 104 96; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 104 94 196 96">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 104 94 196 96">
+     <span class='ocr_line' id='line_1_16' title="bbox 104 94 196 96; baseline 0 421"><span class='ocrx_word' id='word_1_54' title='bbox 104 94 196 96; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 43 64 45 136">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 43 64 45 136">
+     <span class='ocr_line' id='line_1_17' title="bbox 43 64 45 136; baseline 0 381"><span class='ocrx_word' id='word_1_55' title='bbox 43 64 45 136; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 1 143 256 390">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 1 143 256 390">
+     <span class='ocr_line' id='line_1_18' title="bbox 28 143 188 164; baseline 0 353"><span class='ocrx_word' id='word_1_56' title='bbox 28 143 188 164; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 1 164 256 244; baseline 0 0"><span class='ocrx_word' id='word_1_57' title='bbox 1 164 256 244; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 1 244 158 284; baseline 0 233"><span class='ocrx_word' id='word_1_58' title='bbox 1 244 158 284; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 1 284 227 351; baseline 0 0"><span class='ocrx_word' id='word_1_59' title='bbox 1 284 227 351; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 13 351 206 390; baseline 0 127"><span class='ocrx_word' id='word_1_60' title='bbox 13 351 206 390; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 62 432 986 471">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 62 432 986 471">
+     <span class='ocr_line' id='line_1_23' title="bbox 82 432 119 446; baseline 0 0"><span class='ocrx_word' id='word_1_61' title='bbox 82 432 119 446; x_wconf 88' lang='eng'><em>0.05</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 62 445 986 471; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 62 447 140 460; x_wconf 64' lang='eng'><em>|—‘</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 174 452 194 467; x_wconf 81' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 208 447 430 471; x_wconf 79' lang='eng' dir='ltr'><em>Carboxydothermus</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 439 447 659 471; x_wconf 82' lang='eng' dir='ltr'><em>hydrogenoformans</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 668 445 763 466; x_wconf 82' lang='eng' dir='ltr'><em>2-2901T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 771 447 821 466; x_wconf 89' lang='eng' dir='ltr'><em>rrsC</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 830 447 986 471; x_wconf 34' lang='eng' dir='ltr'><em>(NC7007503)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 174 482 990 511">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 174 482 990 511">
+     <span class='ocr_line' id='line_1_25' title="bbox 174 482 990 511; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 174 482 194 496; x_wconf 75' lang='eng'>70</span> <span class='ocrx_word' id='word_1_70' title='bbox 212 487 434 511; x_wconf 79' lang='eng' dir='ltr'><em>Carboxydothermus</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 443 487 664 511; x_wconf 85' lang='eng' dir='ltr'><em>hydrogenoformans</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 672 485 767 506; x_wconf 75' lang='eng' dir='ltr'><em>Z—290‘1T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 776 487 825 506; x_wconf 87' lang='eng' dir='ltr'><em>rrsD</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 834 487 990 511; x_wconf 35' lang='eng' dir='ltr'><em>(N07007503)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000695-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000695-0-000.pbm.png
new file mode 100644
index 00000000..4c158a5e
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000695-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000695-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000695-0-000.pbm.png.hocr
new file mode 100644
index 00000000..34af0f7d
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000695-0-000.pbm.png.hocr
@@ -0,0 +1,362 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000695-0-000.pbm.png"; bbox 0 0 1302 869; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 39 5 1300 732">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 39 5 1300 732">
+     <span class='ocr_line' id='line_1_1' title="bbox 370 5 1042 32; baseline 0.003 -9"><span class='ocrx_word' id='word_1_1' title='bbox 370 7 448 32; x_wconf 89' lang='eng'>52_—</span> <span class='ocrx_word' id='word_1_2' title='bbox 456 6 600 25; x_wconf 86' lang='eng' dir='ltr'>Micrococcus</span> <span class='ocrx_word' id='word_1_3' title='bbox 609 6 678 25; x_wconf 80' lang='eng' dir='ltr'>luteus</span> <span class='ocrx_word' id='word_1_4' title='bbox 687 6 774 25; x_wconf 83' lang='eng' dir='ltr'>Ballarat</span> <span class='ocrx_word' id='word_1_5' title='bbox 783 5 862 30; x_wconf 84' lang='eng' dir='ltr'>(biovar</span> <span class='ocrx_word' id='word_1_6' title='bbox 872 5 899 30; x_wconf 93' lang='eng' dir='ltr'>Ill)</span> <span class='ocrx_word' id='word_1_7' title='bbox 909 5 1042 30; x_wconf 82' lang='eng' dir='ltr'>(AJ409096)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 360 32 961 63; baseline 0 -5"><span class='ocrx_word' id='word_1_8' title='bbox 360 32 384 49; x_wconf 73' lang='eng'>63</span> <span class='ocrx_word' id='word_1_9' title='bbox 400 47 511 49; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_10' title='bbox 518 39 663 58; x_wconf 83' lang='eng' dir='ltr'>Micrococcus</span> <span class='ocrx_word' id='word_1_11' title='bbox 671 39 739 58; x_wconf 87' lang='eng' dir='ltr'><em>ﬂavus</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 748 38 810 58; x_wconf 74' lang='eng' dir='ltr'>LW4T</span> <span class='ocrx_word' id='word_1_13' title='bbox 819 39 961 63; x_wconf 82' lang='eng' dir='ltr'>(DQ491453)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 336 64 947 97; baseline 0.002 -6"><span class='ocrx_word' id='word_1_14' title='bbox 336 64 359 80; x_wconf 74' lang='eng'>99</span> <span class='ocrx_word' id='word_1_15' title='bbox 478 72 622 92; x_wconf 86' lang='eng' dir='ltr'>Micrococcus</span> <span class='ocrx_word' id='word_1_16' title='bbox 631 72 757 92; x_wconf 84' lang='eng' dir='ltr'>antarcticus</span> <span class='ocrx_word' id='word_1_17' title='bbox 765 72 805 91; x_wconf 90' lang='eng' dir='ltr'>T2T</span> <span class='ocrx_word' id='word_1_18' title='bbox 814 72 947 97; x_wconf 86' lang='eng' dir='ltr'>(AJ005932)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 257 103 973 130; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 257 103 280 120; x_wconf 75' lang='eng'>62</span> <span class='ocrx_word' id='word_1_20' title='bbox 367 113 487 116; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_21' title='bbox 496 106 640 125; x_wconf 84' lang='eng' dir='ltr'>Micrococcus</span> <span class='ocrx_word' id='word_1_22' title='bbox 648 106 701 130; x_wconf 86' lang='eng' dir='ltr'>Iy/ae</span> <span class='ocrx_word' id='word_1_23' title='bbox 711 105 766 125; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_24' title='bbox 776 105 858 125; x_wconf 82' lang='eng' dir='ltr'>20315T</span> <span class='ocrx_word' id='word_1_25' title='bbox 867 105 973 130; x_wconf 86' lang='eng' dir='ltr'>(X80750)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 430 138 1027 164; baseline 0 -6"><span class='ocrx_word' id='word_1_26' title='bbox 430 139 575 158; x_wconf 80' lang='eng' dir='ltr'>-Ci(ricoccus</span> <span class='ocrx_word' id='word_1_27' title='bbox 583 139 736 158; x_wconf 79' lang='eng' dir='ltr'>alkalito/erans</span> <span class='ocrx_word' id='word_1_28' title='bbox 743 139 788 158; x_wconf 94' lang='eng' dir='ltr'>YIM</span> <span class='ocrx_word' id='word_1_29' title='bbox 798 138 880 158; x_wconf 84' lang='eng' dir='ltr'>70010T</span> <span class='ocrx_word' id='word_1_30' title='bbox 890 139 1027 164; x_wconf 84' lang='eng' dir='ltr'>(AY376164)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 241 164 895 197; baseline -0.002 -5"><span class='ocrx_word' id='word_1_31' title='bbox 241 164 264 180; x_wconf 70' lang='eng'>52</span> <span class='ocrx_word' id='word_1_32' title='bbox 385 169 419 185; x_wconf 77' lang='eng'>100</span> <span class='ocrx_word' id='word_1_33' title='bbox 430 180 470 182; x_wconf 98' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_34' title='bbox 479 172 605 192; x_wconf 83' lang='eng' dir='ltr'>Citricoccus</span> <span class='ocrx_word' id='word_1_35' title='bbox 613 172 697 192; x_wconf 80' lang='eng' dir='ltr'>mural/s</span> <span class='ocrx_word' id='word_1_36' title='bbox 705 172 753 192; x_wconf 80' lang='eng' dir='ltr'>4-0T</span> <span class='ocrx_word' id='word_1_37' title='bbox 762 172 895 197; x_wconf 84' lang='eng' dir='ltr'>(AJ344143)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 494 205 1102 230; baseline 0 -5"><span class='ocrx_word' id='word_1_38' title='bbox 494 206 655 230; x_wconf 84' lang='eng' dir='ltr'>Zhihengliuella</span> <span class='ocrx_word' id='word_1_39' title='bbox 664 206 806 225; x_wconf 86' lang='eng' dir='ltr'>ha/oto/erans</span> <span class='ocrx_word' id='word_1_40' title='bbox 814 206 858 225; x_wconf 94' lang='eng' dir='ltr'>YIM</span> <span class='ocrx_word' id='word_1_41' title='bbox 869 205 951 225; x_wconf 88' lang='eng' dir='ltr'>70185T</span> <span class='ocrx_word' id='word_1_42' title='bbox 960 205 1102 230; x_wconf 84' lang='eng' dir='ltr'>(DQ372937)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 261 238 1072 267; baseline 0 -8"><span class='ocrx_word' id='word_1_43' title='bbox 261 250 282 267; x_wconf 70' lang='eng'><strong>61</strong></span> <span class='ocrx_word' id='word_1_44' title='bbox 543 239 690 259; x_wconf 72' lang='eng' dir='ltr'>Anhrobacter</span> <span class='ocrx_word' id='word_1_45' title='bbox 696 239 801 259; x_wconf 86' lang='eng' dir='ltr'>sulfureus</span> <span class='ocrx_word' id='word_1_46' title='bbox 811 239 865 259; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_47' title='bbox 875 238 958 259; x_wconf 86' lang='eng' dir='ltr'>20167T</span> <span class='ocrx_word' id='word_1_48' title='bbox 967 239 1072 264; x_wconf 83' lang='eng' dir='ltr'>(X83409)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 484 272 1077 297; baseline 0 -5"><span class='ocrx_word' id='word_1_49' title='bbox 484 273 631 292; x_wconf 73' lang='eng' dir='ltr'>Arthrobacter</span> <span class='ocrx_word' id='word_1_50' title='bbox 636 273 805 297; x_wconf 83' lang='eng' dir='ltr'>protophormiae</span> <span class='ocrx_word' id='word_1_51' title='bbox 815 272 870 292; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_52' title='bbox 880 272 962 292; x_wconf 78' lang='eng' dir='ltr'>20168T</span> <span class='ocrx_word' id='word_1_53' title='bbox 971 272 1077 297; x_wconf 89' lang='eng' dir='ltr'>(X80745)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 205 306 1016 331; baseline 0 -5"><span class='ocrx_word' id='word_1_54' title='bbox 205 310 240 312; x_wconf 84' lang='eng'>—</span> <span class='ocrx_word' id='word_1_55' title='bbox 351 313 374 330; x_wconf 76' lang='eng'>67</span> <span class='ocrx_word' id='word_1_56' title='bbox 408 307 620 326; x_wconf 70' lang='eng' dir='ltr'>—Ar1hrobacter</span> <span class='ocrx_word' id='word_1_57' title='bbox 626 307 745 326; x_wconf 82' lang='eng' dir='ltr'>nicotianae</span> <span class='ocrx_word' id='word_1_58' title='bbox 755 306 809 326; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_59' title='bbox 819 306 902 326; x_wconf 87' lang='eng' dir='ltr'>20123T</span> <span class='ocrx_word' id='word_1_60' title='bbox 911 306 1016 331; x_wconf 81' lang='eng' dir='ltr'>(X80739)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 70 336 1109 374; baseline 0 -15"><span class='ocrx_word' id='word_1_61' title='bbox 70 357 109 374; x_wconf 36' lang='eng'>0-01</span> <span class='ocrx_word' id='word_1_62' title='bbox 375 336 398 353; x_wconf 75' lang='eng'>78</span> <span class='ocrx_word' id='word_1_63' title='bbox 408 340 689 359; x_wconf 72' lang='eng' dir='ltr'>—Arthrobacter</span> <span class='ocrx_word' id='word_1_64' title='bbox 696 340 837 364; x_wconf 76' lang='eng' dir='ltr'>uratoxydans</span> <span class='ocrx_word' id='word_1_65' title='bbox 847 340 901 359; x_wconf 85' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_66' title='bbox 911 339 994 359; x_wconf 83' lang='eng' dir='ltr'>20647T</span> <span class='ocrx_word' id='word_1_67' title='bbox 1003 340 1109 364; x_wconf 80' lang='eng' dir='ltr'>(X83410)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 39 372 1173 398; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 39 376 143 391; x_wconf 70' lang='eng'>1—1</span> <span class='ocrx_word' id='word_1_69' title='bbox 281 377 304 394; x_wconf 77' lang='eng'>34</span> <span class='ocrx_word' id='word_1_70' title='bbox 314 373 743 393; x_wconf 83' lang='eng' dir='ltr'>—Acaricomes</span> <span class='ocrx_word' id='word_1_71' title='bbox 750 373 876 398; x_wconf 81' lang='eng' dir='ltr'>phytoseiuli</span> <span class='ocrx_word' id='word_1_72' title='bbox 884 373 938 393; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_73' title='bbox 951 372 1031 392; x_wconf 92' lang='eng' dir='ltr'>14247T</span> <span class='ocrx_word' id='word_1_74' title='bbox 1040 373 1173 398; x_wconf 85' lang='eng' dir='ltr'>(AJ812213)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 314 406 1300 431; baseline 0 -5"><span class='ocrx_word' id='word_1_75' title='bbox 314 415 669 417; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_76' title='bbox 676 407 843 426; x_wconf 67' lang='eng' dir='ltr'>Hen/&quot;bacterium</span> <span class='ocrx_word' id='word_1_77' title='bbox 852 407 1016 426; x_wconf 82' lang='eng' dir='ltr'>salmoninarum</span> <span class='ocrx_word' id='word_1_78' title='bbox 1024 406 1094 426; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_79' title='bbox 1104 406 1186 426; x_wconf 80' lang='eng' dir='ltr'>33209T</span> <span class='ocrx_word' id='word_1_80' title='bbox 1195 406 1300 431; x_wconf 87' lang='eng' dir='ltr'>(X51601)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 357 439 961 465; baseline 0.002 -6"><span class='ocrx_word' id='word_1_81' title='bbox 357 440 587 460; x_wconf 80' lang='eng' dir='ltr'>—Arthrobacter</span> <span class='ocrx_word' id='word_1_82' title='bbox 593 440 690 465; x_wconf 87' lang='eng' dir='ltr'>oxydans</span> <span class='ocrx_word' id='word_1_83' title='bbox 699 440 754 460; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_84' title='bbox 764 440 802 460; x_wconf 90' lang='eng'>201</span> <span class='ocrx_word' id='word_1_85' title='bbox 810 439 846 460; x_wconf 79' lang='eng' dir='ltr'>19T</span> <span class='ocrx_word' id='word_1_86' title='bbox 855 440 961 465; x_wconf 83' lang='eng' dir='ltr'>(X83408)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 323 473 1008 498; baseline -0.003 -3"><span class='ocrx_word' id='word_1_87' title='bbox 323 478 346 495; x_wconf 83' lang='eng'>99</span> <span class='ocrx_word' id='word_1_88' title='bbox 422 474 682 493; x_wconf 82' lang='eng' dir='ltr'>—Arthrobacter</span> <span class='ocrx_word' id='word_1_89' title='bbox 688 474 737 493; x_wconf 86' lang='eng' dir='ltr'><em>ilicis</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 746 473 801 493; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_91' title='bbox 811 473 893 493; x_wconf 78' lang='eng' dir='ltr'>20138T</span> <span class='ocrx_word' id='word_1_92' title='bbox 902 473 1008 498; x_wconf 86' lang='eng' dir='ltr'>(X83407)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 388 503 1025 531; baseline 0 -5"><span class='ocrx_word' id='word_1_93' title='bbox 388 503 412 520; x_wconf 75' lang='eng'>98</span> <span class='ocrx_word' id='word_1_94' title='bbox 422 507 608 526; x_wconf 75' lang='eng' dir='ltr'>—Arthrobacter</span> <span class='ocrx_word' id='word_1_95' title='bbox 614 507 783 526; x_wconf 79' lang='eng' dir='ltr'>nicotinovorans</span> <span class='ocrx_word' id='word_1_96' title='bbox 792 507 847 526; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_97' title='bbox 856 506 910 526; x_wconf 90' lang='eng' dir='ltr'>420T</span> <span class='ocrx_word' id='word_1_98' title='bbox 919 507 1025 531; x_wconf 86' lang='eng' dir='ltr'>(X80743)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 465 540 967 565; baseline 0.002 -6"><span class='ocrx_word' id='word_1_99' title='bbox 465 548 493 550; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_100' title='bbox 499 540 639 560; x_wconf 89' lang='eng' dir='ltr'>Sinomonas</span> <span class='ocrx_word' id='word_1_101' title='bbox 648 540 706 560; x_wconf 87' lang='eng' dir='ltr'>flava</span> <span class='ocrx_word' id='word_1_102' title='bbox 715 540 757 560; x_wconf 92' lang='eng' dir='ltr'><strong>CW</strong></span> <span class='ocrx_word' id='word_1_103' title='bbox 767 540 819 560; x_wconf 84' lang='eng' dir='ltr'>108T</span> <span class='ocrx_word' id='word_1_104' title='bbox 828 540 967 565; x_wconf 90' lang='eng' dir='ltr'>(EU370704)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 421 572 1089 598; baseline 0 -5"><span class='ocrx_word' id='word_1_105' title='bbox 421 572 456 588; x_wconf 77' lang='eng'>100</span> <span class='ocrx_word' id='word_1_106' title='bbox 465 582 492 583; x_wconf 39' lang='eng'><em>*</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 499 573 638 593; x_wconf 84' lang='eng' dir='ltr'>Sinomonas</span> <span class='ocrx_word' id='word_1_108' title='bbox 647 575 784 598; x_wconf 84' lang='eng' dir='ltr'>atrocyanea</span> <span class='ocrx_word' id='word_1_109' title='bbox 794 573 849 593; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_110' title='bbox 858 573 941 593; x_wconf 90' lang='eng' dir='ltr'>20127T</span> <span class='ocrx_word' id='word_1_111' title='bbox 950 573 1089 598; x_wconf 85' lang='eng' dir='ltr'>(EU697388)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 336 607 844 632; baseline -0.004 -4"><span class='ocrx_word' id='word_1_112' title='bbox 336 611 370 628; x_wconf 88' lang='eng'>100</span> <span class='ocrx_word' id='word_1_113' title='bbox 380 615 405 617; x_wconf 25' lang='eng'><strong>#</strong></span> <span class='ocrx_word' id='word_1_114' title='bbox 412 608 499 627; x_wconf 82' lang='eng' dir='ltr'>Kocuria</span> <span class='ocrx_word' id='word_1_115' title='bbox 508 612 572 627; x_wconf 87' lang='eng' dir='ltr'><em>rosea</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 582 607 637 627; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_117' title='bbox 647 607 730 627; x_wconf 79' lang='eng' dir='ltr'>20447T</span> <span class='ocrx_word' id='word_1_118' title='bbox 739 607 844 632; x_wconf 82' lang='eng' dir='ltr'>(X87756)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 156 636 865 666; baseline 0.001 -6"><span class='ocrx_word' id='word_1_119' title='bbox 156 636 180 652; x_wconf 85' lang='eng'>75</span> <span class='ocrx_word' id='word_1_120' title='bbox 380 641 502 661; x_wconf 84' lang='eng' dir='ltr'>—Kocuria</span> <span class='ocrx_word' id='word_1_121' title='bbox 510 641 587 665; x_wconf 88' lang='eng' dir='ltr'>polaris</span> <span class='ocrx_word' id='word_1_122' title='bbox 596 641 652 661; x_wconf 86' lang='eng' dir='ltr'>CMS</span> <span class='ocrx_word' id='word_1_123' title='bbox 662 640 723 661; x_wconf 85' lang='eng' dir='ltr'>760rT</span> <span class='ocrx_word' id='word_1_124' title='bbox 732 641 865 666; x_wconf 84' lang='eng' dir='ltr'>(AJ278868)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 260 672 973 699; baseline 0 -6"><span class='ocrx_word' id='word_1_125' title='bbox 260 672 283 689; x_wconf 83' lang='eng'>99</span> <span class='ocrx_word' id='word_1_126' title='bbox 336 675 581 694; x_wconf 73' lang='eng' dir='ltr'>—Kocuria</span> <span class='ocrx_word' id='word_1_127' title='bbox 590 675 701 699; x_wconf 88' lang='eng' dir='ltr'>rhizophi/a</span> <span class='ocrx_word' id='word_1_128' title='bbox 711 674 765 694; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_129' title='bbox 777 674 858 694; x_wconf 75' lang='eng' dir='ltr'>11926T</span> <span class='ocrx_word' id='word_1_130' title='bbox 867 674 973 699; x_wconf 88' lang='eng' dir='ltr'>(Y16264)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 300 706 899 732; baseline 0 -5"><span class='ocrx_word' id='word_1_131' title='bbox 300 706 320 723; x_wconf 77' lang='eng'>91</span> <span class='ocrx_word' id='word_1_132' title='bbox 435 708 522 727; x_wconf 86' lang='eng' dir='ltr'>Kocuria</span> <span class='ocrx_word' id='word_1_133' title='bbox 530 708 628 732; x_wconf 81' lang='eng' dir='ltr'>palustris</span> <span class='ocrx_word' id='word_1_134' title='bbox 637 708 692 727; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_135' title='bbox 704 707 784 727; x_wconf 80' lang='eng' dir='ltr'>11925T</span> <span class='ocrx_word' id='word_1_136' title='bbox 793 708 899 732; x_wconf 87' lang='eng' dir='ltr'>(Y16263)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 398 13 400 49">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 398 13 400 49">
+     <span class='ocr_line' id='line_1_23' title="bbox 398 13 400 49; baseline 0 820"><span class='ocrx_word' id='word_1_137' title='bbox 398 13 400 49; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 367 55 389 57">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 367 55 389 57">
+     <span class='ocr_line' id='line_1_24' title="bbox 367 55 389 57; baseline 0 812"><span class='ocrx_word' id='word_1_138' title='bbox 367 55 389 57; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 387 30 389 82">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 387 30 389 82">
+     <span class='ocr_line' id='line_1_25' title="bbox 387 30 389 82; baseline 0 787"><span class='ocrx_word' id='word_1_139' title='bbox 387 30 389 82; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 389 80 473 82">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 389 80 473 82">
+     <span class='ocr_line' id='line_1_26' title="bbox 389 80 473 82; baseline 0 787"><span class='ocrx_word' id='word_1_140' title='bbox 389 80 473 82; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 284 84 369 86">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 284 84 369 86">
+     <span class='ocr_line' id='line_1_27' title="bbox 284 84 369 86; baseline 0 783"><span class='ocrx_word' id='word_1_141' title='bbox 284 84 369 86; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 367 55 369 113">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 367 55 369 113">
+     <span class='ocr_line' id='line_1_28' title="bbox 367 55 369 113; baseline 0 756"><span class='ocrx_word' id='word_1_142' title='bbox 367 55 369 113; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 268 124 286 126">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 268 124 286 126">
+     <span class='ocr_line' id='line_1_29' title="bbox 268 124 286 126; baseline 0 743"><span class='ocrx_word' id='word_1_143' title='bbox 268 124 286 126; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 284 84 286 165">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 284 84 286 165">
+     <span class='ocr_line' id='line_1_30' title="bbox 284 84 286 165; baseline 0 704"><span class='ocrx_word' id='word_1_144' title='bbox 284 84 286 165; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 284 164 430 165">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 284 164 430 165">
+     <span class='ocr_line' id='line_1_31' title="bbox 284 164 430 165; baseline 0 704"><span class='ocrx_word' id='word_1_145' title='bbox 284 164 430 165; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 428 147 430 182">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 428 147 430 182">
+     <span class='ocr_line' id='line_1_32' title="bbox 428 147 430 182; baseline 0 687"><span class='ocrx_word' id='word_1_146' title='bbox 428 147 430 182; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 241 184 269 186">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 241 184 269 186">
+     <span class='ocr_line' id='line_1_33' title="bbox 241 184 269 186; baseline 0 683"><span class='ocrx_word' id='word_1_147' title='bbox 241 184 269 186; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 268 124 269 247">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 268 124 269 247">
+     <span class='ocr_line' id='line_1_34' title="bbox 268 124 269 247; baseline 0 622"><span class='ocrx_word' id='word_1_148' title='bbox 268 124 269 247; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 267 245 538 247">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 267 245 538 247">
+     <span class='ocr_line' id='line_1_35' title="bbox 267 245 538 247; baseline 0 622"><span class='ocrx_word' id='word_1_149' title='bbox 267 245 538 247; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 288 214 290 278">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 288 214 290 278">
+     <span class='ocr_line' id='line_1_36' title="bbox 288 214 290 278; baseline 0 591"><span class='ocrx_word' id='word_1_150' title='bbox 288 214 290 278; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 290 276 361 278">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 290 276 361 278">
+     <span class='ocr_line' id='line_1_37' title="bbox 290 276 361 278; baseline 0 591"><span class='ocrx_word' id='word_1_151' title='bbox 290 276 361 278; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 382 281 480 282">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 382 281 480 282">
+     <span class='ocr_line' id='line_1_38' title="bbox 382 281 480 282; baseline 0 587"><span class='ocrx_word' id='word_1_152' title='bbox 382 281 480 282; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 362 247 364 308">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 362 247 364 308">
+     <span class='ocr_line' id='line_1_39' title="bbox 362 247 364 308; baseline 0 561"><span class='ocrx_word' id='word_1_153' title='bbox 362 247 364 308; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 362 306 382 308">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 362 306 382 308">
+     <span class='ocr_line' id='line_1_40' title="bbox 362 306 382 308; baseline 0 561"><span class='ocrx_word' id='word_1_154' title='bbox 362 306 382 308; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 380 281 382 333">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 380 281 382 333">
+     <span class='ocr_line' id='line_1_41' title="bbox 380 281 382 333; baseline 0 536"><span class='ocrx_word' id='word_1_155' title='bbox 380 281 382 333; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 380 331 408 333">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 380 331 408 333">
+     <span class='ocr_line' id='line_1_42' title="bbox 380 331 408 333; baseline 0 536"><span class='ocrx_word' id='word_1_156' title='bbox 380 331 408 333; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 406 314 408 350">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 406 314 408 350">
+     <span class='ocr_line' id='line_1_43' title="bbox 406 314 408 350; baseline 0 519"><span class='ocrx_word' id='word_1_157' title='bbox 406 314 408 350; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 255 398 314 400">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 255 398 314 400">
+     <span class='ocr_line' id='line_1_44' title="bbox 255 398 314 400; baseline 0 469"><span class='ocrx_word' id='word_1_158' title='bbox 255 398 314 400; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 241 184 243 437">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 241 184 243 437">
+     <span class='ocr_line' id='line_1_45' title="bbox 241 184 243 437; baseline 0 432"><span class='ocrx_word' id='word_1_159' title='bbox 241 184 243 437; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 312 381 314 417">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 312 381 314 417">
+     <span class='ocr_line' id='line_1_46' title="bbox 312 381 314 417; baseline 0 452"><span class='ocrx_word' id='word_1_160' title='bbox 312 381 314 417; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 240 435 257 437">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 240 435 257 437">
+     <span class='ocr_line' id='line_1_47' title="bbox 240 435 257 437; baseline 0 432"><span class='ocrx_word' id='word_1_161' title='bbox 240 435 257 437; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 255 398 257 475">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 255 398 257 475">
+     <span class='ocr_line' id='line_1_48' title="bbox 255 398 257 475; baseline 0 394"><span class='ocrx_word' id='word_1_162' title='bbox 255 398 257 475; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 255 473 357 475">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 255 473 357 475">
+     <span class='ocr_line' id='line_1_49' title="bbox 255 473 357 475; baseline 0 394"><span class='ocrx_word' id='word_1_163' title='bbox 255 473 357 475; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 355 448 357 500">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 355 448 357 500">
+     <span class='ocr_line' id='line_1_50' title="bbox 355 448 357 500; baseline 0 369"><span class='ocrx_word' id='word_1_164' title='bbox 355 448 357 500; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 355 498 422 500">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 355 498 422 500">
+     <span class='ocr_line' id='line_1_51' title="bbox 355 498 422 500; baseline 0 369"><span class='ocrx_word' id='word_1_165' title='bbox 355 498 422 500; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 420 481 422 517">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 420 481 422 517">
+     <span class='ocr_line' id='line_1_52' title="bbox 420 481 422 517; baseline 0 352"><span class='ocrx_word' id='word_1_166' title='bbox 420 481 422 517; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 203 310 205 567">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 203 310 205 567">
+     <span class='ocr_line' id='line_1_53' title="bbox 203 310 205 567; baseline 0 302"><span class='ocrx_word' id='word_1_167' title='bbox 203 310 205 567; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 203 565 465 567">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 203 565 465 567">
+     <span class='ocr_line' id='line_1_54' title="bbox 203 565 465 567; baseline 0 302"><span class='ocrx_word' id='word_1_168' title='bbox 203 565 465 567; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 463 548 465 583">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 463 548 465 583">
+     <span class='ocr_line' id='line_1_55' title="bbox 463 548 465 583; baseline 0 286"><span class='ocrx_word' id='word_1_169' title='bbox 463 548 465 583; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 294 632 380 634">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 294 632 380 634">
+     <span class='ocr_line' id='line_1_56' title="bbox 294 632 380 634; baseline 0 235"><span class='ocrx_word' id='word_1_170' title='bbox 294 632 380 634; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 378 615 380 651">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 378 615 380 651">
+     <span class='ocr_line' id='line_1_57' title="bbox 378 615 380 651; baseline 0 218"><span class='ocrx_word' id='word_1_171' title='bbox 378 615 380 651; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 128 659 188 661">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 128 659 188 661">
+     <span class='ocr_line' id='line_1_58' title="bbox 128 659 188 661; baseline 0 208"><span class='ocrx_word' id='word_1_172' title='bbox 128 659 188 661; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 294 632 296 700">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 294 632 296 700">
+     <span class='ocr_line' id='line_1_59' title="bbox 294 632 296 700; baseline 0 169"><span class='ocrx_word' id='word_1_173' title='bbox 294 632 296 700; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 294 699 336 701">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 294 699 336 701">
+     <span class='ocr_line' id='line_1_60' title="bbox 294 699 336 701; baseline 0 168"><span class='ocrx_word' id='word_1_174' title='bbox 294 699 336 701; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 334 683 336 718">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 334 683 336 718">
+     <span class='ocr_line' id='line_1_61' title="bbox 334 683 336 718; baseline 0 151"><span class='ocrx_word' id='word_1_175' title='bbox 334 683 336 718; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 336 716 430 718">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 336 716 430 718">
+     <span class='ocr_line' id='line_1_62' title="bbox 336 716 430 718; baseline 0 151"><span class='ocrx_word' id='word_1_176' title='bbox 336 716 430 718; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 0 737 130 739">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 0 737 130 739">
+     <span class='ocr_line' id='line_1_63' title="bbox 0 737 130 739; baseline 0 130"><span class='ocrx_word' id='word_1_177' title='bbox 0 737 130 739; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 0 737 2 851">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 0 737 2 851">
+     <span class='ocr_line' id='line_1_64' title="bbox 0 737 2 851; baseline 0 18"><span class='ocrx_word' id='word_1_178' title='bbox 0 737 2 851; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 186 551 188 768">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 186 551 188 768">
+     <span class='ocr_line' id='line_1_65' title="bbox 186 551 188 768; baseline 0 101"><span class='ocrx_word' id='word_1_179' title='bbox 186 551 188 768; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 193 740 1083 832">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 193 740 1083 832">
+     <span class='ocr_line' id='line_1_66' title="bbox 227 740 1083 766; baseline 0 -6"><span class='ocrx_word' id='word_1_180' title='bbox 227 749 544 751; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_181' title='bbox 550 741 640 760; x_wconf 80' lang='eng' dir='ltr'>YanieI/a</span> <span class='ocrx_word' id='word_1_182' title='bbox 649 741 791 760; x_wconf 79' lang='eng' dir='ltr'>ha/otolerans</span> <span class='ocrx_word' id='word_1_183' title='bbox 799 741 843 760; x_wconf 93' lang='eng' dir='ltr'>YIM</span> <span class='ocrx_word' id='word_1_184' title='bbox 854 740 936 760; x_wconf 90' lang='eng' dir='ltr'>70085T</span> <span class='ocrx_word' id='word_1_185' title='bbox 945 741 1083 766; x_wconf 88' lang='eng' dir='ltr'>(AY228479)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 193 773 957 799; baseline 0 -5"><span class='ocrx_word' id='word_1_186' title='bbox 193 773 216 789; x_wconf 78' lang='eng'>62</span> <span class='ocrx_word' id='word_1_187' title='bbox 227 775 615 794; x_wconf 84' lang='eng' dir='ltr'>—Nesterenkonia</span> <span class='ocrx_word' id='word_1_188' title='bbox 621 775 708 799; x_wconf 83' lang='eng' dir='ltr'>jeotgali</span> <span class='ocrx_word' id='word_1_189' title='bbox 715 774 810 794; x_wconf 70' lang='eng' dir='ltr'>JCS-241T</span> <span class='ocrx_word' id='word_1_190' title='bbox 819 774 957 799; x_wconf 82' lang='eng' dir='ltr'>(AY928901)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_68' title="bbox 437 807 848 832; baseline 0 -5"><span class='ocrx_word' id='word_1_191' title='bbox 437 808 511 827; x_wconf 81' lang='eng' dir='ltr'><em>Rothia</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 520 808 576 827; x_wconf 84' lang='eng' dir='ltr'><em>aeria</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 586 808 639 827; x_wconf 90' lang='eng' dir='ltr'>GTC</span> <span class='ocrx_word' id='word_1_194' title='bbox 648 807 701 827; x_wconf 77' lang='eng' dir='ltr'>867T</span> <span class='ocrx_word' id='word_1_195' title='bbox 710 808 848 832; x_wconf 87' lang='eng' dir='ltr'>(ABO71952)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 186 766 227 768">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 186 766 227 768">
+     <span class='ocr_line' id='line_1_69' title="bbox 186 766 227 768; baseline 0 101"><span class='ocrx_word' id='word_1_196' title='bbox 186 766 227 768; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 225 749 227 785">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 225 749 227 785">
+     <span class='ocr_line' id='line_1_70' title="bbox 225 749 227 785; baseline 0 84"><span class='ocrx_word' id='word_1_197' title='bbox 225 749 227 785; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 128 658 130 818">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 128 658 130 818">
+     <span class='ocr_line' id='line_1_71' title="bbox 128 658 130 818; baseline 0 51"><span class='ocrx_word' id='word_1_198' title='bbox 128 658 130 818; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 0 849 669 851">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 0 849 669 851">
+     <span class='ocr_line' id='line_1_72' title="bbox 0 849 669 851; baseline 0 18"><span class='ocrx_word' id='word_1_199' title='bbox 0 849 669 851; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 677 841 1204 866">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 677 841 1204 866">
+     <span class='ocr_line' id='line_1_73' title="bbox 677 841 1204 866; baseline 0 -5"><span class='ocrx_word' id='word_1_200' title='bbox 677 842 780 861; x_wconf 86' lang='eng' dir='ltr'>Nocardia</span> <span class='ocrx_word' id='word_1_201' title='bbox 789 842 929 861; x_wconf 85' lang='eng' dir='ltr'>inohanensis</span> <span class='ocrx_word' id='word_1_202' title='bbox 938 842 979 861; x_wconf 95' lang='eng' dir='ltr'>IFM</span> <span class='ocrx_word' id='word_1_203' title='bbox 989 841 1057 861; x_wconf 81' lang='eng' dir='ltr'>0092T</span> <span class='ocrx_word' id='word_1_204' title='bbox 1066 841 1204 866; x_wconf 85' lang='eng' dir='ltr'>(AB092560)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-000.pbm.png
new file mode 100644
index 00000000..502b7258
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-000.pbm.png.hocr
new file mode 100644
index 00000000..77c96de3
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-000.pbm.png.hocr
@@ -0,0 +1,316 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000737-0-000.pbm.png"; bbox 0 0 994 969; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 7 46 72 66">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 7 46 72 66">
+     <span class='ocr_line' id='line_1_1' title="bbox 7 46 72 56; baseline -0.015 0"><span class='ocrx_word' id='word_1_1' title='bbox 7 46 22 56; x_wconf 65' lang='eng' dir='ltr'><strong>&lt;r</strong></span> <span class='ocrx_word' id='word_1_2' title='bbox 58 46 72 55; x_wconf 76' lang='eng' dir='ltr'><em>m</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 7 57 72 66; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 7 57 22 66; x_wconf 69' lang='eng' dir='ltr'>o)</span> <span class='ocrx_word' id='word_1_4' title='bbox 57 57 72 66; x_wconf 65' lang='eng' dir='ltr'>o)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 101 3 233 24">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 102 3 233 24">
+     <span class='ocr_line' id='line_1_3' title="bbox 102 3 233 24; baseline 0 -5"><span class='ocrx_word' id='word_1_5' title='bbox 102 3 193 24; x_wconf 84' lang='eng' dir='ltr'>Similarity</span> <span class='ocrx_word' id='word_1_6' title='bbox 200 3 233 24; x_wconf 83' lang='eng'>(%)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 108 46 172 67">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 108 46 172 67">
+     <span class='ocr_line' id='line_1_4' title="bbox 108 46 172 56; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 108 46 122 56; x_wconf 62' lang='eng' dir='ltr'>no</span> <span class='ocrx_word' id='word_1_8' title='bbox 157 46 172 56; x_wconf 73' lang='eng' dir='ltr'>I\</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 108 58 172 67; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 108 58 122 67; x_wconf 66' lang='eng' dir='ltr'>on</span> <span class='ocrx_word' id='word_1_10' title='bbox 157 58 172 67; x_wconf 73' lang='eng'>07</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 207 46 222 66">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 207 46 222 66">
+     <span class='ocr_line' id='line_1_6' title="bbox 207 46 222 55; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 207 46 222 55; x_wconf 81' lang='eng' dir='ltr'><strong>co</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 207 57 222 66; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 207 57 222 66; x_wconf 62' lang='eng' dir='ltr'>cu</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 260 46 275 66">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 260 46 275 66">
+     <span class='ocr_line' id='line_1_8' title="bbox 260 46 275 55; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 260 46 275 55; x_wconf 67' lang='eng' dir='ltr'><strong>m</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 260 57 275 66; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 260 57 275 66; x_wconf 65' lang='eng' dir='ltr'><strong>m</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 308 34 323 66">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 308 35 323 65">
+     <span class='ocr_line' id='line_1_10' title="bbox 308 35 323 65; textangle 90"><span class='ocrx_word' id='word_1_15' title='bbox 308 35 323 65; x_wconf 92' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 5 73 317 87">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 5 74 317 86">
+     <span class='ocr_line' id='line_1_11' title="bbox 5 74 317 86; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 5 74 317 86; x_wconf 34' lang='eng' dir='ltr'>MW</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 42 335 72 349">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 42 335 72 349">
+     <span class='ocr_line' id='line_1_12' title="bbox 42 335 72 349; baseline 0 0"><span class='ocrx_word' id='word_1_17' title='bbox 42 335 72 349; x_wconf 87' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 4 343 8 946">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 4 343 8 946">
+     <span class='ocr_line' id='line_1_13' title="bbox 4 343 8 946; baseline 0 23"><span class='ocrx_word' id='word_1_18' title='bbox 4 343 8 946; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 93 104 95 148">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 93 104 95 148">
+     <span class='ocr_line' id='line_1_14' title="bbox 93 104 95 148; baseline 0 821"><span class='ocrx_word' id='word_1_19' title='bbox 93 104 95 148; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 102 119 132 134">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 102 119 132 134">
+     <span class='ocr_line' id='line_1_15' title="bbox 102 119 132 134; baseline 0 0"><span class='ocrx_word' id='word_1_20' title='bbox 102 119 132 134; x_wconf 88' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 95 146 161 148">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 95 146 161 148">
+     <span class='ocr_line' id='line_1_16' title="bbox 95 146 161 148; baseline 0 821"><span class='ocrx_word' id='word_1_21' title='bbox 95 146 161 148; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 131 204 151 219">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 131 204 151 219">
+     <span class='ocr_line' id='line_1_17' title="bbox 131 204 151 219; baseline 0 0"><span class='ocrx_word' id='word_1_22' title='bbox 131 204 151 219; x_wconf 88' lang='eng'><strong>52</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 95 104 167 106">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 95 104 167 106">
+     <span class='ocr_line' id='line_1_18' title="bbox 95 104 167 106; baseline 0 863"><span class='ocrx_word' id='word_1_23' title='bbox 95 104 167 106; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 125 232 199 234">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 125 232 199 234">
+     <span class='ocr_line' id='line_1_19' title="bbox 125 232 199 234; baseline 0 735"><span class='ocrx_word' id='word_1_24' title='bbox 125 232 199 234; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 123 310 205 312">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 123 310 205 312">
+     <span class='ocr_line' id='line_1_20' title="bbox 123 310 205 312; baseline 0 657"><span class='ocrx_word' id='word_1_25' title='bbox 123 310 205 312; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 133 389 153 403">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 133 389 153 403">
+     <span class='ocr_line' id='line_1_21' title="bbox 133 389 153 403; baseline 0 0"><span class='ocrx_word' id='word_1_26' title='bbox 133 389 153 403; x_wconf 86' lang='eng'><em>58</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 123 188 125 480">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 123 188 125 480">
+     <span class='ocr_line' id='line_1_22' title="bbox 123 188 125 480; baseline 0 489"><span class='ocrx_word' id='word_1_27' title='bbox 123 188 125 480; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 128 485 158 500">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 128 485 158 500">
+     <span class='ocr_line' id='line_1_23' title="bbox 128 485 158 500; baseline 0 0"><span class='ocrx_word' id='word_1_28' title='bbox 128 485 158 500; x_wconf 87' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 108 547 138 562">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 108 547 138 562">
+     <span class='ocr_line' id='line_1_24' title="bbox 108 547 138 562; baseline 0 0"><span class='ocrx_word' id='word_1_29' title='bbox 108 547 138 562; x_wconf 87' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 98 302 102 808">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 98 302 102 808">
+     <span class='ocr_line' id='line_1_25' title="bbox 98 302 102 808; baseline 0 161"><span class='ocrx_word' id='word_1_30' title='bbox 98 302 102 808; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 143 655 145 844">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 143 655 145 844">
+     <span class='ocr_line' id='line_1_26' title="bbox 143 655 145 844; baseline 0 125"><span class='ocrx_word' id='word_1_31' title='bbox 143 655 145 844; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 203 274 205 345">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 203 274 205 345">
+     <span class='ocr_line' id='line_1_27' title="bbox 203 274 205 345; baseline 0 624"><span class='ocrx_word' id='word_1_32' title='bbox 203 274 205 345; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 168 315 198 329">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 168 315 198 329">
+     <span class='ocr_line' id='line_1_28' title="bbox 168 315 198 329; baseline 0 0"><span class='ocrx_word' id='word_1_33' title='bbox 168 315 198 329; x_wconf 88' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 180 513 210 559">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 180 513 210 559">
+     <span class='ocr_line' id='line_1_29' title="bbox 180 513 210 527; baseline 0 0"><span class='ocrx_word' id='word_1_34' title='bbox 180 513 210 527; x_wconf 89' lang='eng'>100</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 180 545 210 559; baseline 0 0"><span class='ocrx_word' id='word_1_35' title='bbox 180 545 210 559; x_wconf 89' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 95 606 217 911">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 95 606 217 911">
+     <span class='ocr_line' id='line_1_31' title="bbox 95 606 217 911; baseline 0 58"><span class='ocrx_word' id='word_1_36' title='bbox 95 606 217 911; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 125 188 221 190">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 125 188 221 190">
+     <span class='ocr_line' id='line_1_32' title="bbox 125 188 221 190; baseline 0 779"><span class='ocrx_word' id='word_1_37' title='bbox 125 188 221 190; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 219 341 239 356">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 219 341 239 356">
+     <span class='ocr_line' id='line_1_33' title="bbox 219 341 239 356; baseline 0 0"><span class='ocrx_word' id='word_1_38' title='bbox 219 341 239 356; x_wconf 79' lang='eng'>73</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 254 375 274 389">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 254 375 274 389">
+     <span class='ocr_line' id='line_1_34' title="bbox 254 375 274 389; baseline 0 0"><span class='ocrx_word' id='word_1_39' title='bbox 254 375 274 389; x_wconf 79' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 330 96 575 962">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 331 96 548 245">
+     <span class='ocr_line' id='line_1_35' title="bbox 333 96 424 119; baseline 0 0"><span class='ocrx_word' id='word_1_40' title='bbox 333 96 424 119; x_wconf 86' lang='eng' dir='ltr'>HJ039T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 333 138 548 161; baseline 0 0"><span class='ocrx_word' id='word_1_41' title='bbox 333 138 548 161; x_wconf 89' lang='eng' dir='ltr'>UST040317—058T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 332 180 430 203; baseline 0 0"><span class='ocrx_word' id='word_1_42' title='bbox 332 180 430 203; x_wconf 84' lang='eng' dir='ltr'>OSZ17T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 331 222 418 245; baseline 0 0"><span class='ocrx_word' id='word_1_43' title='bbox 331 222 418 245; x_wconf 92' lang='eng' dir='ltr'>TF-27T</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 333 264 406 287">
+     <span class='ocr_line' id='line_1_39' title="bbox 333 264 406 287; baseline 0 0"><span class='ocrx_word' id='word_1_44' title='bbox 333 266 374 287; x_wconf 95' lang='eng' dir='ltr'>LT1</span> <span class='ocrx_word' id='word_1_45' title='bbox 380 264 406 287; x_wconf 92' lang='eng' dir='ltr'>7T</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 331 306 478 497">
+     <span class='ocr_line' id='line_1_40' title="bbox 331 306 447 329; baseline 0 0"><span class='ocrx_word' id='word_1_46' title='bbox 331 308 410 329; x_wconf 89' lang='eng' dir='ltr'>ACEM</span> <span class='ocrx_word' id='word_1_47' title='bbox 421 306 447 329; x_wconf 86' lang='eng' dir='ltr'>9T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 333 348 478 371; baseline 0 0"><span class='ocrx_word' id='word_1_48' title='bbox 333 351 395 371; x_wconf 93' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_49' title='bbox 406 348 478 371; x_wconf 85' lang='eng' dir='ltr'>3597T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 333 390 478 413; baseline 0 0"><span class='ocrx_word' id='word_1_50' title='bbox 333 392 395 413; x_wconf 94' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_51' title='bbox 405 390 478 413; x_wconf 87' lang='eng' dir='ltr'>3299T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 331 432 478 455; baseline 0 0"><span class='ocrx_word' id='word_1_52' title='bbox 331 434 410 455; x_wconf 92' lang='eng' dir='ltr'>ACAM</span> <span class='ocrx_word' id='word_1_53' title='bbox 421 434 461 455; x_wconf 85' lang='eng'>591</span> <span class='ocrx_word' id='word_1_54' title='bbox 467 432 478 447; x_wconf 95' lang='eng' dir='ltr'>T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 333 474 382 497; baseline 0 0"><span class='ocrx_word' id='word_1_55' title='bbox 333 474 382 497; x_wconf 88' lang='eng' dir='ltr'>M7T</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 333 516 489 581">
+     <span class='ocr_line' id='line_1_45' title="bbox 333 516 489 539; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 333 518 390 539; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_57' title='bbox 402 516 489 539; x_wconf 86' lang='eng' dir='ltr'>19866T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 333 560 369 581; baseline 0 0"><span class='ocrx_word' id='word_1_58' title='bbox 333 560 369 581; x_wconf 90' lang='eng' dir='ltr'>M5</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 333 601 408 624">
+     <span class='ocr_line' id='line_1_47' title="bbox 333 601 408 624; baseline 0.013 -1"><span class='ocrx_word' id='word_1_59' title='bbox 333 601 408 624; x_wconf 89' lang='eng' dir='ltr'>PO10T</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 333 642 422 666">
+     <span class='ocr_line' id='line_1_48' title="bbox 333 642 422 666; baseline 0.011 -1"><span class='ocrx_word' id='word_1_60' title='bbox 333 645 374 665; x_wconf 96' lang='eng' dir='ltr'>LT1</span> <span class='ocrx_word' id='word_1_61' title='bbox 380 642 422 666; x_wconf 74' lang='eng' dir='ltr'>SaT</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 331 684 489 749">
+     <span class='ocr_line' id='line_1_49' title="bbox 331 684 489 708; baseline 0.006 -1"><span class='ocrx_word' id='word_1_62' title='bbox 331 686 406 708; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_63' title='bbox 416 687 473 708; x_wconf 88' lang='eng'>8071</span> <span class='ocrx_word' id='word_1_64' title='bbox 478 684 489 699; x_wconf 92' lang='eng' dir='ltr'>T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 333 726 412 749; baseline 0 0"><span class='ocrx_word' id='word_1_65' title='bbox 333 729 352 749; x_wconf 94' lang='eng' dir='ltr'>M</span> <span class='ocrx_word' id='word_1_66' title='bbox 356 729 395 749; x_wconf 92' lang='eng' dir='ltr'>R—1</span> <span class='ocrx_word' id='word_1_67' title='bbox 400 726 412 741; x_wconf 92' lang='eng' dir='ltr'>T</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 331 768 507 833">
+     <span class='ocr_line' id='line_1_51' title="bbox 333 768 507 791; baseline 0 0"><span class='ocrx_word' id='word_1_68' title='bbox 333 770 408 791; x_wconf 93' lang='eng' dir='ltr'>NCTC</span> <span class='ocrx_word' id='word_1_69' title='bbox 420 768 507 791; x_wconf 85' lang='eng' dir='ltr'>10735T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 331 810 406 833; baseline 0 0"><span class='ocrx_word' id='word_1_70' title='bbox 331 810 406 833; x_wconf 86' lang='eng' dir='ltr'>T147T</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 331 854 574 962">
+     <span class='ocr_line' id='line_1_53' title="bbox 333 854 425 877; baseline 0 0"><span class='ocrx_word' id='word_1_71' title='bbox 333 857 393 877; x_wconf 96' lang='eng' dir='ltr'>U141</span> <span class='ocrx_word' id='word_1_72' title='bbox 399 854 425 877; x_wconf 91' lang='eng' dir='ltr'>7T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 332 896 574 920; baseline 0 0"><span class='ocrx_word' id='word_1_73' title='bbox 332 898 429 920; x_wconf 88' lang='eng' dir='ltr'><strong>CCTCC</strong></span> <span class='ocrx_word' id='word_1_74' title='bbox 439 899 459 920; x_wconf 93' lang='eng' dir='ltr'>M</span> <span class='ocrx_word' id='word_1_75' title='bbox 469 896 574 920; x_wconf 84' lang='eng' dir='ltr'>203093T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 331 939 505 962; baseline 0 0"><span class='ocrx_word' id='word_1_76' title='bbox 331 941 406 962; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_77' title='bbox 417 941 442 962; x_wconf 93' lang='eng'>51</span> <span class='ocrx_word' id='word_1_78' title='bbox 449 939 505 962; x_wconf 86' lang='eng' dir='ltr'>192T</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 603 97 992 968">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 604 98 992 967">
+     <span class='ocr_line' id='line_1_56' title="bbox 604 98 992 124; baseline 0 -5"><span class='ocrx_word' id='word_1_79' title='bbox 604 98 626 119; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_80' title='bbox 637 98 750 124; x_wconf 87' lang='eng' dir='ltr'>spongiae</span> <span class='ocrx_word' id='word_1_81' title='bbox 860 98 992 120; x_wconf 87' lang='eng' dir='ltr'>DQ167234</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 604 140 992 162; baseline 0 -1"><span class='ocrx_word' id='word_1_82' title='bbox 604 140 626 161; x_wconf 87' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_83' title='bbox 638 140 725 161; x_wconf 87' lang='eng' dir='ltr'>irciniae</span> <span class='ocrx_word' id='word_1_84' title='bbox 860 140 992 162; x_wconf 88' lang='eng' dir='ltr'>DQ180743</span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 604 182 983 203; baseline 0 0"><span class='ocrx_word' id='word_1_85' title='bbox 604 182 626 203; x_wconf 87' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_86' title='bbox 638 182 786 203; x_wconf 85' lang='eng' dir='ltr'>denitriﬁcans</span> <span class='ocrx_word' id='word_1_87' title='bbox 858 182 983 203; x_wconf 88' lang='eng' dir='ltr'>AJ311964</span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 604 224 987 251; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 604 224 626 245; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_89' title='bbox 637 224 736 251; x_wconf 82' lang='eng' dir='ltr'>gaetbuli</span> <span class='ocrx_word' id='word_1_90' title='bbox 858 224 987 245; x_wconf 83' lang='eng' dir='ltr'>AY190533</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 604 266 987 293; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 604 266 626 287; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_92' title='bbox 638 266 795 293; x_wconf 83' lang='eng' dir='ltr'>donghaensis</span> <span class='ocrx_word' id='word_1_93' title='bbox 858 266 987 287; x_wconf 89' lang='eng' dir='ltr'>AY326275</span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 604 308 986 335; baseline 0 -6"><span class='ocrx_word' id='word_1_94' title='bbox 604 308 626 329; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_95' title='bbox 637 309 740 335; x_wconf 84' lang='eng' dir='ltr'>o/Ieyana</span> <span class='ocrx_word' id='word_1_96' title='bbox 858 309 986 329; x_wconf 83' lang='eng' dir='ltr'>AF295592</span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 604 350 986 377; baseline 0 -6"><span class='ocrx_word' id='word_1_97' title='bbox 604 350 626 371; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_98' title='bbox 636 350 731 377; x_wconf 85' lang='eng' dir='ltr'>paciﬁca</span> <span class='ocrx_word' id='word_1_99' title='bbox 858 351 986 371; x_wconf 88' lang='eng' dir='ltr'>AF500075</span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 604 392 982 419; baseline 0 -6"><span class='ocrx_word' id='word_1_100' title='bbox 604 392 626 413; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_101' title='bbox 633 392 740 419; x_wconf 84' lang='eng' dir='ltr'>japonica</span> <span class='ocrx_word' id='word_1_102' title='bbox 858 392 982 413; x_wconf 88' lang='eng' dir='ltr'>AF145921</span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 604 434 955 461; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 604 434 626 455; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_104' title='bbox 638 434 789 461; x_wconf 78' lang='eng' dir='ltr'>frigid/marina</span> <span class='ocrx_word' id='word_1_105' title='bbox 860 434 955 455; x_wconf 86' lang='eng' dir='ltr'>U85903</span> 
+     </span>
+     <span class='ocr_line' id='line_1_65' title="bbox 855 476 990 497; baseline 0 0"><span class='ocrx_word' id='word_1_106' title='bbox 855 476 990 497; x_wconf 87' lang='eng' dir='ltr'>AM980877</span> 
+     </span>
+     <span class='ocr_line' id='line_1_66' title="bbox 604 518 983 545; baseline 0 -6"><span class='ocrx_word' id='word_1_107' title='bbox 604 518 626 539; x_wconf 87' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_108' title='bbox 637 518 819 545; x_wconf 81' lang='eng' dir='ltr'>livingstonensis</span> <span class='ocrx_word' id='word_1_109' title='bbox 858 518 983 539; x_wconf 90' lang='eng' dir='ltr'>AJ300834</span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 855 560 989 581; baseline 0 0"><span class='ocrx_word' id='word_1_110' title='bbox 855 560 989 581; x_wconf 85' lang='eng' dir='ltr'>AM980878</span> 
+     </span>
+     <span class='ocr_line' id='line_1_68' title="bbox 604 603 987 624; baseline 0.003 -1"><span class='ocrx_word' id='word_1_111' title='bbox 604 603 626 624; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_112' title='bbox 637 603 763 624; x_wconf 84' lang='eng' dir='ltr'>hafniensis</span> <span class='ocrx_word' id='word_1_113' title='bbox 858 603 987 624; x_wconf 80' lang='eng' dir='ltr'>A8205566</span> 
+     </span>
+     <span class='ocr_line' id='line_1_69' title="bbox 604 644 983 671; baseline -0.003 -5"><span class='ocrx_word' id='word_1_114' title='bbox 604 644 626 666; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_115' title='bbox 636 644 747 671; x_wconf 85' lang='eng' dir='ltr'><em>profunda</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 858 645 983 666; x_wconf 85' lang='eng' dir='ltr'>AY445591</span> 
+     </span>
+     <span class='ocr_line' id='line_1_70' title="bbox 604 686 953 713; baseline -0.003 -5"><span class='ocrx_word' id='word_1_117' title='bbox 604 686 626 708; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_118' title='bbox 636 686 789 713; x_wconf 85' lang='eng' dir='ltr'>putrefaciens</span> <span class='ocrx_word' id='word_1_119' title='bbox 858 687 953 708; x_wconf 83' lang='eng' dir='ltr'>X82133</span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 604 728 982 750; baseline -0.003 0"><span class='ocrx_word' id='word_1_120' title='bbox 604 728 626 750; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_121' title='bbox 638 729 770 750; x_wconf 86' lang='eng' dir='ltr'>oneidensis</span> <span class='ocrx_word' id='word_1_122' title='bbox 858 729 982 750; x_wconf 89' lang='eng' dir='ltr'>AF005251</span> 
+     </span>
+     <span class='ocr_line' id='line_1_72' title="bbox 604 770 983 791; baseline 0 0"><span class='ocrx_word' id='word_1_123' title='bbox 604 770 626 791; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_124' title='bbox 637 771 717 791; x_wconf 82' lang='eng' dir='ltr'>baltica</span> <span class='ocrx_word' id='word_1_125' title='bbox 858 771 983 791; x_wconf 89' lang='eng' dir='ltr'>AJ000214</span> 
+     </span>
+     <span class='ocr_line' id='line_1_73' title="bbox 604 812 983 839; baseline 0 -6"><span class='ocrx_word' id='word_1_126' title='bbox 604 812 626 833; x_wconf 87' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_127' title='bbox 637 812 830 839; x_wconf 85' lang='eng' dir='ltr'>glacia/ipiscico/a</span> <span class='ocrx_word' id='word_1_128' title='bbox 858 812 983 833; x_wconf 86' lang='eng' dir='ltr'>AB205571</span> 
+     </span>
+     <span class='ocr_line' id='line_1_74' title="bbox 604 856 987 877; baseline 0 0"><span class='ocrx_word' id='word_1_129' title='bbox 604 856 626 877; x_wconf 68' lang='eng' dir='ltr'>S,</span> <span class='ocrx_word' id='word_1_130' title='bbox 637 857 747 877; x_wconf 88' lang='eng' dir='ltr'><em>morhuae</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 858 857 987 877; x_wconf 78' lang='eng' dir='ltr'>A3205576</span> 
+     </span>
+     <span class='ocr_line' id='line_1_75' title="bbox 604 898 979 920; baseline 0 0"><span class='ocrx_word' id='word_1_132' title='bbox 604 898 626 920; x_wconf 86' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_133' title='bbox 638 899 810 920; x_wconf 85' lang='eng' dir='ltr'>deco/orationis</span> <span class='ocrx_word' id='word_1_134' title='bbox 858 899 979 920; x_wconf 85' lang='eng' dir='ltr'>AJ609571</span> 
+     </span>
+     <span class='ocr_line' id='line_1_76' title="bbox 604 941 986 967; baseline 0 -5"><span class='ocrx_word' id='word_1_135' title='bbox 604 941 626 962; x_wconf 87' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_136' title='bbox 637 941 704 967; x_wconf 84' lang='eng' dir='ltr'><em>algae</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 858 941 986 962; x_wconf 83' lang='eng' dir='ltr'>AF005249</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-001.pbm.png
new file mode 100644
index 00000000..6c507c27
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-001.pbm.png.hocr
new file mode 100644
index 00000000..f9971b18
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000737-0-001.pbm.png.hocr
@@ -0,0 +1,416 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000737-0-001.pbm.png"; bbox 0 0 1231 1126; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 7 1 1230 913">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 75 1 1230 384">
+     <span class='ocr_line' id='line_1_1' title="bbox 342 1 981 31; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 342 12 366 29; x_wconf 77' lang='eng'><em>73</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 383 13 509 15; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_3' title='bbox 518 3 540 25; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 552 4 633 25; x_wconf 84' lang='eng' dir='ltr'><em>bait/ca</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 644 3 720 25; x_wconf 94' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 732 1 821 25; x_wconf 90' lang='eng' dir='ltr'><em>10735T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 831 3 981 31; x_wconf 79' lang='eng' dir='ltr'><em>(A8231331)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 313 36 932 66; baseline 0 -6"><span class='ocrx_word' id='word_1_8' title='bbox 313 38 338 56; x_wconf 79' lang='eng'><em>88</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 383 48 512 50; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_10' title='bbox 524 39 545 60; x_wconf 90' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 557 39 685 60; x_wconf 81' lang='eng' dir='ltr'><em>hafniensis</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 695 36 772 60; x_wconf 92' lang='eng' dir='ltr'><em>PO10T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 782 39 932 66; x_wconf 86' lang='eng' dir='ltr'><em>(AB208056)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 75 71 1081 102; baseline -0.007 0"><span class='ocrx_word' id='word_1_14' title='bbox 75 84 86 102; x_wconf 92' lang='eng'>0</span> <span class='ocrx_word' id='word_1_15' title='bbox 94 84 119 102; x_wconf 91' lang='eng'><em>02</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 284 78 308 95; x_wconf 84' lang='eng'><strong><em>88</em></strong></span> <span class='ocrx_word' id='word_1_17' title='bbox 354 84 553 86; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_18' title='bbox 564 74 586 95; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 597 74 753 101; x_wconf 83' lang='eng' dir='ltr'><em>putrefaciens</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 762 74 838 95; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 849 71 922 95; x_wconf 89' lang='eng' dir='ltr'><em>8071T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 932 74 1081 101; x_wconf 82' lang='eng' dir='ltr'><em>(AFOO5669)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 483 107 1036 136; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 483 119 551 121; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_24' title='bbox 561 109 583 130; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 594 109 790 136; x_wconf 84' lang='eng' dir='ltr'><em>glacialipiscico/a</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 799 107 876 130; x_wconf 93' lang='eng' dir='ltr'><em>T147T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 885 109 1036 136; x_wconf 82' lang='eng' dir='ltr'><em>(ABZ66200)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 598 142 1008 171; baseline -0.002 -5"><span class='ocrx_word' id='word_1_28' title='bbox 598 144 620 166; x_wconf 94' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 632 144 744 166; x_wconf 84' lang='eng' dir='ltr'><em>morhuae</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 754 142 848 166; x_wconf 91' lang='eng' dir='ltr'><em>U1417T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 858 144 1008 171; x_wconf 79' lang='eng' dir='ltr'><em>(A3208062)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 382 177 1230 207; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 382 189 599 191; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_33' title='bbox 610 180 632 201; x_wconf 92' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 644 180 819 201; x_wconf 78' lang='eng' dir='ltr'><em>deceleration/s</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 829 179 927 201; x_wconf 91' lang='eng' dir='ltr'><strong>CCTCC</strong></span> <span class='ocrx_word' id='word_1_36' title='bbox 938 180 958 201; x_wconf 95' lang='eng' dir='ltr'>M</span> <span class='ocrx_word' id='word_1_37' title='bbox 969 177 1075 201; x_wconf 79' lang='eng' dir='ltr'><em>203093T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1085 180 1230 207; x_wconf 84' lang='eng' dir='ltr'><em>(AJ609572)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 331 212 991 242; baseline 0 -6"><span class='ocrx_word' id='word_1_39' title='bbox 331 216 368 233; x_wconf 89' lang='eng'>100</span> <span class='ocrx_word' id='word_1_40' title='bbox 382 224 562 226; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_41' title='bbox 571 215 593 236; x_wconf 87' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 605 215 741 236; x_wconf 83' lang='eng' dir='ltr'><em>oneidensis</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 751 212 830 236; x_wconf 92' lang='eng' dir='ltr'><em>MR-1T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 840 215 991 242; x_wconf 83' lang='eng' dir='ltr'><em>(AEO14299)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 220 248 1080 277; baseline 0.002 -7"><span class='ocrx_word' id='word_1_45' title='bbox 220 260 613 262; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_46' title='bbox 623 250 645 271; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 658 250 810 272; x_wconf 81' lang='eng' dir='ltr'><em>denitrificans</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 819 248 918 272; x_wconf 83' lang='eng' dir='ltr'><em>08217T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 928 250 1080 277; x_wconf 85' lang='eng' dir='ltr'><em>(CP000302)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 179 283 905 318; baseline 0 -11"><span class='ocrx_word' id='word_1_50' title='bbox 179 299 203 318; x_wconf 71' lang='eng'><em>79</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 370 295 595 297; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_52' title='bbox 603 285 682 307; x_wconf 85' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 694 283 743 307; x_wconf 90' lang='eng' dir='ltr'><em>M7T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 753 286 905 313; x_wconf 91' lang='eng' dir='ltr'><em>(EU702750)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 321 319 1192 349; baseline -0.001 -6"><span class='ocrx_word' id='word_1_55' title='bbox 321 331 358 349; x_wconf 74' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 427 331 675 333; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_57' title='bbox 686 321 708 343; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 720 321 874 348; x_wconf 84' lang='eng' dir='ltr'><em>frigidimarina</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 883 321 964 343; x_wconf 90' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 975 319 1033 343; x_wconf 77' lang='eng' dir='ltr'><em>591T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1043 321 1192 348; x_wconf 83' lang='eng' dir='ltr'><em>(AF014947)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 386 354 1195 384; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 386 357 410 375; x_wconf 82' lang='eng'><em>97</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 427 366 691 368; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_64' title='bbox 701 356 724 378; x_wconf 92' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 735 357 944 384; x_wconf 86' lang='eng' dir='ltr'><em>livingstonensis</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 954 354 1034 378; x_wconf 86' lang='eng' dir='ltr'><em>NF22T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 1043 356 1195 384; x_wconf 92' lang='eng' dir='ltr'><em>(EU702751)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 97 389 956 454">
+     <span class='ocr_line' id='line_1_12' title="bbox 137 389 900 419; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 137 401 451 403; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_69' title='bbox 460 392 482 413; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 495 392 669 419; x_wconf 82' lang='eng' dir='ltr'><em>algidipisc/cola</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 679 389 740 413; x_wconf 78' lang='eng' dir='ltr'><em>S13T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 750 392 900 419; x_wconf 82' lang='eng' dir='ltr'><em>(ABZ66202)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 97 424 956 454; baseline 0 -6"><span class='ocrx_word' id='word_1_73' title='bbox 97 428 122 445; x_wconf 88' lang='eng'><em>82</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 137 436 429 438; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_75' title='bbox 438 427 460 448; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 472 427 610 448; x_wconf 83' lang='eng' dir='ltr'><em>colwelliana</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 619 427 696 448; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 707 424 796 448; x_wconf 81' lang='eng' dir='ltr'><em>39565T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 806 427 956 454; x_wconf 88' lang='eng' dir='ltr'><em>(AB266207)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 173 460 924 489">
+     <span class='ocr_line' id='line_1_14' title="bbox 173 460 924 489; baseline 0 -6"><span class='ocrx_word' id='word_1_80' title='bbox 173 472 464 474; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_81' title='bbox 474 462 496 483; x_wconf 92' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 507 462 677 489; x_wconf 80' lang='eng' dir='ltr'><em>piezotolerans</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 686 460 759 483; x_wconf 50' lang='eng' dir='ltr'><em>WP?)T</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 769 462 924 489; x_wconf 88' lang='eng' dir='ltr'><em>(AM229308)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 158 497 914 631">
+     <span class='ocr_line' id='line_1_15' title="bbox 529 497 799 525; baseline 0 -6"><span class='ocrx_word' id='word_1_85' title='bbox 529 497 550 519; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 563 497 635 519; x_wconf 83' lang='eng' dir='ltr'><em>fidelis</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 644 497 799 525; x_wconf 85' lang='eng' dir='ltr'><em>(AM229309)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 260 530 897 560; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 260 541 285 558; x_wconf 80' lang='eng'><em>93</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 300 542 443 545; x_wconf 83' lang='eng'>—</span> <span class='ocrx_word' id='word_1_90' title='bbox 453 533 475 554; x_wconf 92' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 487 533 664 554; x_wconf 79' lang='eng' dir='ltr'><em>marinintestina</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 675 530 737 554; x_wconf 93' lang='eng' dir='ltr'><em>IK-1T</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 747 533 897 560; x_wconf 86' lang='eng' dir='ltr'><em>(AB081763)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 158 561 819 595; baseline 0 -6"><span class='ocrx_word' id='word_1_94' title='bbox 158 561 183 579; x_wconf 74' lang='eng'><em>89</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 300 577 432 579; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_96' title='bbox 443 568 465 589; x_wconf 87' lang='eng' dir='ltr'><strong><em>s.</em></strong></span> <span class='ocrx_word' id='word_1_97' title='bbox 477 568 554 589; x_wconf 80' lang='eng' dir='ltr'><em>sairae</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 564 565 658 589; x_wconf 83' lang='eng' dir='ltr'><em>SM2-1T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 668 568 819 595; x_wconf 88' lang='eng' dir='ltr'><em>(AB081768)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 195 601 914 631; baseline -0.001 -5"><span class='ocrx_word' id='word_1_100' title='bbox 195 609 220 626; x_wconf 84' lang='eng'><em>63</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 447 604 469 625; x_wconf 94' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 481 604 638 631; x_wconf 82' lang='eng' dir='ltr'><em>sohlegeliana</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 649 601 754 625; x_wconf 90' lang='eng' dir='ltr'><em>HRKA1T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 764 604 914 631; x_wconf 79' lang='eng' dir='ltr'><em>(ABOB1766)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 7 636 1071 913">
+     <span class='ocr_line' id='line_1_19' title="bbox 7 636 965 672; baseline 0 -12"><span class='ocrx_word' id='word_1_105' title='bbox 7 654 32 672; x_wconf 75' lang='eng'><em>65</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 206 649 230 666; x_wconf 77' lang='eng'><em>72</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 305 648 461 651; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_108' title='bbox 472 639 494 660; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 507 639 655 660; x_wconf 84' lang='eng' dir='ltr'><em>halifaxensis</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 665 636 806 660; x_wconf 95' lang='eng' dir='ltr'><em>HAW-EB4T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 816 639 965 666; x_wconf 88' lang='eng' dir='ltr'><em>(AY842131)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 267 672 1071 701; baseline 0.002 -7"><span class='ocrx_word' id='word_1_112' title='bbox 267 675 292 693; x_wconf 89' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 307 684 604 686; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_114' title='bbox 613 674 635 696; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 646 674 763 701; x_wconf 86' lang='eng' dir='ltr'><em>pea/eana</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 772 672 913 697; x_wconf 87' lang='eng' dir='ltr'><em>ANG—SQ1T</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 922 674 1071 701; x_wconf 88' lang='eng' dir='ltr'><em>(AF014945)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 195 707 1036 737; baseline 0 -6"><span class='ocrx_word' id='word_1_118' title='bbox 195 719 521 721; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_119' title='bbox 532 710 554 731; x_wconf 93' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 565 710 718 737; x_wconf 81' lang='eng' dir='ltr'><em>gel/dimarina</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 727 709 808 731; x_wconf 88' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 818 707 877 731; x_wconf 81' lang='eng' dir='ltr'><em>456T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 887 710 1036 737; x_wconf 86' lang='eng' dir='ltr'><em>(AF014946)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 145 742 913 771; baseline 0 -5"><span class='ocrx_word' id='word_1_124' title='bbox 145 745 181 763; x_wconf 89' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 195 754 424 756; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_126' title='bbox 435 744 457 766; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 469 745 571 766; x_wconf 84' lang='eng' dir='ltr'><em>hanedai</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 578 744 654 766; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 665 742 755 766; x_wconf 77' lang='eng' dir='ltr'><em>33224T</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 765 744 913 771; x_wconf 84' lang='eng' dir='ltr'><em>(AFOO5693)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 141 777 844 807; baseline 0 -6"><span class='ocrx_word' id='word_1_131' title='bbox 141 789 370 791; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_132' title='bbox 381 780 403 801; x_wconf 90' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 415 780 533 801; x_wconf 84' lang='eng' dir='ltr'><em>sediminis</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 544 777 683 801; x_wconf 83' lang='eng' dir='ltr'><em>HAW-EB3T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 693 780 844 807; x_wconf 88' lang='eng' dir='ltr'><em>(AY842130)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 99 813 907 847; baseline 0 -11"><span class='ocrx_word' id='word_1_136' title='bbox 99 829 123 847; x_wconf 68' lang='eng'>99</span> <span class='ocrx_word' id='word_1_137' title='bbox 143 824 521 827; x_wconf 85' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_138' title='bbox 532 815 554 836; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 567 815 655 842; x_wconf 91' lang='eng' dir='ltr'><em>woodyi</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 664 813 748 836; x_wconf 80' lang='eng' dir='ltr'><em>M332T</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 758 815 907 842; x_wconf 85' lang='eng' dir='ltr'><em>(AF014944)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 179 848 873 877; baseline -0.001 -5"><span class='ocrx_word' id='word_1_142' title='bbox 179 860 414 862; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_143' title='bbox 423 850 445 872; x_wconf 95' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 457 850 562 872; x_wconf 82' lang='eng' dir='ltr'><em>atlantica</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 573 848 713 872; x_wconf 80' lang='eng' dir='ltr'><em>HAW-E35T</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 723 850 873 877; x_wconf 86' lang='eng' dir='ltr'><em>(AY842132)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 138 883 933 913; baseline 0.003 -8"><span class='ocrx_word' id='word_1_147' title='bbox 138 887 162 905; x_wconf 88' lang='eng'><em>78</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 179 895 434 897; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_149' title='bbox 445 886 467 907; x_wconf 90' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 479 886 623 907; x_wconf 86' lang='eng' dir='ltr'><em>canadensis</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 633 883 773 907; x_wconf 81' lang='eng' dir='ltr'><em>HAW-E82T</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 783 886 933 913; x_wconf 88' lang='eng' dir='ltr'><em>(AY842129)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 40 919 976 1019">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 40 919 976 1019">
+     <span class='ocr_line' id='line_1_27' title="bbox 452 919 892 948; baseline -0.002 -5"><span class='ocrx_word' id='word_1_153' title='bbox 452 921 474 943; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 485 922 645 948; x_wconf 87' lang='eng' dir='ltr'><em>psychrophila</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 654 919 727 942; x_wconf 89' lang='eng' dir='ltr'><em>WP2T</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 737 921 892 948; x_wconf 86' lang='eng' dir='ltr'><em>(AM229307)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 40 931 976 1003; baseline 0 -25"><span class='ocrx_word' id='word_1_157' title='bbox 40 931 513 1003; x_wconf 49' lang='eng'><em>£8.</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 525 957 631 978; x_wconf 84' lang='eng' dir='ltr'><em>benthica</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 641 956 717 978; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 727 954 818 978; x_wconf 78' lang='eng' dir='ltr'><em>43992T</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 828 956 976 984; x_wconf 83' lang='eng' dir='ltr'><em>(AFO14949)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 276 992 798 1019; baseline 0 -6"><span class='ocrx_word' id='word_1_162' title='bbox 276 993 300 1010; x_wconf 83' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 500 992 522 1013; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 535 992 637 1013; x_wconf 84' lang='eng' dir='ltr'><em>violacea</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 647 992 798 1019; x_wconf 79' lang='eng' dir='ltr'><em>(A8092340)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 1 1025 1143 1125">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 1 1025 1143 1125">
+     <span class='ocr_line' id='line_1_30' title="bbox 40 1025 809 1054; baseline 0.004 -8"><span class='ocrx_word' id='word_1_166' title='bbox 40 1036 439 1038; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_167' title='bbox 450 1027 472 1049; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 484 1027 563 1049; x_wconf 86' lang='eng' dir='ltr'><em>Ioihica</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 575 1025 648 1048; x_wconf 91' lang='eng' dir='ltr'><em>PV-4T</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 657 1027 809 1054; x_wconf 83' lang='eng' dir='ltr'><em>(CP000606)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 1 1060 1143 1090; baseline 0 -6"><span class='ocrx_word' id='word_1_171' title='bbox 1 1072 25 1089; x_wconf 67' lang='eng'><em>35</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 696 1062 718 1084; x_wconf 87' lang='eng' dir='ltr'><strong><em>s.</em></strong></span> <span class='ocrx_word' id='word_1_173' title='bbox 730 1063 799 1090; x_wconf 86' lang='eng' dir='ltr'><em>algae</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 808 1062 884 1084; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 895 1060 984 1084; x_wconf 76' lang='eng' dir='ltr'><em>51192T</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 995 1062 1143 1090; x_wconf 86' lang='eng' dir='ltr'><em>(AF005686)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 89 1095 1009 1125; baseline 0.003 -8"><span class='ocrx_word' id='word_1_177' title='bbox 89 1099 125 1116; x_wconf 86' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 137 1107 545 1109; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_179' title='bbox 556 1098 578 1119; x_wconf 90' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 590 1098 758 1119; x_wconf 86' lang='eng' dir='ltr'><em>amazonensis</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 767 1095 850 1119; x_wconf 80' lang='eng' dir='ltr'><em>SBZBT</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 860 1098 1009 1125; x_wconf 89' lang='eng' dir='ltr'><em>(AF005257)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 381 13 383 50">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 381 13 383 50">
+     <span class='ocr_line' id='line_1_33' title="bbox 381 13 383 50; baseline 0 1076"><span class='ocrx_word' id='word_1_183' title='bbox 381 13 383 50; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 322 57 354 59">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 322 57 354 59">
+     <span class='ocr_line' id='line_1_34' title="bbox 322 57 354 59; baseline 0 1067"><span class='ocrx_word' id='word_1_184' title='bbox 322 57 354 59; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 352 31 354 86">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 352 31 354 86">
+     <span class='ocr_line' id='line_1_35' title="bbox 352 31 354 86; baseline 0 1040"><span class='ocrx_word' id='word_1_185' title='bbox 352 31 354 86; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 322 57 324 138">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 322 57 324 138">
+     <span class='ocr_line' id='line_1_36' title="bbox 322 57 324 138; baseline 0 988"><span class='ocrx_word' id='word_1_186' title='bbox 322 57 324 138; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 322 136 483 138">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 322 136 483 138">
+     <span class='ocr_line' id='line_1_37' title="bbox 322 136 483 138; baseline 0 988"><span class='ocrx_word' id='word_1_187' title='bbox 322 136 483 138; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 236 132 273 150">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 236 132 273 150">
+     <span class='ocr_line' id='line_1_38' title="bbox 236 132 273 150; baseline 0.027 -1"><span class='ocrx_word' id='word_1_188' title='bbox 236 132 273 150; x_wconf 92' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 184 152 286 154">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 184 152 286 154">
+     <span class='ocr_line' id='line_1_39' title="bbox 184 152 286 154; baseline 0 972"><span class='ocrx_word' id='word_1_189' title='bbox 184 152 286 154; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 481 119 483 156">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 481 119 483 156">
+     <span class='ocr_line' id='line_1_40' title="bbox 481 119 483 156; baseline 0 970"><span class='ocrx_word' id='word_1_190' title='bbox 481 119 483 156; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 435 145 471 163">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 435 145 471 163">
+     <span class='ocr_line' id='line_1_41' title="bbox 435 145 471 163; baseline 0 0"><span class='ocrx_word' id='word_1_191' title='bbox 435 145 471 163; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 483 154 589 156">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 483 154 589 156">
+     <span class='ocr_line' id='line_1_42' title="bbox 483 154 589 156; baseline 0 970"><span class='ocrx_word' id='word_1_192' title='bbox 483 154 589 156; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 380 13 383 226">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 380 13 383 226">
+     <span class='ocr_line' id='line_1_43' title="bbox 380 13 383 226; baseline 0 900"><span class='ocrx_word' id='word_1_193' title='bbox 380 13 383 226; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 285 97 286 209">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 285 97 286 209">
+     <span class='ocr_line' id='line_1_44' title="bbox 285 97 286 209; baseline 0 917"><span class='ocrx_word' id='word_1_194' title='bbox 285 97 286 209; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 284 207 382 209">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 284 207 382 209">
+     <span class='ocr_line' id='line_1_45' title="bbox 284 207 382 209; baseline 0 917"><span class='ocrx_word' id='word_1_195' title='bbox 284 207 382 209; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 145 202 169 220">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 145 202 169 220">
+     <span class='ocr_line' id='line_1_46' title="bbox 145 202 169 220; baseline 0 0"><span class='ocrx_word' id='word_1_196' title='bbox 145 202 169 220; x_wconf 82' lang='eng'><em>94</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 93 222 186 224">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 93 222 186 224">
+     <span class='ocr_line' id='line_1_47' title="bbox 93 222 186 224; baseline 0 902"><span class='ocrx_word' id='word_1_197' title='bbox 93 222 186 224; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 184 152 186 292">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 184 152 186 292">
+     <span class='ocr_line' id='line_1_48' title="bbox 184 152 186 292; baseline 0 834"><span class='ocrx_word' id='word_1_198' title='bbox 184 152 186 292; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 184 290 220 292">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 184 290 220 292">
+     <span class='ocr_line' id='line_1_49' title="bbox 184 290 220 292; baseline 0 834"><span class='ocrx_word' id='word_1_199' title='bbox 184 290 220 292; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 218 260 220 324">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 218 260 220 324">
+     <span class='ocr_line' id='line_1_50' title="bbox 218 260 220 324; baseline 0 802"><span class='ocrx_word' id='word_1_200' title='bbox 218 260 220 324; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 218 322 370 324">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 218 322 370 324">
+     <span class='ocr_line' id='line_1_51' title="bbox 218 322 370 324; baseline 0 802"><span class='ocrx_word' id='word_1_201' title='bbox 218 322 370 324; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 368 295 370 350">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 368 295 370 350">
+     <span class='ocr_line' id='line_1_52' title="bbox 368 295 370 350; baseline 0 776"><span class='ocrx_word' id='word_1_202' title='bbox 368 295 370 350; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 368 348 428 350">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 368 348 428 350">
+     <span class='ocr_line' id='line_1_53' title="bbox 368 348 428 350; baseline 0 776"><span class='ocrx_word' id='word_1_203' title='bbox 368 348 428 350; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 425 331 427 368">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 425 331 427 368">
+     <span class='ocr_line' id='line_1_54' title="bbox 425 331 427 368; baseline 0 758"><span class='ocrx_word' id='word_1_204' title='bbox 425 331 427 368; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 93 222 95 421">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 93 222 95 421">
+     <span class='ocr_line' id='line_1_55' title="bbox 93 222 95 421; baseline 0 705"><span class='ocrx_word' id='word_1_205' title='bbox 93 222 95 421; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 93 419 137 421">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 93 419 137 421">
+     <span class='ocr_line' id='line_1_56' title="bbox 93 419 137 421; baseline 0 705"><span class='ocrx_word' id='word_1_206' title='bbox 93 419 137 421; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 135 401 137 438">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 135 401 137 438">
+     <span class='ocr_line' id='line_1_57' title="bbox 135 401 137 438; baseline 0 688"><span class='ocrx_word' id='word_1_207' title='bbox 135 401 137 438; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 89 513 173 515">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 89 513 173 515">
+     <span class='ocr_line' id='line_1_58' title="bbox 89 513 173 515; baseline 0 611"><span class='ocrx_word' id='word_1_208' title='bbox 89 513 173 515; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 51 508 76 526">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 51 508 76 526">
+     <span class='ocr_line' id='line_1_59' title="bbox 51 508 76 526; baseline 0 0"><span class='ocrx_word' id='word_1_209' title='bbox 51 508 76 526; x_wconf 83' lang='eng'>63</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 45 529 91 531">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 45 529 91 531">
+     <span class='ocr_line' id='line_1_60' title="bbox 45 529 91 531; baseline 0 595"><span class='ocrx_word' id='word_1_210' title='bbox 45 529 91 531; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 171 472 173 556">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 171 472 173 556">
+     <span class='ocr_line' id='line_1_61' title="bbox 171 472 173 556; baseline 0 570"><span class='ocrx_word' id='word_1_211' title='bbox 171 472 173 556; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 131 520 156 538">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 131 520 156 538">
+     <span class='ocr_line' id='line_1_62' title="bbox 131 520 156 538; baseline 0 0"><span class='ocrx_word' id='word_1_212' title='bbox 131 520 156 538; x_wconf 90' lang='eng'><em>96</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 171 554 198 556">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 171 554 198 556">
+     <span class='ocr_line' id='line_1_63' title="bbox 171 554 198 556; baseline 0 570"><span class='ocrx_word' id='word_1_213' title='bbox 171 554 198 556; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 233 560 300 562">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 233 560 300 562">
+     <span class='ocr_line' id='line_1_64' title="bbox 233 560 300 562; baseline 0 564"><span class='ocrx_word' id='word_1_214' title='bbox 233 560 300 562; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 298 542 300 579">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 298 542 300 579">
+     <span class='ocr_line' id='line_1_65' title="bbox 298 542 300 579; baseline 0 547"><span class='ocrx_word' id='word_1_215' title='bbox 298 542 300 579; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 196 507 199 602">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 196 507 199 602">
+     <span class='ocr_line' id='line_1_66' title="bbox 196 507 199 602; baseline 0 524"><span class='ocrx_word' id='word_1_216' title='bbox 196 507 199 602; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 196 600 235 602">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 196 600 235 602">
+     <span class='ocr_line' id='line_1_67' title="bbox 196 600 235 602; baseline 0 524"><span class='ocrx_word' id='word_1_217' title='bbox 196 600 235 602; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 233 560 235 642">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 233 560 235 642">
+     <span class='ocr_line' id='line_1_68' title="bbox 233 560 235 642; baseline 0 484"><span class='ocrx_word' id='word_1_218' title='bbox 233 560 235 642; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 305 651 307 686">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 305 651 307 686">
+     <span class='ocr_line' id='line_1_69' title="bbox 305 651 307 686; baseline 0 440"><span class='ocrx_word' id='word_1_219' title='bbox 305 651 307 686; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 89 321 91 739">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 89 321 91 739">
+     <span class='ocr_line' id='line_1_70' title="bbox 89 321 91 739; baseline 0 387"><span class='ocrx_word' id='word_1_220' title='bbox 89 321 91 739; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 89 737 195 739">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 89 737 195 739">
+     <span class='ocr_line' id='line_1_71' title="bbox 89 737 195 739; baseline 0 387"><span class='ocrx_word' id='word_1_221' title='bbox 89 737 195 739; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 193 719 195 756">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 193 719 195 756">
+     <span class='ocr_line' id='line_1_72' title="bbox 193 719 195 756; baseline 0 370"><span class='ocrx_word' id='word_1_222' title='bbox 193 719 195 756; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 45 529 47 822">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 45 529 47 822">
+     <span class='ocr_line' id='line_1_73' title="bbox 45 529 47 822; baseline 0 304"><span class='ocrx_word' id='word_1_223' title='bbox 45 529 47 822; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 5 816 40 818">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 5 816 40 818">
+     <span class='ocr_line' id='line_1_74' title="bbox 5 816 40 818; baseline 0 308"><span class='ocrx_word' id='word_1_224' title='bbox 5 816 40 818; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 47 820 138 822">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 47 820 138 822">
+     <span class='ocr_line' id='line_1_75' title="bbox 47 820 138 822; baseline 0 304"><span class='ocrx_word' id='word_1_225' title='bbox 47 820 138 822; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 139 789 142 879">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 139 789 142 879">
+     <span class='ocr_line' id='line_1_76' title="bbox 139 789 142 879; baseline 0 247"><span class='ocrx_word' id='word_1_226' title='bbox 139 789 142 879; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 140 877 179 879">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 140 877 179 879">
+     <span class='ocr_line' id='line_1_77' title="bbox 140 877 179 879; baseline 0 247"><span class='ocrx_word' id='word_1_227' title='bbox 140 877 179 879; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 177 860 179 897">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 177 860 179 897">
+     <span class='ocr_line' id='line_1_78' title="bbox 177 860 179 897; baseline 0 229"><span class='ocrx_word' id='word_1_228' title='bbox 177 860 179 897; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 5 816 7 1065">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 5 816 7 1065">
+     <span class='ocr_line' id='line_1_79' title="bbox 5 816 7 1065; baseline 0 61"><span class='ocrx_word' id='word_1_229' title='bbox 5 816 7 1065; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 5 1063 40 1065">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 5 1063 40 1065">
+     <span class='ocr_line' id='line_1_80' title="bbox 5 1063 40 1065; baseline 0 61"><span class='ocrx_word' id='word_1_230' title='bbox 5 1063 40 1065; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 38 675 40 1092">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 38 675 40 1092">
+     <span class='ocr_line' id='line_1_81' title="bbox 38 675 40 1092; baseline 0 34"><span class='ocrx_word' id='word_1_231' title='bbox 38 675 40 1092; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 135 1072 687 1074">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 135 1072 687 1074">
+     <span class='ocr_line' id='line_1_82' title="bbox 135 1072 687 1074; baseline 0 52"><span class='ocrx_word' id='word_1_232' title='bbox 135 1072 687 1074; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 38 1090 137 1092">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 38 1090 137 1092">
+     <span class='ocr_line' id='line_1_83' title="bbox 38 1090 137 1092; baseline 0 34"><span class='ocrx_word' id='word_1_233' title='bbox 38 1090 137 1092; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 135 1072 137 1109">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 135 1072 137 1109">
+     <span class='ocr_line' id='line_1_84' title="bbox 135 1072 137 1109; baseline 0 17"><span class='ocrx_word' id='word_1_234' title='bbox 135 1072 137 1109; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000760-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000760-0-001.pbm.png
new file mode 100644
index 00000000..4e8e0b1b
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000760-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000760-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000760-0-001.pbm.png.hocr
new file mode 100644
index 00000000..ee246358
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000760-0-001.pbm.png.hocr
@@ -0,0 +1,545 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000760-0-001.pbm.png"; bbox 0 0 2603 1473; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 8 4 1102 55">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 8 4 1102 55">
+     <span class='ocr_line' id='line_1_1' title="bbox 8 4 207 35; baseline -0.005 -6"><span class='ocrx_word' id='word_1_1' title='bbox 8 4 46 35; x_wconf 86' lang='eng' dir='ltr'>(a)</span> <span class='ocrx_word' id='word_1_2' title='bbox 60 4 114 29; x_wconf 89' lang='eng' dir='ltr'>16S</span> <span class='ocrx_word' id='word_1_3' title='bbox 128 4 207 28; x_wconf 93' lang='eng' dir='ltr'>rRNA</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 583 32 1102 55; baseline 0 -5"><span class='ocrx_word' id='word_1_4' title='bbox 583 32 607 50; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_5' title='bbox 617 32 679 50; x_wconf 74' lang='eng' dir='ltr'><em>avium</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 688 32 755 54; x_wconf 87' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_7' title='bbox 766 32 828 50; x_wconf 81' lang='eng' dir='ltr'><em>avium</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 837 32 888 50; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_9' title='bbox 896 32 971 50; x_wconf 80' lang='eng' dir='ltr'>44155T</span> <span class='ocrx_word' id='word_1_10' title='bbox 980 32 1102 55; x_wconf 87' lang='eng' dir='ltr'>(AJ536037)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 246 38 783 230">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 247 38 783 230">
+     <span class='ocr_line' id='line_1_3' title="bbox 318 38 574 66; baseline 0 1407"><span class='ocrx_word' id='word_1_11' title='bbox 318 38 574 66; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 293 66 574 83; baseline 0 1390"><span class='ocrx_word' id='word_1_12' title='bbox 293 66 574 83; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 293 83 550 128; baseline 0 1345"><span class='ocrx_word' id='word_1_13' title='bbox 293 83 550 128; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 293 128 767 163; baseline 0 1310"><span class='ocrx_word' id='word_1_14' title='bbox 293 128 767 163; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 247 163 783 194; baseline 0 1279"><span class='ocrx_word' id='word_1_15' title='bbox 247 163 783 194; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 247 194 593 230; baseline 0.003 -1"><span class='ocrx_word' id='word_1_16' title='bbox 247 194 593 230; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 537 94 1184 335">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 550 94 945 117">
+     <span class='ocr_line' id='line_1_9' title="bbox 550 94 945 117; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 550 94 573 112; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_18' title='bbox 583 94 685 112; x_wconf 71' lang='eng' dir='ltr'>shimoidei</span> <span class='ocrx_word' id='word_1_19' title='bbox 691 94 755 112; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_20' title='bbox 763 94 838 112; x_wconf 78' lang='eng' dir='ltr'>27962T</span> <span class='ocrx_word' id='word_1_21' title='bbox 848 94 945 117; x_wconf 84' lang='eng' dir='ltr'>(X82459)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 593 129 1183 228">
+     <span class='ocr_line' id='line_1_10' title="bbox 767 129 1183 152; baseline 0 -5"><span class='ocrx_word' id='word_1_22' title='bbox 767 129 790 147; x_wconf 90' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_23' title='bbox 801 129 976 147; x_wconf 81' lang='eng' dir='ltr'>heckeshornense</span> <span class='ocrx_word' id='word_1_24' title='bbox 984 129 1048 147; x_wconf 81' lang='eng' dir='ltr'>S369T</span> <span class='ocrx_word' id='word_1_25' title='bbox 1058 129 1183 152; x_wconf 87' lang='eng' dir='ltr'>(AF174290)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 790 168 1167 191; baseline 0 -5"><span class='ocrx_word' id='word_1_26' title='bbox 790 168 813 186; x_wconf 91' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_27' title='bbox 823 168 895 190; x_wconf 83' lang='eng' dir='ltr'><em>xenopi</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 903 168 953 186; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_29' title='bbox 961 168 1036 186; x_wconf 84' lang='eng' dir='ltr'>43995T</span> <span class='ocrx_word' id='word_1_30' title='bbox 1045 168 1167 191; x_wconf 85' lang='eng' dir='ltr'>(AJ536033)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 593 203 1109 228; baseline 0 -5"><span class='ocrx_word' id='word_1_31' title='bbox 593 203 617 221; x_wconf 88' lang='eng'>54</span> <span class='ocrx_word' id='word_1_32' title='bbox 770 205 793 223; x_wconf 90' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_33' title='bbox 804 205 907 223; x_wconf 80' lang='eng' dir='ltr'>batniense</span> <span class='ocrx_word' id='word_1_34' title='bbox 916 205 979 223; x_wconf 75' lang='eng' dir='ltr'>E347T</span> <span class='ocrx_word' id='word_1_35' title='bbox 987 205 1109 228; x_wconf 84' lang='eng' dir='ltr'>(AJO12756)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 537 240 911 263">
+     <span class='ocr_line' id='line_1_13' title="bbox 537 240 911 263; baseline 0 -5"><span class='ocrx_word' id='word_1_36' title='bbox 537 240 560 258; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_37' title='bbox 570 240 652 258; x_wconf 77' lang='eng' dir='ltr'><em>celatum</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 660 240 724 258; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_39' title='bbox 733 240 807 258; x_wconf 82' lang='eng' dir='ltr'>51131T</span> <span class='ocrx_word' id='word_1_40' title='bbox 817 240 911 263; x_wconf 84' lang='eng' dir='ltr'>(L08169)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 587 279 969 302">
+     <span class='ocr_line' id='line_1_14' title="bbox 587 279 969 302; baseline 0 -5"><span class='ocrx_word' id='word_1_41' title='bbox 587 280 610 297; x_wconf 68' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_42' title='bbox 620 280 682 297; x_wconf 80' lang='eng' dir='ltr'>cookii</span> <span class='ocrx_word' id='word_1_43' title='bbox 688 279 752 297; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_44' title='bbox 760 279 836 297; x_wconf 88' lang='eng' dir='ltr'>49103T</span> <span class='ocrx_word' id='word_1_45' title='bbox 844 279 969 302; x_wconf 83' lang='eng' dir='ltr'>(AF480598)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 605 312 1013 335">
+     <span class='ocr_line' id='line_1_15' title="bbox 605 312 1013 335; baseline 0.002 -5"><span class='ocrx_word' id='word_1_46' title='bbox 605 313 628 330; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_47' title='bbox 638 313 796 331; x_wconf 84' lang='eng' dir='ltr'>branderiATCC</span> <span class='ocrx_word' id='word_1_48' title='bbox 806 312 879 331; x_wconf 67' lang='eng' dir='ltr'>51789T</span> <span class='ocrx_word' id='word_1_49' title='bbox 889 313 1013 335; x_wconf 86' lang='eng' dir='ltr'>(AF480574)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 503 343 939 397">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 503 343 939 397">
+     <span class='ocr_line' id='line_1_16' title="bbox 503 343 787 366; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 503 343 555 361; x_wconf 96' lang='eng' dir='ltr'>KUM</span> <span class='ocrx_word' id='word_1_51' title='bbox 563 343 653 361; x_wconf 76' lang='eng' dir='ltr'>060204T</span> <span class='ocrx_word' id='word_1_52' title='bbox 661 343 787 366; x_wconf 89' lang='eng' dir='ltr'>(AB370111)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 577 374 939 397; baseline 0 -5"><span class='ocrx_word' id='word_1_53' title='bbox 577 375 600 392; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_54' title='bbox 610 375 678 392; x_wconf 83' lang='eng' dir='ltr'>trivia/e</span> <span class='ocrx_word' id='word_1_55' title='bbox 685 374 750 392; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_56' title='bbox 758 374 833 392; x_wconf 76' lang='eng' dir='ltr'>23292T</span> <span class='ocrx_word' id='word_1_57' title='bbox 842 374 939 397; x_wconf 83' lang='eng' dir='ltr'>(X88924)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 469 409 1057 620">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 526 409 919 432">
+     <span class='ocr_line' id='line_1_18' title="bbox 526 409 919 432; baseline 0 -5"><span class='ocrx_word' id='word_1_58' title='bbox 526 410 549 427; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_59' title='bbox 559 410 657 427; x_wconf 85' lang='eng' dir='ltr'><em>hiberniae</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 665 410 729 427; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_61' title='bbox 737 409 812 427; x_wconf 81' lang='eng' dir='ltr'>49874T</span> <span class='ocrx_word' id='word_1_62' title='bbox 822 409 919 432; x_wconf 87' lang='eng' dir='ltr'>(X67096)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 505 449 1057 508">
+     <span class='ocr_line' id='line_1_19' title="bbox 505 449 1057 471; baseline 0.002 -5"><span class='ocrx_word' id='word_1_63' title='bbox 505 452 529 470; x_wconf 81' lang='eng'>99</span> <span class='ocrx_word' id='word_1_64' title='bbox 553 449 576 466; x_wconf 97' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_65' title='bbox 586 449 796 471; x_wconf 84' lang='eng' dir='ltr'>nonchromogenicum</span> <span class='ocrx_word' id='word_1_66' title='bbox 803 449 867 467; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_67' title='bbox 878 449 951 467; x_wconf 79' lang='eng' dir='ltr'>19530T</span> <span class='ocrx_word' id='word_1_68' title='bbox 961 449 1057 471; x_wconf 81' lang='eng' dir='ltr'>(X52928)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 553 485 941 508; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 553 486 576 503; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_70' title='bbox 587 490 686 508; x_wconf 82' lang='eng' dir='ltr'>arupense</span> <span class='ocrx_word' id='word_1_71' title='bbox 693 485 802 503; x_wconf 78' lang='eng' dir='ltr'>AR30097T</span> <span class='ocrx_word' id='word_1_72' title='bbox 811 485 941 508; x_wconf 86' lang='eng' dir='ltr'>(DQ157760)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 476 522 832 545">
+     <span class='ocr_line' id='line_1_21' title="bbox 476 522 832 545; baseline 0 -5"><span class='ocrx_word' id='word_1_73' title='bbox 476 523 500 540; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_74' title='bbox 510 524 571 540; x_wconf 80' lang='eng' dir='ltr'>terrae</span> <span class='ocrx_word' id='word_1_75' title='bbox 579 522 643 540; x_wconf 86' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_76' title='bbox 653 522 726 540; x_wconf 77' lang='eng' dir='ltr'>15755T</span> <span class='ocrx_word' id='word_1_77' title='bbox 735 523 832 545; x_wconf 89' lang='eng' dir='ltr'>(X52925)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 469 560 938 583">
+     <span class='ocr_line' id='line_1_22' title="bbox 469 560 938 583; baseline 0 -5"><span class='ocrx_word' id='word_1_78' title='bbox 469 560 492 578; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_79' title='bbox 502 560 679 578; x_wconf 75' lang='eng' dir='ltr'>kumamotonense</span> <span class='ocrx_word' id='word_1_80' title='bbox 687 560 734 578; x_wconf 87' lang='eng' dir='ltr'>CST</span> <span class='ocrx_word' id='word_1_81' title='bbox 742 560 803 578; x_wconf 80' lang='eng' dir='ltr'>7247T</span> <span class='ocrx_word' id='word_1_82' title='bbox 812 560 938 583; x_wconf 77' lang='eng' dir='ltr'>(A8239925)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 553 596 947 620">
+     <span class='ocr_line' id='line_1_23' title="bbox 553 596 947 620; baseline 0 -5"><span class='ocrx_word' id='word_1_83' title='bbox 553 597 576 615; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_84' title='bbox 587 597 671 615; x_wconf 86' lang='eng' dir='ltr'>doricum</span> <span class='ocrx_word' id='word_1_85' title='bbox 680 597 730 615; x_wconf 92' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_86' title='bbox 739 596 814 615; x_wconf 78' lang='eng' dir='ltr'>44339T</span> <span class='ocrx_word' id='word_1_87' title='bbox 822 597 947 620; x_wconf 86' lang='eng' dir='ltr'>(AF264700)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 633 642 1121 665">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 633 642 1121 665">
+     <span class='ocr_line' id='line_1_24' title="bbox 633 642 1121 665; baseline 0 -5"><span class='ocrx_word' id='word_1_88' title='bbox 633 642 727 660; x_wconf 84' lang='eng' dir='ltr'>Nocardia</span> <span class='ocrx_word' id='word_1_89' title='bbox 736 642 845 660; x_wconf 71' lang='eng' dir='ltr'>asteroides</span> <span class='ocrx_word' id='word_1_90' title='bbox 854 642 904 660; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_91' title='bbox 913 642 988 660; x_wconf 65' lang='eng' dir='ltr'>43757r</span> <span class='ocrx_word' id='word_1_92' title='bbox 997 642 1121 665; x_wconf 83' lang='eng' dir='ltr'>(AF430019)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 1062 680 1236 716">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 1114 680 1156 697">
+     <span class='ocr_line' id='line_1_25' title="bbox 1114 680 1156 697; baseline 0 0"><span class='ocrx_word' id='word_1_93' title='bbox 1114 680 1156 697; x_wconf 88' lang='eng'>0.01</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 0 194 770 659">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 0 194 770 659">
+     <span class='ocr_line' id='line_1_26' title="bbox 617 194 770 229; baseline 0 1244"><span class='ocrx_word' id='word_1_94' title='bbox 617 194 770 229; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 170 230 537 274; baseline 0 1199"><span class='ocrx_word' id='word_1_95' title='bbox 170 230 537 274; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 170 274 587 313; baseline 0 1160"><span class='ocrx_word' id='word_1_96' title='bbox 170 274 587 313; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 170 313 600 346; baseline 0 0"><span class='ocrx_word' id='word_1_97' title='bbox 170 313 600 346; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 171 346 503 377; baseline 0 1096"><span class='ocrx_word' id='word_1_98' title='bbox 171 346 503 377; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 171 377 570 408; baseline 0 0"><span class='ocrx_word' id='word_1_99' title='bbox 171 377 570 408; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 171 408 519 443; baseline 0 0"><span class='ocrx_word' id='word_1_100' title='bbox 171 408 519 443; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 0 443 505 482; baseline 0 991"><span class='ocrx_word' id='word_1_101' title='bbox 0 443 505 482; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 0 482 546 519; baseline 0 0"><span class='ocrx_word' id='word_1_102' title='bbox 0 482 546 519; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 0 519 465 556; baseline 0 917"><span class='ocrx_word' id='word_1_103' title='bbox 0 519 465 556; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 0 556 469 594; baseline 0 879"><span class='ocrx_word' id='word_1_104' title='bbox 0 556 469 594; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 0 594 553 632; baseline 0 841"><span class='ocrx_word' id='word_1_105' title='bbox 0 594 553 632; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 0 632 627 659; baseline 0 814"><span class='ocrx_word' id='word_1_106' title='bbox 0 632 627 659; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 8 735 125 766">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 8 735 125 766">
+     <span class='ocr_line' id='line_1_39' title="bbox 8 735 125 766; baseline -0.009 -6"><span class='ocrx_word' id='word_1_107' title='bbox 8 735 44 766; x_wconf 87' lang='eng' dir='ltr'>(c)</span> <span class='ocrx_word' id='word_1_108' title='bbox 56 735 125 766; x_wconf 90' lang='eng' dir='ltr'>rpoB</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 235 865 1247 1035">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 235 865 1063 891">
+     <span class='ocr_line' id='line_1_40' title="bbox 235 865 1063 891; baseline 0 -5"><span class='ocrx_word' id='word_1_109' title='bbox 235 865 258 882; x_wconf 78' lang='eng'>17</span> <span class='ocrx_word' id='word_1_110' title='bbox 683 868 706 886; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_111' title='bbox 717 868 785 886; x_wconf 72' lang='eng' dir='ltr'>trivia/e</span> <span class='ocrx_word' id='word_1_112' title='bbox 794 868 843 886; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_113' title='bbox 852 868 928 886; x_wconf 78' lang='eng' dir='ltr'>44153T</span> <span class='ocrx_word' id='word_1_114' title='bbox 937 868 1063 891; x_wconf 85' lang='eng' dir='ltr'>(AY544971)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 782 896 1194 920">
+     <span class='ocr_line' id='line_1_41' title="bbox 782 896 1194 920; baseline 0 -5"><span class='ocrx_word' id='word_1_115' title='bbox 782 897 805 915; x_wconf 79' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_116' title='bbox 815 897 917 915; x_wconf 82' lang='eng' dir='ltr'>shimoidei</span> <span class='ocrx_word' id='word_1_117' title='bbox 925 897 975 915; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_118' title='bbox 983 896 1059 915; x_wconf 76' lang='eng' dir='ltr'>44152T</span> <span class='ocrx_word' id='word_1_119' title='bbox 1068 897 1194 920; x_wconf 86' lang='eng' dir='ltr'>(AY544962)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 811 927 1192 950">
+     <span class='ocr_line' id='line_1_42' title="bbox 811 927 1192 950; baseline 0 -5"><span class='ocrx_word' id='word_1_120' title='bbox 811 928 833 945; x_wconf 87' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_121' title='bbox 843 928 915 950; x_wconf 83' lang='eng' dir='ltr'><em>xenopi</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 922 927 960 945; x_wconf 87' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_123' title='bbox 971 927 1057 945; x_wconf 82' lang='eng' dir='ltr'>104035T</span> <span class='ocrx_word' id='word_1_124' title='bbox 1066 927 1192 950; x_wconf 89' lang='eng' dir='ltr'>(AY544979)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 759 955 1247 1007">
+     <span class='ocr_line' id='line_1_43' title="bbox 759 955 1247 978; baseline 0 -5"><span class='ocrx_word' id='word_1_125' title='bbox 759 955 782 973; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_126' title='bbox 792 955 968 973; x_wconf 80' lang='eng' dir='ltr'>heckeshornense</span> <span class='ocrx_word' id='word_1_127' title='bbox 977 955 1027 973; x_wconf 84' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_128' title='bbox 1036 955 1111 973; x_wconf 77' lang='eng' dir='ltr'>44428T</span> <span class='ocrx_word' id='word_1_129' title='bbox 1120 955 1247 978; x_wconf 82' lang='eng' dir='ltr'>(AY544922)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 780 984 1194 1007; baseline 0 -5"><span class='ocrx_word' id='word_1_130' title='bbox 780 985 802 1002; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_131' title='bbox 813 985 916 1002; x_wconf 81' lang='eng' dir='ltr'>botniense</span> <span class='ocrx_word' id='word_1_132' title='bbox 925 985 975 1002; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_133' title='bbox 983 984 1059 1002; x_wconf 75' lang='eng' dir='ltr'>44537T</span> <span class='ocrx_word' id='word_1_134' title='bbox 1067 985 1194 1007; x_wconf 87' lang='eng' dir='ltr'>(AY544891)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 478 1012 1001 1035">
+     <span class='ocr_line' id='line_1_45' title="bbox 478 1012 1001 1035; baseline 0 -5"><span class='ocrx_word' id='word_1_135' title='bbox 478 1013 501 1030; x_wconf 91' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_136' title='bbox 511 1013 573 1031; x_wconf 84' lang='eng' dir='ltr'><em>avium</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 582 1013 650 1035; x_wconf 79' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_138' title='bbox 660 1013 723 1031; x_wconf 80' lang='eng' dir='ltr'><em>avium</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 732 1013 769 1031; x_wconf 85' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_140' title='bbox 780 1012 866 1031; x_wconf 75' lang='eng' dir='ltr'>104244T</span> <span class='ocrx_word' id='word_1_141' title='bbox 875 1013 1001 1035; x_wconf 88' lang='eng' dir='ltr'>(AY544887)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 647 1044 1245 1167">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 700 1044 1245 1100">
+     <span class='ocr_line' id='line_1_46' title="bbox 850 1044 1245 1067; baseline 0 -5"><span class='ocrx_word' id='word_1_142' title='bbox 850 1045 874 1062; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_143' title='bbox 884 1045 966 1062; x_wconf 78' lang='eng' dir='ltr'>celatum</span> <span class='ocrx_word' id='word_1_144' title='bbox 974 1045 1012 1062; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_145' title='bbox 1023 1044 1109 1062; x_wconf 79' lang='eng' dir='ltr'>106109T</span> <span class='ocrx_word' id='word_1_146' title='bbox 1118 1045 1245 1067; x_wconf 84' lang='eng' dir='ltr'>(AY544897)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 700 1077 1098 1100; baseline 0 -5"><span class='ocrx_word' id='word_1_147' title='bbox 700 1077 723 1095; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_148' title='bbox 733 1077 821 1095; x_wconf 82' lang='eng' dir='ltr'>branderi</span> <span class='ocrx_word' id='word_1_149' title='bbox 828 1077 866 1095; x_wconf 83' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_150' title='bbox 877 1077 963 1095; x_wconf 86' lang='eng' dir='ltr'>104592T</span> <span class='ocrx_word' id='word_1_151' title='bbox 972 1077 1098 1100; x_wconf 86' lang='eng' dir='ltr'>(AY544895)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 839 1107 1124 1130">
+     <span class='ocr_line' id='line_1_48' title="bbox 839 1107 1124 1130; baseline 0 -5"><span class='ocrx_word' id='word_1_152' title='bbox 839 1108 891 1125; x_wconf 92' lang='eng' dir='ltr'>KUM</span> <span class='ocrx_word' id='word_1_153' title='bbox 900 1107 989 1125; x_wconf 77' lang='eng' dir='ltr'>060204T</span> <span class='ocrx_word' id='word_1_154' title='bbox 998 1107 1124 1130; x_wconf 87' lang='eng' dir='ltr'>(AB370178)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 647 1144 1040 1167">
+     <span class='ocr_line' id='line_1_49' title="bbox 647 1144 1040 1167; baseline 0 -5"><span class='ocrx_word' id='word_1_155' title='bbox 647 1145 670 1162; x_wconf 98' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_156' title='bbox 680 1145 762 1162; x_wconf 81' lang='eng' dir='ltr'><em>kubicae</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 770 1145 808 1162; x_wconf 87' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_158' title='bbox 818 1144 905 1162; x_wconf 72' lang='eng' dir='ltr'>106428T</span> <span class='ocrx_word' id='word_1_159' title='bbox 914 1145 1040 1167; x_wconf 84' lang='eng' dir='ltr'>(AY544937)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 448 1177 1235 1229">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 448 1177 1235 1229">
+     <span class='ocr_line' id='line_1_50' title="bbox 839 1177 1235 1200; baseline 0 -5"><span class='ocrx_word' id='word_1_160' title='bbox 839 1178 862 1195; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_161' title='bbox 873 1178 956 1195; x_wconf 81' lang='eng' dir='ltr'><em>doricum</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 966 1177 1016 1195; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_163' title='bbox 1024 1177 1100 1195; x_wconf 78' lang='eng' dir='ltr'>44339T</span> <span class='ocrx_word' id='word_1_164' title='bbox 1108 1178 1235 1200; x_wconf 86' lang='eng' dir='ltr'>(AY544906)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 448 1206 877 1229; baseline 0 -5"><span class='ocrx_word' id='word_1_165' title='bbox 448 1207 471 1224; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_166' title='bbox 481 1207 598 1229; x_wconf 77' lang='eng' dir='ltr'>interjectum</span> <span class='ocrx_word' id='word_1_167' title='bbox 608 1207 658 1225; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_168' title='bbox 666 1206 742 1225; x_wconf 66' lang='eng' dir='ltr'>44064T</span> <span class='ocrx_word' id='word_1_169' title='bbox 751 1207 877 1229; x_wconf 88' lang='eng' dir='ltr'>(AY544928)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 451 1242 1101 1333">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 451 1242 1101 1333">
+     <span class='ocr_line' id='line_1_52' title="bbox 451 1242 823 1265; baseline 0 -5"><span class='ocrx_word' id='word_1_170' title='bbox 451 1243 474 1260; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_171' title='bbox 484 1243 546 1260; x_wconf 83' lang='eng' dir='ltr'>cookii</span> <span class='ocrx_word' id='word_1_172' title='bbox 553 1242 592 1260; x_wconf 89' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_173' title='bbox 602 1242 689 1260; x_wconf 76' lang='eng' dir='ltr'>105396T</span> <span class='ocrx_word' id='word_1_174' title='bbox 697 1242 823 1265; x_wconf 84' lang='eng' dir='ltr'>(AY544904)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 527 1275 966 1298; baseline 0 -5"><span class='ocrx_word' id='word_1_175' title='bbox 527 1276 549 1293; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_176' title='bbox 560 1276 687 1298; x_wconf 82' lang='eng' dir='ltr'>conspicuum</span> <span class='ocrx_word' id='word_1_177' title='bbox 695 1275 734 1293; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_178' title='bbox 744 1275 830 1293; x_wconf 82' lang='eng' dir='ltr'>105165T</span> <span class='ocrx_word' id='word_1_179' title='bbox 839 1275 966 1298; x_wconf 79' lang='eng' dir='ltr'>(AY544903)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 626 1310 1101 1333; baseline 0 -5"><span class='ocrx_word' id='word_1_180' title='bbox 626 1311 770 1328; x_wconf 78' lang='eng' dir='ltr'>Rhodococcus</span> <span class='ocrx_word' id='word_1_181' title='bbox 778 1311 823 1333; x_wconf 83' lang='eng' dir='ltr'><em>equi</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 829 1310 893 1328; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_183' title='bbox 904 1311 967 1328; x_wconf 86' lang='eng'>10146</span> <span class='ocrx_word' id='word_1_184' title='bbox 976 1310 1101 1333; x_wconf 88' lang='eng' dir='ltr'>(AF057494)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 0 874 848 1327">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 0 874 848 1327">
+     <span class='ocr_line' id='line_1_55' title="bbox 114 874 683 902; baseline 0 571"><span class='ocrx_word' id='word_1_185' title='bbox 114 874 683 902; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 114 902 808 944; baseline 0 0"><span class='ocrx_word' id='word_1_186' title='bbox 114 902 808 944; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 93 944 759 961; baseline 0 512"><span class='ocrx_word' id='word_1_187' title='bbox 93 944 759 961; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 93 961 777 1001; baseline 0 0"><span class='ocrx_word' id='word_1_188' title='bbox 93 961 777 1001; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 96 1001 478 1018; baseline 0 455"><span class='ocrx_word' id='word_1_189' title='bbox 96 1001 478 1018; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 96 1018 478 1046; baseline 0 427"><span class='ocrx_word' id='word_1_190' title='bbox 96 1018 478 1046; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 2 1046 848 1066; baseline 0 407"><span class='ocrx_word' id='word_1_191' title='bbox 2 1046 848 1066; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 2 1066 700 1111; baseline 0 362"><span class='ocrx_word' id='word_1_192' title='bbox 2 1066 700 1111; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 1 1111 837 1133; baseline 0 340"><span class='ocrx_word' id='word_1_193' title='bbox 1 1111 837 1133; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 1 1133 647 1178; baseline 0 295"><span class='ocrx_word' id='word_1_194' title='bbox 1 1133 647 1178; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_65' title="bbox 1 1178 837 1195; baseline 0 278"><span class='ocrx_word' id='word_1_195' title='bbox 1 1178 837 1195; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_66' title="bbox 0 1195 448 1240; baseline 0 233"><span class='ocrx_word' id='word_1_196' title='bbox 0 1195 448 1240; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 0 1240 451 1276; baseline 0 197"><span class='ocrx_word' id='word_1_197' title='bbox 0 1240 451 1276; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_68' title="bbox 0 1276 527 1309; baseline 0 164"><span class='ocrx_word' id='word_1_198' title='bbox 0 1276 527 1309; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_69' title="bbox 0 1309 617 1327; baseline 0 146"><span class='ocrx_word' id='word_1_199' title='bbox 0 1309 617 1327; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 1104 1432 1145 1449">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 1104 1432 1145 1449">
+     <span class='ocr_line' id='line_1_70' title="bbox 1104 1432 1145 1449; baseline 0 0"><span class='ocrx_word' id='word_1_200' title='bbox 1104 1432 1145 1449; x_wconf 90' lang='eng'>001</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 1355 4 2367 73">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 1355 4 2367 73">
+     <span class='ocr_line' id='line_1_71' title="bbox 1355 4 1495 35; baseline 0 -6"><span class='ocrx_word' id='word_1_201' title='bbox 1355 4 1392 35; x_wconf 93' lang='eng' dir='ltr'>(b)</span> <span class='ocrx_word' id='word_1_202' title='bbox 1404 4 1495 35; x_wconf 89' lang='eng' dir='ltr'>hsp65</span> 
+     </span>
+     <span class='ocr_line' id='line_1_72' title="bbox 1988 50 2367 73; baseline 0 -5"><span class='ocrx_word' id='word_1_203' title='bbox 1988 50 2011 68; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_204' title='bbox 2021 50 2090 68; x_wconf 71' lang='eng' dir='ltr'>trivia/e</span> <span class='ocrx_word' id='word_1_205' title='bbox 2098 50 2148 68; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_206' title='bbox 2157 50 2232 68; x_wconf 68' lang='eng' dir='ltr'>44153T</span> <span class='ocrx_word' id='word_1_207' title='bbox 2242 50 2367 73; x_wconf 83' lang='eng' dir='ltr'>(AF547883)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 1883 94 2469 156">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 1883 94 2468 156">
+     <span class='ocr_line' id='line_1_73' title="bbox 1883 94 2254 117; baseline 0 -5"><span class='ocrx_word' id='word_1_208' title='bbox 1883 95 1906 112; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_209' title='bbox 1916 95 1978 112; x_wconf 79' lang='eng' dir='ltr'><em>cookii</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 1986 95 2024 112; x_wconf 92' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_211' title='bbox 2035 94 2121 112; x_wconf 69' lang='eng' dir='ltr'>105396T</span> <span class='ocrx_word' id='word_1_212' title='bbox 2130 95 2254 117; x_wconf 88' lang='eng' dir='ltr'>(AF547824)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_74' title="bbox 2042 133 2468 156; baseline 0 -5"><span class='ocrx_word' id='word_1_213' title='bbox 2042 134 2065 151; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_214' title='bbox 2075 133 2202 151; x_wconf 77' lang='eng' dir='ltr'>tuberculosis</span> <span class='ocrx_word' id='word_1_215' title='bbox 2210 133 2248 151; x_wconf 91' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_216' title='bbox 2258 133 2335 151; x_wconf 86' lang='eng'>105795</span> <span class='ocrx_word' id='word_1_217' title='bbox 2344 133 2468 156; x_wconf 89' lang='eng' dir='ltr'>(AF547885)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 1857 177 2252 231">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 1857 177 2252 231">
+     <span class='ocr_line' id='line_1_75' title="bbox 1873 177 2239 200; baseline 0 -5"><span class='ocrx_word' id='word_1_218' title='bbox 1873 177 1896 195; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_219' title='bbox 1906 177 1961 195; x_wconf 84' lang='eng' dir='ltr'><em>lacus</em></span> <span class='ocrx_word' id='word_1_220' title='bbox 1970 177 2020 195; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_221' title='bbox 2029 177 2104 195; x_wconf 78' lang='eng' dir='ltr'>44577T</span> <span class='ocrx_word' id='word_1_222' title='bbox 2113 177 2239 200; x_wconf 85' lang='eng' dir='ltr'>(AY438090)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_76' title="bbox 1857 208 2252 231; baseline 0 -5"><span class='ocrx_word' id='word_1_223' title='bbox 1857 209 1880 226; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_224' title='bbox 1890 209 1977 226; x_wconf 80' lang='eng' dir='ltr'>kansasii</span> <span class='ocrx_word' id='word_1_225' title='bbox 1984 209 2022 226; x_wconf 87' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_226' title='bbox 2033 208 2119 226; x_wconf 73' lang='eng' dir='ltr'>104589T</span> <span class='ocrx_word' id='word_1_227' title='bbox 2128 209 2252 231; x_wconf 87' lang='eng' dir='ltr'>(AF547849)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 1841 238 2545 311">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 1841 238 2545 311">
+     <span class='ocr_line' id='line_1_77' title="bbox 1841 238 2209 261; baseline 0.003 -6"><span class='ocrx_word' id='word_1_228' title='bbox 1841 238 1864 255; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_229' title='bbox 1874 238 1934 260; x_wconf 71' lang='eng' dir='ltr'>gastri</span> <span class='ocrx_word' id='word_1_230' title='bbox 1941 238 1979 256; x_wconf 89' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_231' title='bbox 1989 238 2076 256; x_wconf 79' lang='eng' dir='ltr'>104530T</span> <span class='ocrx_word' id='word_1_232' title='bbox 2085 238 2209 261; x_wconf 81' lang='eng' dir='ltr'>(AF547836)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_78' title="bbox 1949 263 2360 285; baseline 0 -5"><span class='ocrx_word' id='word_1_233' title='bbox 1949 263 1972 280; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_234' title='bbox 1982 263 2084 281; x_wconf 84' lang='eng' dir='ltr'><em>shimoidei</em></span> <span class='ocrx_word' id='word_1_235' title='bbox 2092 263 2142 281; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_236' title='bbox 2150 263 2226 281; x_wconf 81' lang='eng' dir='ltr'>44152T</span> <span class='ocrx_word' id='word_1_237' title='bbox 2235 263 2360 285; x_wconf 84' lang='eng' dir='ltr'>(AF547874)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_79' title="bbox 2133 288 2545 311; baseline 0 -4"><span class='ocrx_word' id='word_1_238' title='bbox 2133 289 2155 307; x_wconf 83' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_239' title='bbox 2166 289 2269 307; x_wconf 76' lang='eng' dir='ltr'>botn/‘ense</span> <span class='ocrx_word' id='word_1_240' title='bbox 2277 289 2328 307; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_241' title='bbox 2336 288 2412 307; x_wconf 67' lang='eng' dir='ltr'>44537T</span> <span class='ocrx_word' id='word_1_242' title='bbox 2420 289 2545 311; x_wconf 85' lang='eng' dir='ltr'>(AF547812)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 1811 318 2234 378">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 1811 318 2234 378">
+     <span class='ocr_line' id='line_1_80' title="bbox 1841 318 2234 341; baseline -0.003 -4"><span class='ocrx_word' id='word_1_243' title='bbox 1841 319 1864 336; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_244' title='bbox 1875 319 1957 337; x_wconf 80' lang='eng' dir='ltr'>celatum</span> <span class='ocrx_word' id='word_1_245' title='bbox 1965 319 2003 337; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_246' title='bbox 2013 318 2100 337; x_wconf 73' lang='eng' dir='ltr'>105109T</span> <span class='ocrx_word' id='word_1_247' title='bbox 2109 319 2234 341; x_wconf 83' lang='eng' dir='ltr'>(AF547817)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_81' title="bbox 1811 355 2208 378; baseline 0 -5"><span class='ocrx_word' id='word_1_248' title='bbox 1811 356 1834 373; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_249' title='bbox 1844 356 1933 373; x_wconf 85' lang='eng' dir='ltr'><em>branderi</em></span> <span class='ocrx_word' id='word_1_250' title='bbox 1940 356 1978 373; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_251' title='bbox 1988 355 2075 373; x_wconf 79' lang='eng' dir='ltr'>104592T</span> <span class='ocrx_word' id='word_1_252' title='bbox 2084 356 2208 378; x_wconf 85' lang='eng' dir='ltr'>(AF547815)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 1776 389 2147 440">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 1776 389 2147 440">
+     <span class='ocr_line' id='line_1_82' title="bbox 1855 389 2125 412; baseline 0 -5"><span class='ocrx_word' id='word_1_253' title='bbox 1855 390 1907 407; x_wconf 91' lang='eng' dir='ltr'>KUM</span> <span class='ocrx_word' id='word_1_254' title='bbox 1915 389 2004 407; x_wconf 68' lang='eng'>060204&#39;</span> <span class='ocrx_word' id='word_1_255' title='bbox 2010 391 2125 412; x_wconf 73' lang='eng' dir='ltr'>(ABS7D171)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_83' title="bbox 1776 417 2147 440; baseline 0 -5"><span class='ocrx_word' id='word_1_256' title='bbox 1776 418 1799 435; x_wconf 89' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_257' title='bbox 1810 419 1871 436; x_wconf 82' lang='eng' dir='ltr'>terrae</span> <span class='ocrx_word' id='word_1_258' title='bbox 1879 418 1917 436; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_259' title='bbox 1928 417 2014 436; x_wconf 76' lang='eng' dir='ltr'>104321T</span> <span class='ocrx_word' id='word_1_260' title='bbox 2022 418 2147 440; x_wconf 87' lang='eng' dir='ltr'>(AF547879)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 1758 451 2312 593">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 1758 451 2226 474">
+     <span class='ocr_line' id='line_1_84' title="bbox 1758 451 2226 474; baseline 0 -5"><span class='ocrx_word' id='word_1_261' title='bbox 1758 452 1781 469; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_262' title='bbox 1791 452 1967 469; x_wconf 80' lang='eng' dir='ltr'>kumamotonense</span> <span class='ocrx_word' id='word_1_263' title='bbox 1975 452 2022 469; x_wconf 84' lang='eng' dir='ltr'>CST</span> <span class='ocrx_word' id='word_1_264' title='bbox 2030 451 2091 469; x_wconf 71' lang='eng' dir='ltr'>7247T</span> <span class='ocrx_word' id='word_1_265' title='bbox 2100 452 2226 474; x_wconf 79' lang='eng' dir='ltr'>(A8239920)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 1800 479 2194 502">
+     <span class='ocr_line' id='line_1_85' title="bbox 1800 479 2194 502; baseline 0 -5"><span class='ocrx_word' id='word_1_266' title='bbox 1800 480 1823 497; x_wconf 66' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_267' title='bbox 1833 480 1917 497; x_wconf 78' lang='eng' dir='ltr'><em>doricum</em></span> <span class='ocrx_word' id='word_1_268' title='bbox 1927 479 1977 497; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_269' title='bbox 1985 479 2060 497; x_wconf 64' lang='eng' dir='ltr'>44339T</span> <span class='ocrx_word' id='word_1_270' title='bbox 2069 479 2194 502; x_wconf 81' lang='eng' dir='ltr'>(AF547826)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 1768 508 2312 564">
+     <span class='ocr_line' id='line_1_86' title="bbox 1792 508 2312 531; baseline 0 -5"><span class='ocrx_word' id='word_1_271' title='bbox 1792 508 1815 526; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_272' title='bbox 1825 508 2035 531; x_wconf 79' lang='eng' dir='ltr'>nonchromogen/‘cum</span> <span class='ocrx_word' id='word_1_273' title='bbox 2044 508 2094 526; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_274' title='bbox 2103 508 2178 526; x_wconf 73' lang='eng' dir='ltr'>44164T</span> <span class='ocrx_word' id='word_1_275' title='bbox 2187 508 2312 531; x_wconf 85' lang='eng' dir='ltr'>(AF547861)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_87' title="bbox 1768 541 2177 564; baseline 0 -5"><span class='ocrx_word' id='word_1_276' title='bbox 1768 541 1790 559; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_277' title='bbox 1801 541 1898 559; x_wconf 82' lang='eng' dir='ltr'>hiberniae</span> <span class='ocrx_word' id='word_1_278' title='bbox 1907 541 1957 559; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_279' title='bbox 1966 541 2041 559; x_wconf 80' lang='eng' dir='ltr'>44241T</span> <span class='ocrx_word' id='word_1_280' title='bbox 2051 541 2177 564; x_wconf 85' lang='eng' dir='ltr'>(AY438083)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 1878 570 2301 593">
+     <span class='ocr_line' id='line_1_88' title="bbox 1878 570 2301 593; baseline 0 -5"><span class='ocrx_word' id='word_1_281' title='bbox 1878 571 1901 588; x_wconf 67' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_282' title='bbox 1911 575 2010 593; x_wconf 83' lang='eng' dir='ltr'>arupense</span> <span class='ocrx_word' id='word_1_283' title='bbox 2019 570 2088 588; x_wconf 85' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_284' title='bbox 2097 571 2161 588; x_wconf 87' lang='eng'>39146</span> <span class='ocrx_word' id='word_1_285' title='bbox 2171 570 2301 593; x_wconf 88' lang='eng' dir='ltr'>(DQ168662)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 1910 603 2412 626">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 1910 603 2412 626">
+     <span class='ocr_line' id='line_1_89' title="bbox 1910 603 2412 626; baseline 0 -5"><span class='ocrx_word' id='word_1_286' title='bbox 1910 603 2004 621; x_wconf 75' lang='eng' dir='ltr'>Nocardia</span> <span class='ocrx_word' id='word_1_287' title='bbox 2013 603 2123 621; x_wconf 75' lang='eng' dir='ltr'>asteroides</span> <span class='ocrx_word' id='word_1_288' title='bbox 2130 603 2194 621; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_289' title='bbox 2205 603 2277 621; x_wconf 75' lang='eng' dir='ltr'>19247T</span> <span class='ocrx_word' id='word_1_290' title='bbox 2286 603 2412 626; x_wconf 76' lang='eng' dir='ltr'>(AY756513)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 1470 54 2130 411">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 1470 54 2130 411">
+     <span class='ocr_line' id='line_1_90' title="bbox 1527 54 1979 84; baseline 0.002 -1"><span class='ocrx_word' id='word_1_291' title='bbox 1527 54 1979 84; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_91' title="bbox 1527 84 1883 128; baseline 0 1345"><span class='ocrx_word' id='word_1_292' title='bbox 1527 84 1883 128; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_92' title="bbox 1518 128 2039 167; baseline 0.002 -1"><span class='ocrx_word' id='word_1_293' title='bbox 1518 128 2039 167; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_93' title="bbox 1518 167 1873 211; baseline 0 0"><span class='ocrx_word' id='word_1_294' title='bbox 1518 167 1873 211; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_94' title="bbox 1518 211 1852 227; baseline 0 1246"><span class='ocrx_word' id='word_1_295' title='bbox 1518 211 1852 227; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_95' title="bbox 1518 227 1841 242; baseline 0 1231"><span class='ocrx_word' id='word_1_296' title='bbox 1518 227 1841 242; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_96' title="bbox 1518 242 1841 272; baseline 0 1201"><span class='ocrx_word' id='word_1_297' title='bbox 1518 242 1841 272; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_97' title="bbox 1517 272 2130 307; baseline 0 -11"><span class='ocrx_word' id='word_1_298' title='bbox 1517 272 2130 307; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_98' title="bbox 1517 307 1841 352; baseline 0 0"><span class='ocrx_word' id='word_1_299' title='bbox 1517 307 1841 352; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_99' title="bbox 1491 352 1809 378; baseline 0 1095"><span class='ocrx_word' id='word_1_300' title='bbox 1491 352 1809 378; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_100' title="bbox 1470 378 1809 411; baseline 0 -22"><span class='ocrx_word' id='word_1_301' title='bbox 1470 378 1751 411; x_wconf 95' lang='eng' dir='ltr'>  </span> <span class='ocrx_word' id='word_1_302' title='bbox 1775 378 1809 389; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 1505 161 1529 179">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 1505 161 1529 179">
+     <span class='ocr_line' id='line_1_101' title="bbox 1505 161 1529 179; baseline 0 0"><span class='ocrx_word' id='word_1_303' title='bbox 1505 161 1529 179; x_wconf 85' lang='eng'>26</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 1751 386 1775 403">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 1751 386 1775 403">
+     <span class='ocr_line' id='line_1_102' title="bbox 1751 386 1775 403; baseline 0 0"><span class='ocrx_word' id='word_1_304' title='bbox 1751 386 1775 403; x_wconf 91' lang='eng'>50</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 1446 389 1906 619">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 1446 389 1906 619">
+     <span class='ocr_line' id='line_1_103' title="bbox 1778 389 1848 406; baseline 0 1067"><span class='ocrx_word' id='word_1_305' title='bbox 1778 389 1848 406; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_104' title="bbox 1470 411 1774 423; baseline 0 1050"><span class='ocrx_word' id='word_1_306' title='bbox 1470 411 1774 423; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_105' title="bbox 1470 423 1774 440; baseline 0 1033"><span class='ocrx_word' id='word_1_307' title='bbox 1470 423 1774 440; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_106' title="bbox 1446 440 1758 485; baseline 0 0"><span class='ocrx_word' id='word_1_308' title='bbox 1446 440 1758 485; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_107' title="bbox 1446 485 1797 497; baseline 0 976"><span class='ocrx_word' id='word_1_309' title='bbox 1446 485 1797 497; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_108' title="bbox 1447 497 1792 513; baseline 0 960"><span class='ocrx_word' id='word_1_310' title='bbox 1447 497 1792 513; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_109' title="bbox 1447 513 1790 530; baseline 0 943"><span class='ocrx_word' id='word_1_311' title='bbox 1447 513 1790 530; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_110' title="bbox 1447 530 1768 575; baseline 0 0"><span class='ocrx_word' id='word_1_312' title='bbox 1447 530 1768 575; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_111' title="bbox 1447 575 1878 604; baseline 0 869"><span class='ocrx_word' id='word_1_313' title='bbox 1447 575 1878 604; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_112' title="bbox 1447 604 1906 619; baseline 0 854"><span class='ocrx_word' id='word_1_314' title='bbox 1447 604 1906 619; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 1355 674 2600 1204">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 1355 674 2478 837">
+     <span class='ocr_line' id='line_1_113' title="bbox 2437 674 2478 692; baseline 0 0"><span class='ocrx_word' id='word_1_315' title='bbox 2437 674 2478 692; x_wconf 62' lang='eng'>0,01</span> 
+     </span>
+     <span class='ocr_line' id='line_1_114' title="bbox 1355 735 2438 772; baseline 0.001 -6"><span class='ocrx_word' id='word_1_316' title='bbox 1355 735 1392 766; x_wconf 81' lang='eng' dir='ltr'>(d)</span> <span class='ocrx_word' id='word_1_317' title='bbox 1404 735 1478 760; x_wconf 77' lang='eng' dir='ltr'><em>SOdA</em></span> <span class='ocrx_word' id='word_1_318' title='bbox 1685 750 1709 768; x_wconf 85' lang='eng'>39</span> <span class='ocrx_word' id='word_1_319' title='bbox 2066 750 2089 767; x_wconf 99' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_320' title='bbox 2100 750 2161 767; x_wconf 77' lang='eng' dir='ltr'><em>cookii</em></span> <span class='ocrx_word' id='word_1_321' title='bbox 2169 750 2206 767; x_wconf 92' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_322' title='bbox 2217 749 2303 767; x_wconf 76' lang='eng' dir='ltr'>105396T</span> <span class='ocrx_word' id='word_1_323' title='bbox 2312 750 2438 772; x_wconf 87' lang='eng' dir='ltr'>(AY544815)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_115' title="bbox 1961 781 2360 804; baseline 0 -5"><span class='ocrx_word' id='word_1_324' title='bbox 1961 782 1984 802; x_wconf 91' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_325' title='bbox 1994 782 2083 799; x_wconf 85' lang='eng' dir='ltr'>branderi</span> <span class='ocrx_word' id='word_1_326' title='bbox 2090 782 2128 799; x_wconf 89' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_327' title='bbox 2138 781 2225 799; x_wconf 55' lang='eng' dir='ltr'>104592‘r</span> <span class='ocrx_word' id='word_1_328' title='bbox 2234 782 2360 804; x_wconf 85' lang='eng' dir='ltr'>(AY544810)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_116' title="bbox 1961 809 2448 837; baseline 0.002 -6"><span class='ocrx_word' id='word_1_329' title='bbox 1961 809 1984 832; x_wconf 78' lang='eng'>10</span> <span class='ocrx_word' id='word_1_330' title='bbox 2066 814 2089 831; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_331' title='bbox 2099 814 2171 836; x_wconf 82' lang='eng' dir='ltr'>xenopi</span> <span class='ocrx_word' id='word_1_332' title='bbox 2178 814 2216 832; x_wconf 88' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_333' title='bbox 2226 814 2313 832; x_wconf 78' lang='eng' dir='ltr'>104035T</span> <span class='ocrx_word' id='word_1_334' title='bbox 2322 814 2448 837; x_wconf 86' lang='eng' dir='ltr'>(AY544878)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 1975 845 2600 930">
+     <span class='ocr_line' id='line_1_117' title="bbox 1975 845 2564 867; baseline 0 -5"><span class='ocrx_word' id='word_1_335' title='bbox 1975 855 1977 857; x_wconf 98' lang='eng'><strong><em>-</em></strong></span> <span class='ocrx_word' id='word_1_336' title='bbox 2077 845 2100 862; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_337' title='bbox 2110 845 2285 863; x_wconf 75' lang='eng' dir='ltr'>heckeshornense</span> <span class='ocrx_word' id='word_1_338' title='bbox 2294 845 2345 863; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_339' title='bbox 2353 845 2429 863; x_wconf 78' lang='eng' dir='ltr'>44428T</span> <span class='ocrx_word' id='word_1_340' title='bbox 2438 845 2564 867; x_wconf 81' lang='eng' dir='ltr'>(AY544830)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_118' title="bbox 2187 874 2600 897; baseline 0 -5"><span class='ocrx_word' id='word_1_341' title='bbox 2187 874 2210 892; x_wconf 70' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_342' title='bbox 2220 874 2323 892; x_wconf 78' lang='eng' dir='ltr'>botm‘ense</span> <span class='ocrx_word' id='word_1_343' title='bbox 2332 874 2382 892; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_344' title='bbox 2391 874 2466 892; x_wconf 73' lang='eng' dir='ltr'>44537T</span> <span class='ocrx_word' id='word_1_345' title='bbox 2474 874 2600 897; x_wconf 85' lang='eng' dir='ltr'>(AY544806)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_119' title="bbox 2045 907 2411 930; baseline 0 -5"><span class='ocrx_word' id='word_1_346' title='bbox 2045 908 2068 925; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_347' title='bbox 2078 908 2133 925; x_wconf 84' lang='eng' dir='ltr'>lacus</span> <span class='ocrx_word' id='word_1_348' title='bbox 2143 908 2192 925; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_349' title='bbox 2201 907 2276 925; x_wconf 74' lang='eng' dir='ltr'>44577T</span> <span class='ocrx_word' id='word_1_350' title='bbox 2285 908 2411 930; x_wconf 83' lang='eng' dir='ltr'>(AY544841)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 1982 939 2401 962">
+     <span class='ocr_line' id='line_1_120' title="bbox 1982 939 2401 962; baseline -0.002 -5"><span class='ocrx_word' id='word_1_351' title='bbox 1982 939 2005 956; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_352' title='bbox 2016 939 2143 957; x_wconf 78' lang='eng' dir='ltr'>tuberculosis</span> <span class='ocrx_word' id='word_1_353' title='bbox 2150 939 2188 957; x_wconf 86' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_354' title='bbox 2197 939 2265 957; x_wconf 74' lang='eng' dir='ltr'>64.31T</span> <span class='ocrx_word' id='word_1_355' title='bbox 2274 939 2401 962; x_wconf 84' lang='eng' dir='ltr'>(AY544875)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 1967 969 2429 992">
+     <span class='ocr_line' id='line_1_121' title="bbox 1967 969 2429 992; baseline 0 -5"><span class='ocrx_word' id='word_1_356' title='bbox 1967 970 1990 988; x_wconf 89' lang='eng'>10</span> <span class='ocrx_word' id='word_1_357' title='bbox 2027 970 2050 987; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_358' title='bbox 2061 970 2150 988; x_wconf 80' lang='eng' dir='ltr'>ulcerans</span> <span class='ocrx_word' id='word_1_359' title='bbox 2159 970 2197 988; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_360' title='bbox 2207 969 2293 988; x_wconf 85' lang='eng' dir='ltr'>105425T</span> <span class='ocrx_word' id='word_1_361' title='bbox 2303 970 2429 992; x_wconf 85' lang='eng' dir='ltr'>(AY544876)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 2040 999 2445 1022">
+     <span class='ocr_line' id='line_1_122' title="bbox 2040 999 2445 1022; baseline 0 -5"><span class='ocrx_word' id='word_1_362' title='bbox 2040 1000 2063 1017; x_wconf 97' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_363' title='bbox 2073 1000 2165 1017; x_wconf 84' lang='eng' dir='ltr'><em>marinum</em></span> <span class='ocrx_word' id='word_1_364' title='bbox 2174 1000 2212 1017; x_wconf 91' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_365' title='bbox 2223 999 2309 1017; x_wconf 80' lang='eng' dir='ltr'>104528T</span> <span class='ocrx_word' id='word_1_366' title='bbox 2319 1000 2445 1022; x_wconf 85' lang='eng' dir='ltr'>(AY544845)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 2035 1030 2432 1053">
+     <span class='ocr_line' id='line_1_123' title="bbox 2035 1030 2432 1053; baseline 0.003 -6"><span class='ocrx_word' id='word_1_367' title='bbox 2035 1030 2058 1047; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_368' title='bbox 2068 1030 2155 1048; x_wconf 73' lang='eng' dir='ltr'>kansasii</span> <span class='ocrx_word' id='word_1_369' title='bbox 2162 1030 2200 1048; x_wconf 92' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_370' title='bbox 2210 1030 2297 1048; x_wconf 81' lang='eng' dir='ltr'>104589T</span> <span class='ocrx_word' id='word_1_371' title='bbox 2305 1030 2432 1053; x_wconf 84' lang='eng' dir='ltr'>(AY544838)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 2051 1061 2420 1084">
+     <span class='ocr_line' id='line_1_124' title="bbox 2051 1061 2420 1084; baseline 0 -5"><span class='ocrx_word' id='word_1_372' title='bbox 2051 1062 2074 1079; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_373' title='bbox 2084 1062 2143 1084; x_wconf 70' lang='eng' dir='ltr'>gastri</span> <span class='ocrx_word' id='word_1_374' title='bbox 2150 1062 2188 1080; x_wconf 91' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_375' title='bbox 2198 1061 2285 1080; x_wconf 79' lang='eng' dir='ltr'>104530T</span> <span class='ocrx_word' id='word_1_376' title='bbox 2294 1062 2420 1084; x_wconf 85' lang='eng' dir='ltr'>(AY544825)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 2061 1092 2446 1115">
+     <span class='ocr_line' id='line_1_125' title="bbox 2061 1092 2446 1115; baseline 0 -5"><span class='ocrx_word' id='word_1_377' title='bbox 2061 1092 2084 1110; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_378' title='bbox 2094 1092 2169 1115; x_wconf 84' lang='eng' dir='ltr'>szu/gai</span> <span class='ocrx_word' id='word_1_379' title='bbox 2176 1092 2214 1110; x_wconf 89' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_380' title='bbox 2224 1092 2311 1110; x_wconf 77' lang='eng' dir='ltr'>104532T</span> <span class='ocrx_word' id='word_1_381' title='bbox 2320 1092 2446 1115; x_wconf 86' lang='eng' dir='ltr'>(AY544867)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 2040 1121 2452 1144">
+     <span class='ocr_line' id='line_1_126' title="bbox 2040 1121 2452 1144; baseline 0 -5"><span class='ocrx_word' id='word_1_382' title='bbox 2040 1122 2063 1139; x_wconf 97' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_383' title='bbox 2073 1122 2175 1139; x_wconf 82' lang='eng' dir='ltr'>shimoidei</span> <span class='ocrx_word' id='word_1_384' title='bbox 2183 1121 2232 1139; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_385' title='bbox 2241 1121 2316 1139; x_wconf 87' lang='eng' dir='ltr'>44152T</span> <span class='ocrx_word' id='word_1_386' title='bbox 2326 1121 2452 1144; x_wconf 84' lang='eng' dir='ltr'>(AY544863)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 1985 1154 2423 1176">
+     <span class='ocr_line' id='line_1_127' title="bbox 1985 1154 2423 1176; baseline -0.002 -4"><span class='ocrx_word' id='word_1_387' title='bbox 1985 1154 2008 1171; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_388' title='bbox 2018 1154 2145 1176; x_wconf 82' lang='eng' dir='ltr'><em>conspicuum</em></span> <span class='ocrx_word' id='word_1_389' title='bbox 2154 1154 2191 1172; x_wconf 86' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_390' title='bbox 2202 1154 2288 1172; x_wconf 78' lang='eng' dir='ltr'>105165T</span> <span class='ocrx_word' id='word_1_391' title='bbox 2297 1154 2423 1176; x_wconf 86' lang='eng' dir='ltr'>(AY544814)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 2051 1181 2553 1204">
+     <span class='ocr_line' id='line_1_128' title="bbox 2051 1181 2553 1204; baseline 0 -5"><span class='ocrx_word' id='word_1_392' title='bbox 2051 1182 2074 1199; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_393' title='bbox 2083 1182 2273 1204; x_wconf 78' lang='eng' dir='ltr'>parascmfulaceum</span> <span class='ocrx_word' id='word_1_394' title='bbox 2282 1182 2321 1199; x_wconf 94' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_395' title='bbox 2331 1181 2418 1199; x_wconf 75' lang='eng' dir='ltr'>108112T</span> <span class='ocrx_word' id='word_1_396' title='bbox 2427 1182 2553 1204; x_wconf 85' lang='eng' dir='ltr'>(AY943181)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 2019 1212 2529 1260">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 2019 1212 2529 1260">
+     <span class='ocr_line' id='line_1_129' title="bbox 2019 1212 2447 1234; baseline 0.002 -5"><span class='ocrx_word' id='word_1_397' title='bbox 2019 1212 2042 1229; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_398' title='bbox 2052 1212 2169 1234; x_wconf 78' lang='eng' dir='ltr'>interjectum</span> <span class='ocrx_word' id='word_1_399' title='bbox 2178 1212 2228 1230; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_400' title='bbox 2237 1212 2312 1230; x_wconf 60' lang='eng' dir='ltr'>44064T</span> <span class='ocrx_word' id='word_1_401' title='bbox 2321 1212 2447 1234; x_wconf 85' lang='eng' dir='ltr'>(AY544835)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_130' title="bbox 2113 1237 2529 1260; baseline 0 -5"><span class='ocrx_word' id='word_1_402' title='bbox 2113 1238 2136 1255; x_wconf 70' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_403' title='bbox 2145 1242 2252 1260; x_wconf 83' lang='eng' dir='ltr'>parmense</span> <span class='ocrx_word' id='word_1_404' title='bbox 2260 1237 2298 1255; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_405' title='bbox 2308 1237 2395 1255; x_wconf 72' lang='eng' dir='ltr'>107385T</span> <span class='ocrx_word' id='word_1_406' title='bbox 2403 1237 2529 1260; x_wconf 86' lang='eng' dir='ltr'>(AY943182)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 1967 1267 2453 1321">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 1967 1267 2453 1321">
+     <span class='ocr_line' id='line_1_131' title="bbox 2019 1267 2453 1290; baseline 0.002 -5"><span class='ocrx_word' id='word_1_407' title='bbox 2019 1268 2042 1285; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_408' title='bbox 2052 1268 2175 1286; x_wconf 82' lang='eng' dir='ltr'><em>bohemicum</em></span> <span class='ocrx_word' id='word_1_409' title='bbox 2184 1268 2222 1286; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_410' title='bbox 2232 1267 2318 1286; x_wconf 87' lang='eng' dir='ltr'>105811T</span> <span class='ocrx_word' id='word_1_411' title='bbox 2328 1268 2453 1290; x_wconf 87' lang='eng' dir='ltr'>(AY544805)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_132' title="bbox 1967 1298 2361 1321; baseline 0 -5"><span class='ocrx_word' id='word_1_412' title='bbox 1967 1298 1989 1316; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_413' title='bbox 2000 1298 2082 1316; x_wconf 77' lang='eng' dir='ltr'>celatum</span> <span class='ocrx_word' id='word_1_414' title='bbox 2091 1298 2129 1316; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_415' title='bbox 2139 1298 2225 1316; x_wconf 73' lang='eng' dir='ltr'>106109T</span> <span class='ocrx_word' id='word_1_416' title='bbox 2235 1298 2361 1321; x_wconf 85' lang='eng' dir='ltr'>(AY544812)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 1980 1329 2496 1378">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 1980 1329 2496 1378">
+     <span class='ocr_line' id='line_1_133' title="bbox 1980 1329 2265 1352; baseline 0 -5"><span class='ocrx_word' id='word_1_417' title='bbox 1980 1329 2032 1347; x_wconf 94' lang='eng' dir='ltr'>KUM</span> <span class='ocrx_word' id='word_1_418' title='bbox 2041 1329 2130 1347; x_wconf 79' lang='eng' dir='ltr'>060204T</span> <span class='ocrx_word' id='word_1_419' title='bbox 2139 1329 2265 1352; x_wconf 86' lang='eng' dir='ltr'>(AB370184)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_134' title="bbox 1982 1355 2496 1378; baseline 0 -5"><span class='ocrx_word' id='word_1_420' title='bbox 1982 1356 2005 1373; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_421' title='bbox 2016 1356 2219 1373; x_wconf 73' lang='eng' dir='ltr'>saskatchewanense</span> <span class='ocrx_word' id='word_1_422' title='bbox 2227 1356 2265 1373; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_423' title='bbox 2275 1355 2361 1373; x_wconf 71' lang='eng' dir='ltr'>108114T</span> <span class='ocrx_word' id='word_1_424' title='bbox 2370 1356 2496 1378; x_wconf 87' lang='eng' dir='ltr'>(AY943183)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 1686 1396 2178 1419">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 1686 1396 2178 1419">
+     <span class='ocr_line' id='line_1_135' title="bbox 1686 1396 2178 1419; baseline 0 -5"><span class='ocrx_word' id='word_1_425' title='bbox 1686 1397 1780 1414; x_wconf 81' lang='eng' dir='ltr'><em>Nocardia</em></span> <span class='ocrx_word' id='word_1_426' title='bbox 1789 1397 1901 1414; x_wconf 82' lang='eng' dir='ltr'>abscessus</span> <span class='ocrx_word' id='word_1_427' title='bbox 1910 1396 1960 1414; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_428' title='bbox 1968 1396 2043 1414; x_wconf 71' lang='eng' dir='ltr'>44432T</span> <span class='ocrx_word' id='word_1_429' title='bbox 2053 1396 2178 1419; x_wconf 86' lang='eng' dir='ltr'>(AY544981)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 1344 753 2184 1411">
+    <p class='ocr_par' dir='ltr' id='par_1_60' title="bbox 1344 753 2184 1411">
+     <span class='ocr_line' id='line_1_136' title="bbox 1671 753 2064 783; baseline 0 -13"><span class='ocrx_word' id='word_1_430' title='bbox 1671 753 2064 783; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_137' title="bbox 1671 783 1961 881; baseline 0 0"><span class='ocrx_word' id='word_1_431' title='bbox 1671 783 1961 881; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_138' title="bbox 1671 881 2184 896; baseline 0 577"><span class='ocrx_word' id='word_1_432' title='bbox 1671 881 2184 896; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_139' title="bbox 1671 896 2045 941; baseline 0 0"><span class='ocrx_word' id='word_1_433' title='bbox 1671 896 2045 941; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_140' title="bbox 1671 941 1980 961; baseline 0 512"><span class='ocrx_word' id='word_1_434' title='bbox 1671 941 1980 961; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_141' title="bbox 1345 961 2020 1003; baseline 0 -6"><span class='ocrx_word' id='word_1_435' title='bbox 1345 961 2011 1003; x_wconf 95' lang='eng' dir='ltr'>   </span> <span class='ocrx_word' id='word_1_436' title='bbox 1990 973 2020 997; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_142' title="bbox 1345 1003 2034 1033; baseline 0 440"><span class='ocrx_word' id='word_1_437' title='bbox 1345 1003 2034 1033; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_143' title="bbox 1345 1033 2035 1064; baseline 0 409"><span class='ocrx_word' id='word_1_438' title='bbox 1345 1033 2035 1064; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_144' title="bbox 1345 1064 2051 1095; baseline 0 378"><span class='ocrx_word' id='word_1_439' title='bbox 1345 1064 2051 1095; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_145' title="bbox 1345 1095 2059 1110; baseline 0 363"><span class='ocrx_word' id='word_1_440' title='bbox 1345 1095 2059 1110; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_146' title="bbox 1345 1110 2040 1126; baseline 0 347"><span class='ocrx_word' id='word_1_441' title='bbox 1345 1110 2040 1126; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_147' title="bbox 1345 1126 2031 1155; baseline 0 0"><span class='ocrx_word' id='word_1_442' title='bbox 1345 1126 2031 1155; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_148' title="bbox 1345 1155 2046 1201; baseline 0 0"><span class='ocrx_word' id='word_1_443' title='bbox 1345 1155 2046 1201; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_149' title="bbox 1345 1201 2109 1256; baseline 0 -11"><span class='ocrx_word' id='word_1_444' title='bbox 1345 1201 2109 1256; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_150' title="bbox 1345 1256 2019 1301; baseline 0 0"><span class='ocrx_word' id='word_1_445' title='bbox 1345 1256 2019 1301; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_151' title="bbox 1344 1301 1976 1385; baseline 0 -53"><span class='ocrx_word' id='word_1_446' title='bbox 1344 1301 1976 1385; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_152' title="bbox 1344 1385 1677 1411; baseline 0 62"><span class='ocrx_word' id='word_1_447' title='bbox 1344 1385 1677 1411; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 1984 815 2184 881">
+    <p class='ocr_par' dir='ltr' id='par_1_61' title="bbox 1984 815 2184 881">
+     <span class='ocr_line' id='line_1_153' title="bbox 1984 815 2184 881; baseline 0.015 -3"><span class='ocrx_word' id='word_1_448' title='bbox 1984 815 2184 881; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 1642 980 1666 997">
+    <p class='ocr_par' dir='ltr' id='par_1_62' title="bbox 1642 980 1666 997">
+     <span class='ocr_line' id='line_1_154' title="bbox 1642 980 1666 997; baseline 0 0"><span class='ocrx_word' id='word_1_449' title='bbox 1642 980 1666 997; x_wconf 83' lang='eng'>97</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000794-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000794-0-000.pbm.png
new file mode 100644
index 00000000..8195d16f
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000794-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000794-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000794-0-000.pbm.png.hocr
new file mode 100644
index 00000000..370b6c36
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000794-0-000.pbm.png.hocr
@@ -0,0 +1,98 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000794-0-000.pbm.png"; bbox 0 0 1089 809; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 259 0 1089 809">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 311 0 1006 396">
+     <span class='ocr_line' id='line_1_1' title="bbox 411 0 998 28; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 411 1 530 22; x_wconf 88' lang='eng' dir='ltr'><em>Lewinella</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 538 1 631 28; x_wconf 83' lang='eng' dir='ltr'><em>persica</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 641 1 720 22; x_wconf 90' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 733 0 836 22; x_wconf 90' lang='eng' dir='ltr'><em>102663T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 846 1 998 28; x_wconf 74' lang='eng' dir='ltr'><em>(ABBO‘IG‘IB)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 444 46 984 74; baseline 0 -6"><span class='ocrx_word' id='word_1_6' title='bbox 444 47 561 68; x_wconf 84' lang='eng' dir='ltr'><em>Lewinel/a</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 572 47 700 74; x_wconf 73' lang='eng' dir='ltr'><em>agan’lytica</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 710 46 817 68; x_wconf 80' lang='eng' dir='ltr'><em>SST-19T</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 827 47 984 74; x_wconf 84' lang='eng' dir='ltr'>(AM286229)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 417 92 1006 120; baseline 0 -6"><span class='ocrx_word' id='word_1_10' title='bbox 417 93 546 114; x_wconf 87' lang='eng' dir='ltr'><em>Lewinella</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 555 93 690 114; x_wconf 86' lang='eng' dir='ltr'><em>antarctica</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 700 92 847 114; x_wconf 80' lang='eng' dir='ltr'><em>IMCC3223T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 856 93 1006 120; x_wconf 88' lang='eng' dir='ltr'><em>(EF554367)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 421 138 978 166; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 421 139 540 160; x_wconf 86' lang='eng' dir='ltr'><em>LewineI/a</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 549 139 610 160; x_wconf 86' lang='eng' dir='ltr'><em>Iutea</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 621 139 699 160; x_wconf 90' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 712 138 816 160; x_wconf 79' lang='eng' dir='ltr'><em>102634T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 826 139 978 166; x_wconf 88' lang='eng' dir='ltr'><em>(AB301494)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 390 184 972 211; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 390 185 508 206; x_wconf 88' lang='eng' dir='ltr'><em>Lewine/la</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 518 185 604 206; x_wconf 87' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 615 185 693 206; x_wconf 87' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 707 184 810 206; x_wconf 83' lang='eng' dir='ltr'><em>102633T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 820 185 972 211; x_wconf 78' lang='eng' dir='ltr'><em>(ABSO1495)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 334 230 963 257; baseline 0 -5"><span class='ocrx_word' id='word_1_24' title='bbox 334 231 452 252; x_wconf 87' lang='eng' dir='ltr'><em>Lewinella</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 463 231 596 252; x_wconf 82' lang='eng' dir='ltr'><em>cohaerens</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 606 231 684 252; x_wconf 92' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 697 230 801 252; x_wconf 74' lang='eng' dir='ltr'><em>102661T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 811 231 963 257; x_wconf 74' lang='eng' dir='ltr'><em>(ABBO1614)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 329 276 939 304; baseline 0 -6"><span class='ocrx_word' id='word_1_29' title='bbox 329 277 448 298; x_wconf 86' lang='eng' dir='ltr'><em>Lewinella</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 458 277 572 304; x_wconf 84' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 582 277 661 298; x_wconf 90' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 674 276 778 298; x_wconf 76' lang='eng' dir='ltr'><em>102662T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 787 277 939 304; x_wconf 75' lang='eng' dir='ltr'><em>(ABBO1615)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 311 322 1003 350; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 311 323 559 344; x_wconf 81' lang='eng' dir='ltr'><em>Haliscomenobacter</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 565 323 686 350; x_wconf 87' lang='eng' dir='ltr'><em>hydrossis</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 695 323 771 344; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 782 322 872 344; x_wconf 89' lang='eng' dir='ltr'><em>27775T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 883 323 1003 350; x_wconf 86' lang='eng' dir='ltr'>(M58790)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 373 368 811 396; baseline 0 -6"><span class='ocrx_word' id='word_1_39' title='bbox 373 369 502 396; x_wconf 87' lang='eng' dir='ltr'><em>Aureispira</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 512 369 598 390; x_wconf 87' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 607 368 649 390; x_wconf 94' lang='eng' dir='ltr'><em>24T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 660 369 811 396; x_wconf 84' lang='eng' dir='ltr'><em>(AB245933)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 280 414 1089 717">
+     <span class='ocr_line' id='line_1_10' title="bbox 444 414 1041 441; baseline 0 -5"><span class='ocrx_word' id='word_1_43' title='bbox 444 415 557 436; x_wconf 83' lang='eng' dir='ltr'><em>Flexithrix</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 567 415 695 436; x_wconf 87' lang='eng' dir='ltr'><em>dorotheae</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 704 415 780 436; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 791 414 881 436; x_wconf 75' lang='eng' dir='ltr'><em>23163T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 891 415 1041 441; x_wconf 86' lang='eng' dir='ltr'><em>(AF039296)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 381 460 989 487; baseline 0 -5"><span class='ocrx_word' id='word_1_48' title='bbox 381 461 559 482; x_wconf 76' lang='eng' dir='ltr'><em>Persicobacter</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 565 461 671 482; x_wconf 81' lang='eng' dir='ltr'><em>diff/uens</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 680 461 757 482; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 767 460 858 482; x_wconf 88' lang='eng' dir='ltr'><em>23140T</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 868 461 989 487; x_wconf 87' lang='eng' dir='ltr'>(M58765)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 468 506 1012 533; baseline 0 -5"><span class='ocrx_word' id='word_1_53' title='bbox 468 507 610 528; x_wconf 82' lang='eng' dir='ltr'><em>Flexibacter</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 617 506 695 528; x_wconf 82' lang='eng' dir='ltr'><em>ﬂexilis</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 703 506 780 528; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 790 506 881 528; x_wconf 76' lang='eng' dir='ltr'><em>23079T</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 891 507 1012 533; x_wconf 88' lang='eng' dir='ltr'><em>(M62794)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 452 552 1022 579; baseline -0.002 -5"><span class='ocrx_word' id='word_1_58' title='bbox 452 553 625 574; x_wconf 84' lang='eng' dir='ltr'><em>FIectobaciI/us</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 634 553 708 579; x_wconf 87' lang='eng' dir='ltr'><em>major</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 713 552 790 574; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 801 552 891 574; x_wconf 87' lang='eng' dir='ltr'><em>29496T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 901 553 1022 579; x_wconf 88' lang='eng' dir='ltr'><em>(M62787)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 386 597 1089 626; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 386 598 616 626; x_wconf 81' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 626 599 772 626; x_wconf 77' lang='eng' dir='ltr'><em>spirit/vorurn</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 781 598 857 620; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 869 597 959 620; x_wconf 73' lang='eng' dir='ltr'><em>33861T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 968 599 1089 626; x_wconf 88' lang='eng' dir='ltr'><em>(M58778)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 382 644 979 672; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 382 645 549 672; x_wconf 85' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 557 645 663 671; x_wconf 88' lang='eng' dir='ltr'><em>pinensis</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 671 645 733 666; x_wconf 94' lang='eng' dir='ltr'><em>ACM</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 744 644 819 666; x_wconf 82' lang='eng' dir='ltr'><em>2034T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 829 645 979 671; x_wconf 87' lang='eng' dir='ltr'>(AF078775)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 280 690 817 717; baseline -0.002 -5"><span class='ocrx_word' id='word_1_73' title='bbox 280 691 423 717; x_wconf 80' lang='eng' dir='ltr'><em>Aequorivita</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 433 691 557 712; x_wconf 83' lang='eng' dir='ltr'><em>antarctica</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 567 690 656 712; x_wconf 78' lang='eng' dir='ltr'><em>SW49T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 666 691 817 717; x_wconf 89' lang='eng' dir='ltr'>(AY027802)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 259 735 892 809">
+     <span class='ocr_line' id='line_1_17' title="bbox 270 735 892 763; baseline 0 -5"><span class='ocrx_word' id='word_1_77' title='bbox 270 737 465 758; x_wconf 79' lang='eng' dir='ltr'><em>Flavobacterium</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 475 737 574 763; x_wconf 79' lang='eng' dir='ltr'><em>aquati/e</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 583 736 660 758; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 673 735 761 758; x_wconf 88' lang='eng' dir='ltr'><em>11947T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 771 737 892 763; x_wconf 88' lang='eng' dir='ltr'>(M62797)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 259 782 769 809; baseline -0.002 -5"><span class='ocrx_word' id='word_1_82' title='bbox 259 783 446 804; x_wconf 76' lang='eng' dir='ltr'><em>Rhodothermus</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 456 783 557 804; x_wconf 84' lang='eng' dir='ltr'><em>man&#39;nus</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 566 782 642 804; x_wconf 92' lang='eng' dir='ltr'>OKD7</span> <span class='ocrx_word' id='word_1_85' title='bbox 653 783 769 809; x_wconf 85' lang='eng' dir='ltr'><em>(X95071)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 4 462 798">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 0 4 462 798">
+     <span class='ocr_line' id='line_1_19' title="bbox 303 4 436 88; baseline 0 0"><span class='ocrx_word' id='word_1_86' title='bbox 303 4 436 88; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 210 88 416 180; baseline 0 0"><span class='ocrx_word' id='word_1_87' title='bbox 210 88 416 180; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 151 180 384 270; baseline 0 -53"><span class='ocrx_word' id='word_1_88' title='bbox 151 180 384 270; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 101 270 328 364; baseline 0 -56"><span class='ocrx_word' id='word_1_89' title='bbox 101 270 328 364; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 57 364 438 454; baseline 0 0"><span class='ocrx_word' id='word_1_90' title='bbox 57 364 438 454; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 57 454 381 500; baseline 0 309"><span class='ocrx_word' id='word_1_91' title='bbox 57 454 381 500; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 57 500 462 539; baseline 0 270"><span class='ocrx_word' id='word_1_92' title='bbox 57 500 462 539; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 53 539 452 592; baseline 0 0"><span class='ocrx_word' id='word_1_93' title='bbox 53 539 452 592; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 0 677 277 730; baseline 0 0"><span class='ocrx_word' id='word_1_94' title='bbox 0 677 277 730; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 0 730 265 798; baseline 0 0"><span class='ocrx_word' id='word_1_95' title='bbox 0 730 265 798; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 106 67 144 82">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 106 67 144 82">
+     <span class='ocr_line' id='line_1_29' title="bbox 106 67 144 82; baseline 0 0"><span class='ocrx_word' id='word_1_96' title='bbox 106 67 144 82; x_wconf 84' lang='eng'>0.05</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 86 93 164 96">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 86 93 164 96">
+     <span class='ocr_line' id='line_1_30' title="bbox 86 93 164 96; baseline 0 713"><span class='ocrx_word' id='word_1_97' title='bbox 86 93 164 96; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000802-0-002.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000802-0-002.pbm.png
new file mode 100644
index 00000000..d6f9794b
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000802-0-002.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000802-0-002.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000802-0-002.pbm.png.hocr
new file mode 100644
index 00000000..ea762aa3
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000802-0-002.pbm.png.hocr
@@ -0,0 +1,87 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000802-0-002.pbm.png"; bbox 0 0 994 429; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 199 0 994 429">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 244 0 920 80">
+     <span class='ocr_line' id='line_1_1' title="bbox 244 0 920 32; baseline 0 -8"><span class='ocrx_word' id='word_1_1' title='bbox 244 15 267 32; x_wconf 74' lang='eng'>99</span> <span class='ocrx_word' id='word_1_2' title='bbox 292 3 512 24; x_wconf 84' lang='eng' dir='ltr'><em>Thermobrachium</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 522 3 601 24; x_wconf 84' lang='eng' dir='ltr'><em>celere</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 610 0 791 24; x_wconf 86' lang='eng' dir='ltr'><em>JW/YL—N235T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 801 3 920 30; x_wconf 83' lang='eng' dir='ltr'><em>(X99238)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 298 50 792 80; baseline 0 -6"><span class='ocrx_word' id='word_1_6' title='bbox 298 52 558 74; x_wconf 81' lang='eng' dir='ltr'><em>Ca/oramatorindicus</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 569 50 662 74; x_wconf 91' lang='eng' dir='ltr'><em>|ndiB4T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 672 52 792 80; x_wconf 84' lang='eng' dir='ltr'><em>(X75788)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 292 102 942 229">
+     <span class='ocr_line' id='line_1_3' title="bbox 292 102 942 130; baseline 0 -6"><span class='ocrx_word' id='word_1_9' title='bbox 292 102 462 124; x_wconf 77' lang='eng' dir='ltr'><em>‘Ca/oramator</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 469 102 611 124; x_wconf 85' lang='eng' dir='ltr'><em>uzoniensis’</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 622 102 778 124; x_wconf 87' lang='eng' dir='ltr'><em>JW/VK—KU2</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 789 102 942 130; x_wconf 87' lang='eng' dir='ltr'><em>(AF489534)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 334 149 871 179; baseline 0 -6"><span class='ocrx_word' id='word_1_13' title='bbox 334 152 497 173; x_wconf 83' lang='eng' dir='ltr'><em>Caloramator</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 503 152 700 179; x_wconf 82' lang='eng' dir='ltr'><em>proteoc/asticus</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 710 149 741 173; x_wconf 95' lang='eng' dir='ltr'><em>UT</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 752 152 871 179; x_wconf 86' lang='eng' dir='ltr'><em>(X90488)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 307 199 809 229; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 307 201 470 223; x_wconf 86' lang='eng' dir='ltr'><em>Caloramator</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 477 202 609 223; x_wconf 83' lang='eng' dir='ltr'><em>coo/haasi/</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 616 199 646 223; x_wconf 95' lang='eng' dir='ltr'><em>ZT</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 656 202 809 229; x_wconf 88' lang='eng' dir='ltr'><em>(AF104215)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 206 249 994 332">
+     <span class='ocr_line' id='line_1_6' title="bbox 206 249 994 279; baseline 0 -6"><span class='ocrx_word' id='word_1_21' title='bbox 206 261 323 263; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_22' title='bbox 333 251 496 273; x_wconf 81' lang='eng' dir='ltr'><em>Caloramator</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 504 251 649 273; x_wconf 77' lang='eng' dir='ltr'><em>viterbiensis</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 658 249 831 273; x_wconf 79' lang='eng' dir='ltr'><em>JW/MS-VSST</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 841 251 994 279; x_wconf 88' lang='eng' dir='ltr'><em>(AF181848)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 230 298 915 332; baseline 0 -8"><span class='ocrx_word' id='word_1_26' title='bbox 230 316 264 332; x_wconf 66' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 274 311 326 313; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_28' title='bbox 335 301 510 324; x_wconf 88' lang='eng' dir='ltr'><em>Caloramator</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 517 302 672 324; x_wconf 87' lang='eng' dir='ltr'><em>australicus</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 682 298 751 324; x_wconf 90' lang='eng' dir='ltr'><em>RC3T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 759 301 915 329; x_wconf 85' lang='eng' dir='ltr'><em>(EU409943)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 199 349 916 429">
+     <span class='ocr_line' id='line_1_8' title="bbox 274 349 916 379; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 274 361 318 363; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_33' title='bbox 327 351 490 373; x_wconf 81' lang='eng' dir='ltr'><em>Caloramator</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 497 351 599 373; x_wconf 88' lang='eng' dir='ltr'><em>fen/idus</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 608 351 687 373; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 696 349 790 373; x_wconf 90' lang='eng' dir='ltr'><em>43204T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 801 351 916 379; x_wconf 88' lang='eng' dir='ltr'><em>(L09187)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 199 399 807 429; baseline 0 -6"><span class='ocrx_word' id='word_1_38' title='bbox 199 401 344 423; x_wconf 86' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 354 401 480 429; x_wconf 76' lang='eng' dir='ltr'><em>butyricum</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 489 401 568 423; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 581 399 672 423; x_wconf 79' lang='eng' dir='ltr'><em>19398T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 682 401 807 429; x_wconf 88' lang='eng' dir='ltr'><em>(M59085)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 88 27 129 43">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 88 27 129 43">
+     <span class='ocr_line' id='line_1_10' title="bbox 88 27 129 43; baseline 0 0"><span class='ocrx_word' id='word_1_43' title='bbox 88 27 129 43; x_wconf 88' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 0 48 329 417">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 0 48 329 417">
+     <span class='ocr_line' id='line_1_11' title="bbox 256 48 293 95; baseline 0 -7"><span class='ocrx_word' id='word_1_44' title='bbox 256 48 293 95; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 185 95 292 144; baseline 0 285"><span class='ocrx_word' id='word_1_45' title='bbox 185 95 292 144; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 0 144 329 184; baseline 0 245"><span class='ocrx_word' id='word_1_46' title='bbox 0 144 329 184; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 0 184 307 283; baseline 0 0"><span class='ocrx_word' id='word_1_47' title='bbox 0 184 307 283; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 0 283 210 344; baseline 0 85"><span class='ocrx_word' id='word_1_48' title='bbox 0 283 210 344; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 0 344 210 417; baseline 0 0"><span class='ocrx_word' id='word_1_49' title='bbox 0 344 210 417; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 204 261 206 338">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 204 261 206 338">
+     <span class='ocr_line' id='line_1_17' title="bbox 204 261 206 338; baseline 0 91"><span class='ocrx_word' id='word_1_50' title='bbox 204 261 206 338; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 204 336 275 338">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 204 336 275 338">
+     <span class='ocr_line' id='line_1_18' title="bbox 204 336 275 338; baseline 0 91"><span class='ocrx_word' id='word_1_51' title='bbox 204 336 275 338; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 272 311 274 363">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 272 311 274 363">
+     <span class='ocr_line' id='line_1_19' title="bbox 272 311 274 363; baseline 0 66"><span class='ocrx_word' id='word_1_52' title='bbox 272 311 274 363; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000851-0-002.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000851-0-002.pbm.png
new file mode 100644
index 00000000..a9c8a980
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000851-0-002.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000851-0-002.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000851-0-002.pbm.png.hocr
new file mode 100644
index 00000000..9383debd
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000851-0-002.pbm.png.hocr
@@ -0,0 +1,155 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000851-0-002.pbm.png"; bbox 0 0 1302 781; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 412 6 1301 728">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 517 6 1118 34">
+     <span class='ocr_line' id='line_1_1' title="bbox 517 6 1118 34; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 517 7 663 28; x_wconf 83' lang='eng' dir='ltr'><em>Arcobacter</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 670 7 765 28; x_wconf 83' lang='eng' dir='ltr'><em>butz/eri</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 772 6 851 28; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 860 6 953 28; x_wconf 80' lang='eng' dir='ltr'><em>49616T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 963 6 1054 34; x_wconf 88' lang='eng' dir='ltr'><em>(AY621</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1062 6 1070 28; x_wconf 98' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1079 6 1118 34; x_wconf 88' lang='eng'><em>16)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 413 55 1095 84">
+     <span class='ocr_line' id='line_1_2' title="bbox 413 55 1095 84; baseline -0.001 -6"><span class='ocrx_word' id='word_1_8' title='bbox 413 64 528 66; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_9' title='bbox 536 56 701 78; x_wconf 87' lang='eng' dir='ltr'><em>Helicobacter</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 706 56 778 84; x_wconf 87' lang='eng' dir='ltr'><em>pylori</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 787 56 866 78; x_wconf 91' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 879 56 887 77; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 895 55 968 78; x_wconf 83' lang='eng' dir='ltr'><em>1637T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 978 56 1080 84; x_wconf 90' lang='eng'><em>(225741</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1088 56 1095 84; x_wconf 93' lang='eng'>)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 412 105 1253 233">
+     <span class='ocr_line' id='line_1_3' title="bbox 412 105 1142 133; baseline 0 -6"><span class='ocrx_word' id='word_1_16' title='bbox 412 114 504 116; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_17' title='bbox 514 106 629 127; x_wconf 87' lang='eng' dir='ltr'><em>Wolinella</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 639 106 819 133; x_wconf 83' lang='eng' dir='ltr'><em>succinogenes</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 827 105 906 127; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 916 105 1008 127; x_wconf 85' lang='eng' dir='ltr'><em>29543T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1018 105 1142 133; x_wconf 85' lang='eng' dir='ltr'><em>(M88159)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 503 154 1253 183; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 503 155 701 183; x_wconf 85' lang='eng' dir='ltr'><em>Campy/obacter</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 709 155 771 177; x_wconf 81' lang='eng' dir='ltr'><em>fetus</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 780 155 864 183; x_wconf 86' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 876 155 939 177; x_wconf 83' lang='eng' dir='ltr'><em>fetus</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 947 155 1026 177; x_wconf 94' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1036 154 1127 177; x_wconf 85' lang='eng' dir='ltr'><em>27374T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1138 155 1253 183; x_wconf 88' lang='eng' dir='ltr'><em>(LO4314)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 439 204 1188 233; baseline -0.001 -6"><span class='ocrx_word' id='word_1_29' title='bbox 439 218 471 233; x_wconf 69' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 478 213 508 215; x_wconf 88' lang='eng'>—</span> <span class='ocrx_word' id='word_1_31' title='bbox 517 205 715 233; x_wconf 87' lang='eng' dir='ltr'><em>Campy/obacter</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 723 205 867 232; x_wconf 85' lang='eng' dir='ltr'><em>upsaliensis</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 877 205 960 227; x_wconf 91' lang='eng' dir='ltr'><em>CCUG</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 973 204 1062 227; x_wconf 81' lang='eng' dir='ltr'><em>14913T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1072 205 1188 233; x_wconf 87' lang='eng' dir='ltr'><em>(L14628)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 441 254 1301 728">
+     <span class='ocr_line' id='line_1_6' title="bbox 478 254 1156 282; baseline 0 -6"><span class='ocrx_word' id='word_1_36' title='bbox 478 263 491 265; x_wconf 92' lang='eng'>-</span> <span class='ocrx_word' id='word_1_37' title='bbox 499 254 698 282; x_wconf 84' lang='eng' dir='ltr'><em>Campy/obacter</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 704 255 834 276; x_wconf 82' lang='eng' dir='ltr'><em>helveticus</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 845 254 923 276; x_wconf 91' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 936 254 1025 276; x_wconf 83' lang='eng' dir='ltr'><em>12470T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 1035 254 1156 282; x_wconf 86' lang='eng' dir='ltr'><em>(U03022)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 498 305 1137 332; baseline 0 -6"><span class='ocrx_word' id='word_1_42' title='bbox 498 305 696 332; x_wconf 85' lang='eng' dir='ltr'><em>Campy/obacter</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 702 305 812 332; x_wconf 85' lang='eng' dir='ltr'><em>peloridis</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 822 305 883 326; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 896 305 969 326; x_wconf 90' lang='eng'>11251</span> <span class='ocrx_word' id='word_1_46' title='bbox 984 305 1137 332; x_wconf 87' lang='eng' dir='ltr'><em>(AF550632)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 496 351 1152 380; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 496 352 694 380; x_wconf 88' lang='eng' dir='ltr'><em>Campy/obacter</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 700 352 810 380; x_wconf 86' lang='eng' dir='ltr'><em>peloridis</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 820 352 880 374; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 891 351 982 374; x_wconf 84' lang='eng' dir='ltr'><em>23910T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 993 352 1152 380; x_wconf 86' lang='eng' dir='ltr'><em>(AM922331)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 483 402 1180 430; baseline -0.001 -6"><span class='ocrx_word' id='word_1_52' title='bbox 483 402 728 430; x_wconf 82' lang='eng' dir='ltr'><em>Campy/obacterlari</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 736 402 819 429; x_wconf 86' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 831 402 871 424; x_wconf 82' lang='eng' dir='ltr'><em>Iari</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 879 402 963 424; x_wconf 91' lang='eng' dir='ltr'><em>CCUG</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 973 402 1053 424; x_wconf 87' lang='eng'>23947</span> <span class='ocrx_word' id='word_1_57' title='bbox 1064 402 1180 430; x_wconf 86' lang='eng' dir='ltr'><em>(LO4316)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 488 451 1218 479; baseline 0 -6"><span class='ocrx_word' id='word_1_58' title='bbox 488 451 686 479; x_wconf 83' lang='eng' dir='ltr'><em>Campy/obacter</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 693 452 867 479; x_wconf 87' lang='eng' dir='ltr'><em>insulaenigrae</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 878 451 956 473; x_wconf 88' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 969 451 1058 473; x_wconf 82' lang='eng' dir='ltr'><em>12927T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1068 451 1218 479; x_wconf 88' lang='eng' dir='ltr'><em>(AJ620504)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 486 501 1284 529; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 486 501 730 529; x_wconf 86' lang='eng' dir='ltr'><em>Campy/obacter/ari</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 738 501 821 528; x_wconf 88' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 834 501 959 523; x_wconf 85' lang='eng' dir='ltr'><em>concheus</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 969 501 1029 523; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 1042 501 1120 523; x_wconf 86' lang='eng'>11760</span> <span class='ocrx_word' id='word_1_68' title='bbox 1131 501 1284 529; x_wconf 88' lang='eng' dir='ltr'><em>(AF550633)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 485 531 1301 578; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 485 531 730 578; x_wconf 57' lang='eng' dir='ltr'><em>1((2)21mpylobacter/ari</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 738 551 821 578; x_wconf 85' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 834 551 959 573; x_wconf 88' lang='eng' dir='ltr'><em>concheus</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 969 551 1029 573; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1040 550 1131 573; x_wconf 90' lang='eng' dir='ltr'><em>21009T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 1141 551 1301 578; x_wconf 86' lang='eng' dir='ltr'><em>(AM922330)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 441 600 1257 629; baseline 0 -6"><span class='ocrx_word' id='word_1_75' title='bbox 441 612 462 628; x_wconf 80' lang='eng'><em>55</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 483 601 757 629; x_wconf 85' lang='eng' dir='ltr'><em>Campy/obacterjejuni</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 765 601 848 628; x_wconf 86' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 860 601 937 629; x_wconf 86' lang='eng' dir='ltr'><em>doylei</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 946 601 1029 623; x_wconf 91' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_80' title='bbox 1040 600 1132 623; x_wconf 77' lang='eng' dir='ltr'><em>24567T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 1142 601 1257 629; x_wconf 85' lang='eng' dir='ltr'><em>(L14630)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 478 631 1248 678; baseline 0 -6"><span class='ocrx_word' id='word_1_82' title='bbox 478 631 755 678; x_wconf 53' lang='eng' dir='ltr'><em>1(goampylobacz‘erjejuni</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 762 651 846 678; x_wconf 89' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 853 651 927 678; x_wconf 87' lang='eng' dir='ltr'><em>jejuni</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 934 650 1013 672; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1023 650 1115 672; x_wconf 81' lang='eng' dir='ltr'><em>33560T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 1125 650 1248 678; x_wconf 84' lang='eng' dir='ltr'><em>(M59298)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 507 699 1078 728; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 507 700 706 728; x_wconf 87' lang='eng' dir='ltr'><em>Campy/obacter</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 713 700 757 722; x_wconf 88' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 764 700 843 722; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 853 699 945 722; x_wconf 83' lang='eng' dir='ltr'><em>33559T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 955 700 1078 728; x_wconf 86' lang='eng' dir='ltr'><em>(M59073)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 14 749 689 777">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 14 749 689 777">
+     <span class='ocr_line' id='line_1_16' title="bbox 14 749 689 777; baseline 0.001 -6"><span class='ocrx_word' id='word_1_93' title='bbox 14 750 188 772; x_wconf 79' lang='eng' dir='ltr'><em>Caminibacler</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 194 750 400 777; x_wconf 88' lang='eng' dir='ltr'><em>hydrogeniphilus</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 408 750 464 771; x_wconf 93' lang='eng' dir='ltr'><em>AM1</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 472 750 480 771; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 488 749 528 772; x_wconf 83' lang='eng' dir='ltr'><em>16T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 538 750 689 777; x_wconf 87' lang='eng' dir='ltr'><em>(AJ309655)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 129 34 337 54">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 129 34 337 54">
+     <span class='ocr_line' id='line_1_17' title="bbox 129 34 337 54; baseline 0.005 -1"><span class='ocrx_word' id='word_1_99' title='bbox 129 38 173 54; x_wconf 82' lang='eng'><em>10%</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 315 34 337 49; x_wconf 80' lang='eng'><em>58</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 2 10 516 352">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 2 10 516 352">
+     <span class='ocr_line' id='line_1_18' title="bbox 330 10 516 91; baseline 0 690"><span class='ocrx_word' id='word_1_101' title='bbox 330 10 516 91; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 2 91 495 247; baseline 0 -57"><span class='ocrx_word' id='word_1_102' title='bbox 2 91 495 247; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 330 247 444 352; baseline 0 429"><span class='ocrx_word' id='word_1_103' title='bbox 330 247 444 352; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 410 67 412 116">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 410 67 412 116">
+     <span class='ocr_line' id='line_1_21' title="bbox 410 67 412 116; baseline 0 665"><span class='ocrx_word' id='word_1_104' title='bbox 410 67 412 116; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 297 131 329 146">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 297 131 329 146">
+     <span class='ocr_line' id='line_1_22' title="bbox 297 131 329 146; baseline 0 0"><span class='ocrx_word' id='word_1_105' title='bbox 297 131 329 146; x_wconf 88' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 440 238 478 240">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 440 238 478 240">
+     <span class='ocr_line' id='line_1_23' title="bbox 440 238 478 240; baseline 0 541"><span class='ocrx_word' id='word_1_106' title='bbox 440 238 478 240; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 476 213 478 265">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 476 213 478 265">
+     <span class='ocr_line' id='line_1_24' title="bbox 476 213 478 265; baseline 0 516"><span class='ocrx_word' id='word_1_107' title='bbox 476 213 478 265; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 438 310 505 716">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 438 310 505 716">
+     <span class='ocr_line' id='line_1_25' title="bbox 448 310 494 345; baseline 0 436"><span class='ocrx_word' id='word_1_108' title='bbox 448 310 494 345; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 438 345 494 444; baseline 0.071 -55"><span class='ocrx_word' id='word_1_109' title='bbox 438 345 494 444; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 438 444 485 543; baseline 0 -50"><span class='ocrx_word' id='word_1_110' title='bbox 438 444 485 543; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 453 543 484 586; baseline 0 0"><span class='ocrx_word' id='word_1_111' title='bbox 453 543 484 586; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 462 643 505 716; baseline 0 0"><span class='ocrx_word' id='word_1_112' title='bbox 462 643 505 716; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 412 351 463 372">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 412 351 463 372">
+     <span class='ocr_line' id='line_1_30' title="bbox 412 351 463 372; baseline -0.02 -5"><span class='ocrx_word' id='word_1_113' title='bbox 412 351 434 367; x_wconf 82' lang='eng'>97</span> <span class='ocrx_word' id='word_1_114' title='bbox 440 357 463 372; x_wconf 74' lang='eng'>55</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 440 238 442 456">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 440 238 442 456">
+     <span class='ocr_line' id='line_1_31' title="bbox 440 238 442 456; baseline 0 325"><span class='ocrx_word' id='word_1_115' title='bbox 440 238 442 456; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 432 459 454 475">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 432 459 454 475">
+     <span class='ocr_line' id='line_1_32' title="bbox 432 459 454 475; baseline -0.045 0"><span class='ocrx_word' id='word_1_116' title='bbox 432 459 454 475; x_wconf 84' lang='eng'>97</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 436 543 455 558">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 436 543 455 558">
+     <span class='ocr_line' id='line_1_33' title="bbox 436 543 455 558; baseline 0 0"><span class='ocrx_word' id='word_1_117' title='bbox 436 543 455 558; x_wconf 86' lang='eng'>41</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 443 678 465 694">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 443 678 465 694">
+     <span class='ocr_line' id='line_1_34' title="bbox 443 678 465 694; baseline 0 0"><span class='ocrx_word' id='word_1_118' title='bbox 443 678 465 694; x_wconf 84' lang='eng'><em>64</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 0 153 2 762">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 0 153 2 762">
+     <span class='ocr_line' id='line_1_35' title="bbox 0 153 2 762; baseline 0 19"><span class='ocrx_word' id='word_1_119' title='bbox 0 153 2 762; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000901-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000901-0-000.pbm.png
new file mode 100644
index 00000000..580a06f1
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000901-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000901-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000901-0-000.pbm.png.hocr
new file mode 100644
index 00000000..fce2136e
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000901-0-000.pbm.png.hocr
@@ -0,0 +1,108 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000901-0-000.pbm.png"; bbox 0 0 1657 1258; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 10 2 707 49">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 10 2 707 49">
+     <span class='ocr_line' id='line_1_1' title="bbox 334 2 399 22; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 334 2 399 22; x_wconf 80' lang='eng'><em>0.05</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 10 30 707 49; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 10 30 707 49; x_wconf 93' lang='eng' dir='ltr'><em>I—l</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 17 88 1655 1256">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 17 88 1655 1256">
+     <span class='ocr_line' id='line_1_3' title="bbox 107 88 1287 123; baseline 0 -7"><span class='ocrx_word' id='word_1_3' title='bbox 107 105 132 122; x_wconf 66' lang='eng'><em>93</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 506 93 734 117; x_wconf 76' lang='eng' dir='ltr'><em>Antarctobacter</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 744 93 938 117; x_wconf 81' lang='eng' dir='ltr'><em>heliathermus</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 951 93 1023 117; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1040 88 1287 123; x_wconf 65' lang='eng' dir='ltr'>11445T(Y11552)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 577 126 1217 161; baseline 0.002 -7"><span class='ocrx_word' id='word_1_8' title='bbox 577 130 712 161; x_wconf 77' lang='eng' dir='ltr'><em>Sagiltula</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 722 130 833 155; x_wconf 79' lang='eng' dir='ltr'><em>stellata</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 842 131 932 155; x_wconf 85' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_11' title='bbox 944 126 1064 155; x_wconf 89' lang='eng' dir='ltr'><em>700073T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1075 131 1217 161; x_wconf 72' lang='eng' dir='ltr'>(US$356)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 121 163 1080 199; baseline 0 -7"><span class='ocrx_word' id='word_1_13' title='bbox 121 181 145 197; x_wconf 60' lang='eng'>57</span> <span class='ocrx_word' id='word_1_14' title='bbox 419 168 595 199; x_wconf 81' lang='eng' dir='ltr'><em>Donghicola</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 606 168 741 192; x_wconf 79' lang='eng' dir='ltr'><em>eburneus</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 753 163 882 192; x_wconf 85' lang='eng' dir='ltr'><em>SW—277T</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 893 169 1080 199; x_wconf 88' lang='eng' dir='ltr'>(DQ667965)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 452 201 1107 237; baseline 0 -7"><span class='ocrx_word' id='word_1_18' title='bbox 452 207 632 237; x_wconf 77' lang='eng' dir='ltr'><strong><em>Donghicola</em></strong></span> <span class='ocrx_word' id='word_1_19' title='bbox 640 207 832 230; x_wconf 81' lang='eng' dir='ltr'><strong><em>xiamenensis</em></strong></span> <span class='ocrx_word' id='word_1_20' title='bbox 842 201 907 230; x_wconf 80' lang='eng' dir='ltr'><em>Y-2T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 918 207 1107 236; x_wconf 88' lang='eng' dir='ltr'><em>(DQ120728)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 309 239 1371 274; baseline 0.001 -7"><span class='ocrx_word' id='word_1_22' title='bbox 309 256 334 272; x_wconf 74' lang='eng'>99</span> <span class='ocrx_word' id='word_1_23' title='bbox 686 245 849 268; x_wconf 76' lang='eng' dir='ltr'><em>Roseivivax</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 859 244 1027 268; x_wconf 77' lang='eng' dir='ltr'><em>halodurans</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1038 244 1104 268; x_wconf 85' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1120 239 1219 268; x_wconf 82' lang='eng' dir='ltr'><em>10272T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1230 244 1371 274; x_wconf 79' lang='eng' dir='ltr'>(D85829)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 632 277 1337 312; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 632 282 794 306; x_wconf 80' lang='eng' dir='ltr'><em>Roseivivax</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 804 281 993 306; x_wconf 78' lang='eng' dir='ltr'><em>halotolerans</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1004 282 1071 306; x_wconf 89' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_31' title='bbox 1086 282 1167 306; x_wconf 89' lang='eng'>10271</span> <span class='ocrx_word' id='word_1_32' title='bbox 1179 277 1185 288; x_wconf 45' lang='eng' dir='ltr'>F</span> <span class='ocrx_word' id='word_1_33' title='bbox 1195 282 1337 312; x_wconf 82' lang='eng' dir='ltr'>(D85831)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 164 315 1236 350; baseline 0 -7"><span class='ocrx_word' id='word_1_34' title='bbox 164 319 188 335; x_wconf 73' lang='eng'>79</span> <span class='ocrx_word' id='word_1_35' title='bbox 558 319 697 350; x_wconf 73' lang='eng' dir='ltr'><em>Salipiger</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 706 328 832 343; x_wconf 73' lang='eng' dir='ltr'><em>mucosus</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 842 320 918 343; x_wconf 87' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_38' title='bbox 930 315 1033 343; x_wconf 88' lang='eng' dir='ltr'><em>22090T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1052 319 1236 349; x_wconf 84' lang='eng' dir='ltr'>(AY527274)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 434 352 1308 388; baseline 0 -7"><span class='ocrx_word' id='word_1_40' title='bbox 434 358 595 388; x_wconf 79' lang='eng' dir='ltr'><em>Leisingera</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 606 357 915 388; x_wconf 77' lang='eng' dir='ltr'><em>methylohalidivorans</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 926 358 1001 381; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1015 352 1114 381; x_wconf 81' lang='eng' dir='ltr'><em>14336T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1124 358 1308 388; x_wconf 88' lang='eng' dir='ltr'>(AY005463)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 410 390 1081 426; baseline 0 -7"><span class='ocrx_word' id='word_1_45' title='bbox 410 395 602 419; x_wconf 79' lang='eng' dir='ltr'><em>Phaeobacter</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 609 395 808 426; x_wconf 77' lang='eng' dir='ltr'><em>gallaeciensis</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 818 390 925 419; x_wconf 77' lang='eng' dir='ltr'><em>B81071</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 939 395 1081 425; x_wconf 86' lang='eng' dir='ltr'>(Y13244)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 280 428 944 463; baseline -0.003 -5"><span class='ocrx_word' id='word_1_49' title='bbox 280 441 317 458; x_wconf 81' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 363 433 555 457; x_wconf 77' lang='eng' dir='ltr'><em>Phaeobacter</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 565 433 689 457; x_wconf 74' lang='eng' dir='ltr'><em>inhibens</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 700 428 750 457; x_wconf 72' lang='eng' dir='ltr'><em>TST</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 761 433 944 463; x_wconf 89' lang='eng' dir='ltr'>(AY177712)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 389 466 1058 501; baseline 0 -7"><span class='ocrx_word' id='word_1_54' title='bbox 389 471 561 494; x_wconf 78' lang='eng' dir='ltr'><em>Marinovum</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 571 470 693 501; x_wconf 80' lang='eng' dir='ltr'><em>algicola</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 702 471 792 494; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_57' title='bbox 804 466 906 494; x_wconf 52' lang='eng'>51440&quot;</span> <span class='ocrx_word' id='word_1_58' title='bbox 916 470 1058 501; x_wconf 82' lang='eng' dir='ltr'>(X78315)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 640 503 1431 539; baseline 0 -7"><span class='ocrx_word' id='word_1_59' title='bbox 640 508 810 532; x_wconf 79' lang='eng' dir='ltr'><em>Jannaschia</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 821 508 1046 539; x_wconf 73' lang='eng' dir='ltr'><em>helgalandensis</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1056 509 1131 532; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1146 509 1212 532; x_wconf 84' lang='eng'>1485</span> <span class='ocrx_word' id='word_1_63' title='bbox 1219 503 1245 532; x_wconf 67' lang='eng' dir='ltr'><em>ST</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1255 508 1361 539; x_wconf 87' lang='eng' dir='ltr'>(AJ438</span> <span class='ocrx_word' id='word_1_65' title='bbox 1369 509 1377 532; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 1385 508 1431 539; x_wconf 91' lang='eng'><em>57)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 692 541 1490 577; baseline -0.001 -7"><span class='ocrx_word' id='word_1_67' title='bbox 692 546 995 577; x_wconf 81' lang='eng' dir='ltr'><em>Ketogulonicigenium</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1007 546 1118 577; x_wconf 77' lang='eng' dir='ltr'><em>vulgare</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1130 546 1203 570; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1214 541 1490 576; x_wconf 47' lang='eng' dir='ltr'>40251(AF136849)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 665 579 1404 615; baseline 0 -7"><span class='ocrx_word' id='word_1_71' title='bbox 665 584 835 608; x_wconf 79' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 844 584 1011 615; x_wconf 72' lang='eng' dir='ltr'><em>gramzlosus</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1021 584 1096 608; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_74' title='bbox 1111 579 1206 608; x_wconf 52' lang='eng'>15982&quot;</span> <span class='ocrx_word' id='word_1_75' title='bbox 1220 584 1404 614; x_wconf 81' lang='eng' dir='ltr'>(AY424896)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 388 617 1359 652; baseline -0.001 -5"><span class='ocrx_word' id='word_1_76' title='bbox 388 630 413 647; x_wconf 82' lang='eng'><em>97</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 690 622 880 646; x_wconf 79' lang='eng' dir='ltr'><em>Roseisalinus</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 890 624 1058 646; x_wconf 74' lang='eng' dir='ltr'><em>antarcticus</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1070 617 1173 646; x_wconf 73' lang='eng' dir='ltr'><em>EL-SST</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1183 622 1359 652; x_wconf 81' lang='eng' dir='ltr'>(AJ605747)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 17 655 1655 690; baseline 0 -7"><span class='ocrx_word' id='word_1_81' title='bbox 17 660 26 677; x_wconf 77' lang='eng'>0</span> <span class='ocrx_word' id='word_1_82' title='bbox 931 659 1125 683; x_wconf 75' lang='eng' dir='ltr'><em>Rhodobacter</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1134 659 1294 690; x_wconf 76' lang='eng' dir='ltr'><em>capsulafus</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 1302 660 1392 683; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_85' title='bbox 1407 655 1504 683; x_wconf 91' lang='eng' dir='ltr'><em>11166T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1514 659 1655 690; x_wconf 86' lang='eng' dir='ltr'>(D16428)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 746 692 1576 728; baseline 0 -7"><span class='ocrx_word' id='word_1_87' title='bbox 746 697 1066 728; x_wconf 75' lang='eng' dir='ltr'><em>Marinasulfonomonas</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 1077 697 1293 728; x_wconf 77' lang='eng' dir='ltr'><em>methylotropha</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 1304 692 1424 721; x_wconf 83' lang='eng' dir='ltr'><em>PSCH4T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1434 697 1576 728; x_wconf 84' lang='eng' dir='ltr'>(U62894)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 743 730 1266 766; baseline -0.002 -7"><span class='ocrx_word' id='word_1_91' title='bbox 743 735 860 759; x_wconf 81' lang='eng' dir='ltr'><em>Nereida</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 872 737 970 766; x_wconf 83' lang='eng' dir='ltr'><em>ignava</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 981 730 1080 759; x_wconf 79' lang='eng' dir='ltr'><em>ZSM4T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1091 735 1266 765; x_wconf 80' lang='eng' dir='ltr'>(AJ748748)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 579 768 1310 803; baseline 0 -6"><span class='ocrx_word' id='word_1_95' title='bbox 579 773 784 797; x_wconf 74' lang='eng' dir='ltr'><em>Oceanihulbus</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 795 773 926 803; x_wconf 72' lang='eng' dir='ltr'><em>indoltfex</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 937 773 1010 797; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1025 768 1310 803; x_wconf 43' lang='eng' dir='ltr'>148621(A1550939)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 579 805 1214 841; baseline 0 -7"><span class='ocrx_word' id='word_1_99' title='bbox 579 810 688 841; x_wconf 78' lang='eng' dir='ltr'><em>Staleya</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 697 810 863 841; x_wconf 74' lang='eng' dir='ltr'><em>guttiformis</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 874 805 1214 841; x_wconf 68' lang='eng' dir='ltr'>DSM11458T(Y16427)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 592 843 1237 879; baseline -0.002 -7"><span class='ocrx_word' id='word_1_102' title='bbox 592 848 789 879; x_wconf 80' lang='eng' dir='ltr'><em>Sulfitobacter</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 798 848 886 872; x_wconf 82' lang='eng' dir='ltr'><em>brevis</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 898 848 971 872; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 987 843 1237 878; x_wconf 60' lang='eng' dir='ltr'>11443T(Y16425)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 266 881 1239 917; baseline 0 -7"><span class='ocrx_word' id='word_1_106' title='bbox 266 900 290 917; x_wconf 70' lang='eng'>68</span> <span class='ocrx_word' id='word_1_107' title='bbox 376 894 400 911; x_wconf 72' lang='eng'><em>53</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 537 881 1239 917; x_wconf 65' lang='eng' dir='ltr'><em>SulfitobacterpontiacusDSM10014T(Y13155)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 190 919 1324 955; baseline 0 -7"><span class='ocrx_word' id='word_1_109' title='bbox 190 938 214 955; x_wconf 71' lang='eng'><em>97</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 598 924 785 948; x_wconf 80' lang='eng' dir='ltr'><em>Raseobacter</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 794 924 985 955; x_wconf 67' lang='eng' dir='ltr'><em>denitrificarzs</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 997 924 1070 948; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 1082 919 1166 948; x_wconf 85' lang='eng' dir='ltr'><em>7001T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1176 924 1324 954; x_wconf 87' lang='eng' dir='ltr'>(M59063)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 390 957 1239 992; baseline -0.001 -5"><span class='ocrx_word' id='word_1_115' title='bbox 390 970 428 987; x_wconf 84' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 557 962 746 985; x_wconf 79' lang='eng' dir='ltr'><em>Roseobacler</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 755 962 874 985; x_wconf 77' lang='eng' dir='ltr'><em>liloralis</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 883 962 973 986; x_wconf 86' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_119' title='bbox 984 957 1087 986; x_wconf 85' lang='eng' dir='ltr'><em>49566T</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 1097 962 1239 992; x_wconf 84' lang='eng' dir='ltr'>(X78312)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 728 995 1442 1029; baseline 0 -6"><span class='ocrx_word' id='word_1_121' title='bbox 728 999 966 1023; x_wconf 79' lang='eng' dir='ltr'><em>Octadecabacter</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 975 1001 1094 1023; x_wconf 79' lang='eng' dir='ltr'><em>arcticus</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 1105 1000 1158 1023; x_wconf 81' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_124' title='bbox 1173 995 1442 1029; x_wconf 58' lang='eng' dir='ltr'>1067321(U73725)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 296 1032 1267 1068; baseline 0 -7"><span class='ocrx_word' id='word_1_125' title='bbox 296 1046 321 1062; x_wconf 76' lang='eng'><em>90</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 511 1037 706 1061; x_wconf 77' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 715 1032 1267 1068; x_wconf 73' lang='eng' dir='ltr'><em>gelatinovorusIAM12617T(D88523)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 170 1070 1254 1106; baseline -0.001 -7"><span class='ocrx_word' id='word_1_128' title='bbox 170 1087 191 1104; x_wconf 70' lang='eng'><em>61</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 484 1076 669 1099; x_wconf 72' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 679 1079 867 1099; x_wconf 70' lang='eng' dir='ltr'><em>crassostreae</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 878 1070 1063 1099; x_wconf 81' lang='eng' dir='ltr'><em>CV919-312r</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 1074 1075 1254 1106; x_wconf 83' lang='eng' dir='ltr'>(AF114484)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 442 1108 1211 1143; baseline 0 -7"><span class='ocrx_word' id='word_1_133' title='bbox 442 1113 627 1136; x_wconf 77' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 638 1112 819 1136; x_wconf 74' lang='eng' dir='ltr'><em>nubinhibens</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 830 1113 905 1136; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 920 1108 1015 1136; x_wconf 50' lang='eng'>15170&quot;</span> <span class='ocrx_word' id='word_1_137' title='bbox 1029 1113 1211 1143; x_wconf 84' lang='eng' dir='ltr'>(AF098495)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 474 1145 1138 1181; baseline -0.002 -7"><span class='ocrx_word' id='word_1_138' title='bbox 474 1151 657 1174; x_wconf 77' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 668 1150 790 1174; x_wconf 78' lang='eng' dir='ltr'><em>tolerans</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 800 1150 875 1174; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 891 1145 1138 1181; x_wconf 63' lang='eng' dir='ltr'>11457T(Y11551)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 378 1183 1001 1219; baseline 0 -7"><span class='ocrx_word' id='word_1_142' title='bbox 378 1189 514 1219; x_wconf 81' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 524 1183 1001 1219; x_wconf 67' lang='eng' dir='ltr'>atlanticaIAM14463T(D88526)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 206 1221 1205 1256; baseline 0 -6"><span class='ocrx_word' id='word_1_144' title='bbox 206 1235 243 1251; x_wconf 85' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 418 1226 594 1250; x_wconf 77' lang='eng' dir='ltr'><em>Silicibacter</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 604 1226 854 1250; x_wconf 76' lang='eng' dir='ltr'><em>lacuscaeru/ensis</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 865 1221 1205 1256; x_wconf 69' lang='eng' dir='ltr'>DSM11314T(U77644)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 209 379 233 396">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 209 379 233 396">
+     <span class='ocr_line' id='line_1_34' title="bbox 209 379 233 396; baseline 0 0"><span class='ocrx_word' id='word_1_148' title='bbox 209 379 233 396; x_wconf 81' lang='eng'>97</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 294 567 319 584">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 294 567 319 584">
+     <span class='ocr_line' id='line_1_35' title="bbox 294 567 319 584; baseline 0 0"><span class='ocrx_word' id='word_1_149' title='bbox 294 567 319 584; x_wconf 82' lang='eng'>.98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 238 796 339 815">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 238 796 339 815">
+     <span class='ocr_line' id='line_1_36' title="bbox 238 796 339 815; baseline 0.02 -2"><span class='ocrx_word' id='word_1_150' title='bbox 238 796 262 813; x_wconf 82' lang='eng'>60</span> <span class='ocrx_word' id='word_1_151' title='bbox 315 798 339 815; x_wconf 82' lang='eng'>82</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000935-0-005.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000935-0-005.pbm.png
new file mode 100644
index 00000000..3e93d074
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000935-0-005.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000935-0-005.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000935-0-005.pbm.png.hocr
new file mode 100644
index 00000000..1d947f3d
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000935-0-005.pbm.png.hocr
@@ -0,0 +1,478 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000935-0-005.pbm.png"; bbox 0 0 2012 1680; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 1 1381 132 1400">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 1 1381 132 1400">
+     <span class='ocr_line' id='line_1_1' title="bbox 1 1381 132 1400; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 1 1381 132 1400; x_wconf 87' lang='eng'>94/100/1.00</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 216 41 398 303">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 217 41 398 151">
+     <span class='ocr_line' id='line_1_2' title="bbox 217 41 398 60; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 217 46 235 60; x_wconf 89' lang='eng' dir='ltr'><em>a:</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 254 41 398 60; x_wconf 91' lang='eng'>100/100/1.00</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 218 72 370 91; baseline 0.007 -1"><span class='ocrx_word' id='word_1_4' title='bbox 218 72 235 91; x_wconf 87' lang='eng' dir='ltr'><em>b:</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 253 72 370 91; x_wconf 72' lang='eng'><em>79/64/098</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 217 102 368 121; baseline 0.007 -1"><span class='ocrx_word' id='word_1_6' title='bbox 217 107 234 121; x_wconf 90' lang='eng' dir='ltr'><em>c:</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 251 102 368 121; x_wconf 75' lang='eng'>73/65/099</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 217 132 308 151; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 217 132 235 151; x_wconf 90' lang='eng' dir='ltr'><em>d:</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 251 132 308 151; x_wconf 91' lang='eng'><strong>—/—/—</strong></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 216 162 370 211">
+     <span class='ocr_line' id='line_1_6' title="bbox 217 162 370 181; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 217 167 235 181; x_wconf 89' lang='eng' dir='ltr'><em>e:</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 252 162 370 181; x_wconf 82' lang='eng'>87/85/100</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 216 192 349 211; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 216 193 228 211; x_wconf 88' lang='eng' dir='ltr'>f:</span> <span class='ocrx_word' id='word_1_13' title='bbox 244 192 349 211; x_wconf 86' lang='eng'><em>—/57/0.99</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 217 223 363 247">
+     <span class='ocr_line' id='line_1_8' title="bbox 217 223 363 247; baseline 0.007 -6"><span class='ocrx_word' id='word_1_14' title='bbox 217 228 235 247; x_wconf 87' lang='eng' dir='ltr'><em>g:</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 245 223 363 242; x_wconf 75' lang='eng'><em>76/82/096</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 218 253 391 303">
+     <span class='ocr_line' id='line_1_9' title="bbox 218 253 391 272; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 218 253 235 272; x_wconf 90' lang='eng' dir='ltr'><em>h:</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 247 253 391 272; x_wconf 83' lang='eng'>100/100/100</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 218 283 361 303; baseline 0.007 -1"><span class='ocrx_word' id='word_1_18' title='bbox 218 283 227 302; x_wconf 90' lang='eng' dir='ltr'><em>i:</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 244 283 361 303; x_wconf 69' lang='eng'>76/75/073</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 686 389 918 416">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 686 389 918 416">
+     <span class='ocr_line' id='line_1_11' title="bbox 686 389 918 416; baseline 0 0"><span class='ocrx_word' id='word_1_20' title='bbox 686 397 791 416; x_wconf 67' lang='eng'><em>—/54/0,56</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 906 389 918 403; x_wconf 68' lang='eng' dir='ltr'>e</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 639 469 756 488">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 639 469 756 488">
+     <span class='ocr_line' id='line_1_12' title="bbox 639 469 756 488; baseline 0 0"><span class='ocrx_word' id='word_1_22' title='bbox 639 469 756 488; x_wconf 72' lang='eng'><em>61/54/062</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 495 526 625 545">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 495 526 625 545">
+     <span class='ocr_line' id='line_1_13' title="bbox 495 526 625 545; baseline 0 0"><span class='ocrx_word' id='word_1_23' title='bbox 495 526 625 545; x_wconf 24' lang='eng'>100/97/1‘00</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 419 659 537 678">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 419 659 537 678">
+     <span class='ocr_line' id='line_1_14' title="bbox 419 659 537 678; baseline 0 0"><span class='ocrx_word' id='word_1_24' title='bbox 419 659 498 678; x_wconf 85' lang='eng'><em>90/93/1</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 505 659 537 678; x_wconf 90' lang='eng'><em>.00</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 651 696 803 758">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 651 696 803 758">
+     <span class='ocr_line' id='line_1_15' title="bbox 698 696 803 715; baseline 0 0"><span class='ocrx_word' id='word_1_26' title='bbox 698 696 803 715; x_wconf 84' lang='eng'><em>—/64/0.67</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 651 739 769 758; baseline 0 0"><span class='ocrx_word' id='word_1_27' title='bbox 651 739 769 758; x_wconf 17' lang='eng'><em>92/87/1000</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 560 796 691 815">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 560 796 691 815">
+     <span class='ocr_line' id='line_1_17' title="bbox 560 796 691 815; baseline 0 0"><span class='ocrx_word' id='word_1_28' title='bbox 560 796 691 815; x_wconf 82' lang='eng'>97/100/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 339 874 456 893">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 339 874 456 893">
+     <span class='ocr_line' id='line_1_18' title="bbox 339 874 456 893; baseline 0 0"><span class='ocrx_word' id='word_1_29' title='bbox 339 874 417 893; x_wconf 86' lang='eng'>73/59/1</span> <span class='ocrx_word' id='word_1_30' title='bbox 424 874 456 893; x_wconf 93' lang='eng'>.00</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 271 1077 375 1096">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 271 1077 375 1096">
+     <span class='ocr_line' id='line_1_19' title="bbox 271 1077 375 1096; baseline 0 0"><span class='ocrx_word' id='word_1_31' title='bbox 271 1077 375 1096; x_wconf 87' lang='eng'><em>57/—/0.88</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 154 1255 254 1274">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 154 1255 254 1274">
+     <span class='ocr_line' id='line_1_20' title="bbox 154 1255 254 1274; baseline 0.01 -1"><span class='ocrx_word' id='word_1_32' title='bbox 154 1255 254 1274; x_wconf 83' lang='eng'><em>72/—/0.91</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 673 1007 817 1026">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 673 1007 817 1026">
+     <span class='ocr_line' id='line_1_21' title="bbox 673 1007 817 1026; baseline 0 0"><span class='ocrx_word' id='word_1_33' title='bbox 673 1007 817 1026; x_wconf 90' lang='eng'>100/100/1.00</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 818 15 1167 41">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 818 15 1167 41">
+     <span class='ocr_line' id='line_1_22' title="bbox 818 15 1167 41; baseline -0.006 -3"><span class='ocrx_word' id='word_1_34' title='bbox 818 21 936 40; x_wconf 67' lang='eng'>87/92/095</span> <span class='ocrx_word' id='word_1_35' title='bbox 959 15 1061 41; x_wconf 86' lang='eng' dir='ltr'><em>Colpoda</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1071 15 1167 36; x_wconf 82' lang='eng' dir='ltr'><em>cucuI/us</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 799 49 929 106">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 799 49 929 106">
+     <span class='ocr_line' id='line_1_23' title="bbox 799 49 929 68; baseline 0 0"><span class='ocrx_word' id='word_1_37' title='bbox 799 49 890 68; x_wconf 85' lang='eng'><em>100/99/1</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 897 49 929 68; x_wconf 92' lang='eng'>.00</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 803 87 893 106; baseline 0 0"><span class='ocrx_word' id='word_1_39' title='bbox 803 87 893 106; x_wconf 91' lang='eng'><em>—/—/0.54</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 973 50 1158 114">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 973 50 1158 114">
+     <span class='ocr_line' id='line_1_25' title="bbox 975 50 1158 77; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 975 50 1077 77; x_wconf 88' lang='eng' dir='ltr'><em>Colpoda</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 1086 51 1158 71; x_wconf 82' lang='eng' dir='ltr'><em>Iucida</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 973 88 1157 114; baseline 0 -5"><span class='ocrx_word' id='word_1_42' title='bbox 973 88 1075 114; x_wconf 89' lang='eng' dir='ltr'><em>Colpoda</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1084 88 1157 109; x_wconf 87' lang='eng' dir='ltr'><em>inﬂata</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 918 123 1152 149">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 918 123 1152 149">
+     <span class='ocr_line' id='line_1_27' title="bbox 918 123 1152 149; baseline 0 -5"><span class='ocrx_word' id='word_1_44' title='bbox 918 135 930 149; x_wconf 71' lang='eng' dir='ltr'>a</span> <span class='ocrx_word' id='word_1_45' title='bbox 957 123 1058 149; x_wconf 89' lang='eng' dir='ltr'><em>Colpoda</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1068 128 1152 149; x_wconf 89' lang='eng' dir='ltr'><em>magna</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 742 159 860 178">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 742 159 860 178">
+     <span class='ocr_line' id='line_1_28' title="bbox 742 159 860 178; baseline 0 0"><span class='ocrx_word' id='word_1_47' title='bbox 742 159 860 178; x_wconf 82' lang='eng'>87/92/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 957 160 1157 186">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 957 160 1157 186">
+     <span class='ocr_line' id='line_1_29' title="bbox 957 160 1157 186; baseline 0 -5"><span class='ocrx_word' id='word_1_48' title='bbox 957 160 1058 186; x_wconf 84' lang='eng' dir='ltr'><em>Colpoda</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1068 161 1157 181; x_wconf 90' lang='eng' dir='ltr'><em>minima</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 878 196 1240 260">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 878 196 1240 259">
+     <span class='ocr_line' id='line_1_30' title="bbox 912 196 1189 219; baseline 0 -3"><span class='ocrx_word' id='word_1_50' title='bbox 912 200 924 219; x_wconf 85' lang='eng' dir='ltr'>b</span> <span class='ocrx_word' id='word_1_51' title='bbox 988 196 1111 216; x_wconf 85' lang='eng' dir='ltr'><em>Bresslaua</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 1122 201 1189 216; x_wconf 89' lang='eng' dir='ltr'><em>vorax</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 878 232 1240 259; baseline -0.003 -5"><span class='ocrx_word' id='word_1_53' title='bbox 878 232 889 246; x_wconf 76' lang='eng' dir='ltr'>C</span> <span class='ocrx_word' id='word_1_54' title='bbox 999 233 1101 259; x_wconf 88' lang='eng' dir='ltr'><em>Colpoda</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 1110 233 1240 259; x_wconf 88' lang='eng' dir='ltr'><em>henneguyi</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 713 280 831 299">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 713 280 831 299">
+     <span class='ocr_line' id='line_1_32' title="bbox 713 280 831 299; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 713 280 831 299; x_wconf 69' lang='eng'><em>80/63/039</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 944 267 1244 290">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 944 268 1244 289">
+     <span class='ocr_line' id='line_1_33' title="bbox 944 268 1244 289; baseline 0.003 -1"><span class='ocrx_word' id='word_1_57' title='bbox 944 268 1104 289; x_wconf 87' lang='eng' dir='ltr'><em>Bresslauides</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1113 268 1244 289; x_wconf 89' lang='eng' dir='ltr'><em>discoideus</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 877 305 1312 368">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 877 306 1312 367">
+     <span class='ocr_line' id='line_1_34' title="bbox 928 306 1312 332; baseline 0 -5"><span class='ocrx_word' id='word_1_59' title='bbox 928 312 939 330; x_wconf 79' lang='eng' dir='ltr'>h</span> <span class='ocrx_word' id='word_1_60' title='bbox 1026 306 1199 332; x_wconf 85' lang='eng' dir='ltr'><em>Chain—forming</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1210 306 1312 332; x_wconf 89' lang='eng' dir='ltr'><em>colpodid</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 877 341 1213 367; baseline -0.006 -4"><span class='ocrx_word' id='word_1_62' title='bbox 877 347 888 366; x_wconf 79' lang='eng' dir='ltr'>d</span> <span class='ocrx_word' id='word_1_63' title='bbox 1030 341 1131 367; x_wconf 88' lang='eng' dir='ltr'><em>Colpoda</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1140 341 1213 362; x_wconf 88' lang='eng' dir='ltr'><em>steinii</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 810 433 866 452">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 810 433 866 452">
+     <span class='ocr_line' id='line_1_36' title="bbox 810 433 866 452; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 810 433 866 452; x_wconf 89' lang='eng'>_/_/_</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 886 377 1294 476">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 886 378 1294 475">
+     <span class='ocr_line' id='line_1_37' title="bbox 974 378 1294 405; baseline 0 -6"><span class='ocrx_word' id='word_1_66' title='bbox 974 378 1187 405; x_wconf 83' lang='eng' dir='ltr'><em>Mykophagophrys</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 1196 378 1294 399; x_wconf 85' lang='eng' dir='ltr'><em>terricola</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 958 413 1267 440; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 958 413 1197 440; x_wconf 83' lang='eng' dir='ltr'><em>Pseudop/atyoph/ya</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1206 419 1267 434; x_wconf 90' lang='eng' dir='ltr'><em>nana</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 886 448 1164 475; baseline 0 -6"><span class='ocrx_word' id='word_1_70' title='bbox 886 455 894 473; x_wconf 90' lang='eng' dir='ltr'>f</span> <span class='ocrx_word' id='word_1_71' title='bbox 968 448 1070 475; x_wconf 88' lang='eng' dir='ltr'><em>Colpoda</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1080 454 1164 475; x_wconf 86' lang='eng' dir='ltr'><em>aspera</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 1414 397 1727 435">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 1414 397 1727 435">
+     <span class='ocr_line' id='line_1_40' title="bbox 1414 397 1727 435; baseline -0.003 -8"><span class='ocrx_word' id='word_1_73' title='bbox 1414 397 1727 435; x_wconf 89' lang='eng' dir='ltr'><em>Grossglockneriida</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 998 485 1308 508">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 998 486 1308 507">
+     <span class='ocr_line' id='line_1_41' title="bbox 998 486 1308 507; baseline 0.003 -1"><span class='ocrx_word' id='word_1_74' title='bbox 998 486 1182 507; x_wconf 88' lang='eng' dir='ltr'><em>Hausmanniella</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 1191 486 1308 507; x_wconf 86' lang='eng' dir='ltr'><em>discoidea</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 928 521 1117 547">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 928 521 1117 547">
+     <span class='ocr_line' id='line_1_42' title="bbox 928 521 1117 547; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 928 521 1003 542; x_wconf 88' lang='eng' dir='ltr'><em>I/siella</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1012 521 1117 547; x_wconf 85' lang='eng' dir='ltr'><em>palustris</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 876 558 1228 586">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 876 559 1228 585">
+     <span class='ocr_line' id='line_1_43' title="bbox 876 559 1228 585; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 876 559 1002 579; x_wconf 85' lang='eng' dir='ltr'><em>Notoxoma</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1010 559 1228 585; x_wconf 86' lang='eng' dir='ltr'><em>parabryoph/yides</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 822 594 1051 620">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 822 594 1051 620">
+     <span class='ocr_line' id='line_1_44' title="bbox 822 594 1051 620; baseline 0 -5"><span class='ocrx_word' id='word_1_80' title='bbox 822 594 951 615; x_wconf 87' lang='eng' dir='ltr'><em>Barde/ie/Ia</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 959 594 1051 620; x_wconf 88' lang='eng' dir='ltr'><em>pu/chra</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 810 631 1166 657">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 810 631 1166 657">
+     <span class='ocr_line' id='line_1_45' title="bbox 810 631 1166 657; baseline -0.006 -3"><span class='ocrx_word' id='word_1_82' title='bbox 810 638 927 657; x_wconf 62' lang='eng'>89/75/099</span> <span class='ocrx_word' id='word_1_83' title='bbox 959 631 1166 652; x_wconf 84' lang='eng' dir='ltr'><em>HAVOmat-euk43</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 757 665 1059 687">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 757 665 1059 687">
+     <span class='ocr_line' id='line_1_46' title="bbox 757 665 1059 687; baseline 0.013 -3"><span class='ocrx_word' id='word_1_84' title='bbox 757 665 901 684; x_wconf 89' lang='eng'>100/100/1.00</span> <span class='ocrx_word' id='word_1_85' title='bbox 972 667 1059 687; x_wconf 83' lang='eng' dir='ltr'><em>LKM53</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 881 739 1065 760">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 881 739 1065 760">
+     <span class='ocr_line' id='line_1_47' title="bbox 881 739 1065 760; baseline 0 0"><span class='ocrx_word' id='word_1_86' title='bbox 881 739 1065 760; x_wconf 92' lang='eng' dir='ltr'>PAA1OAU2004</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 803 776 1324 947">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 905 776 1267 803">
+     <span class='ocr_line' id='line_1_48' title="bbox 905 776 1267 803; baseline 0 -6"><span class='ocrx_word' id='word_1_87' title='bbox 905 776 1073 803; x_wconf 85' lang='eng' dir='ltr'><em>Cyrtolophosis</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 1082 777 1191 797; x_wconf 88' lang='eng' dir='ltr'><em>mucicola</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 1200 777 1267 797; x_wconf 88' lang='eng' dir='ltr'><em>Brazil</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 912 811 1291 838">
+     <span class='ocr_line' id='line_1_49' title="bbox 912 811 1291 838; baseline 0 -6"><span class='ocrx_word' id='word_1_90' title='bbox 912 811 1080 838; x_wconf 80' lang='eng' dir='ltr'><em>Cyrtolophosis</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1089 812 1198 832; x_wconf 86' lang='eng' dir='ltr'><em>mucicola</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1205 812 1291 832; x_wconf 87' lang='eng' dir='ltr'><em>Austria</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 803 846 1324 873">
+     <span class='ocr_line' id='line_1_50' title="bbox 803 846 1324 873; baseline 0 -6"><span class='ocrx_word' id='word_1_93' title='bbox 803 855 814 873; x_wconf 76' lang='eng' dir='ltr'>h</span> <span class='ocrx_word' id='word_1_94' title='bbox 916 846 1107 867; x_wconf 86' lang='eng' dir='ltr'><em>Aristerostoma</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 1115 851 1153 872; x_wconf 87' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 1163 846 1237 867; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 1248 846 1324 867; x_wconf 84' lang='eng'><em>50986</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 947 885 1263 946">
+     <span class='ocr_line' id='line_1_51' title="bbox 947 885 1263 906; baseline 0 0"><span class='ocrx_word' id='word_1_98' title='bbox 947 885 1137 906; x_wconf 86' lang='eng' dir='ltr'><em>Aristerostoma</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1146 885 1263 906; x_wconf 90' lang='eng' dir='ltr'><em>marinum</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 967 920 1163 946; baseline 0 -6"><span class='ocrx_word' id='word_1_100' title='bbox 967 920 1070 940; x_wconf 89' lang='eng' dir='ltr'><em>Bursaria</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 1078 925 1112 946; x_wconf 89' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 1123 920 1136 940; x_wconf 90' lang='eng'>2</span> <span class='ocrx_word' id='word_1_103' title='bbox 1144 920 1163 940; x_wconf 97' lang='eng' dir='ltr'>A</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 722 814 866 833">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 722 814 866 833">
+     <span class='ocr_line' id='line_1_53' title="bbox 722 814 866 833; baseline 0 -1"><span class='ocrx_word' id='word_1_104' title='bbox 722 814 866 833; x_wconf 89' lang='eng'>100/100/1.00</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 756 926 873 945">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 756 926 873 945">
+     <span class='ocr_line' id='line_1_54' title="bbox 756 926 873 945; baseline 0 0"><span class='ocrx_word' id='word_1_105' title='bbox 756 926 873 945; x_wconf 79' lang='eng'>80/91/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 743 957 1097 983">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 743 957 1097 983">
+     <span class='ocr_line' id='line_1_55' title="bbox 743 957 1097 983; baseline -0.011 0"><span class='ocrx_word' id='word_1_106' title='bbox 743 964 861 983; x_wconf 78' lang='eng'>94/92/100</span> <span class='ocrx_word' id='word_1_107' title='bbox 902 957 1004 978; x_wconf 81' lang='eng' dir='ltr'><em>Bursaria</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1012 962 1046 983; x_wconf 86' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 1057 957 1071 978; x_wconf 91' lang='eng'><em>2</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 1082 957 1097 978; x_wconf 92' lang='eng' dir='ltr'>B</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 916 992 1083 1018">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 916 992 1083 1018">
+     <span class='ocr_line' id='line_1_56' title="bbox 916 992 1083 1018; baseline 0 -5"><span class='ocrx_word' id='word_1_111' title='bbox 916 992 1019 1013; x_wconf 83' lang='eng' dir='ltr'><em>Bursaria</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 1028 997 1062 1018; x_wconf 90' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 1075 992 1083 1013; x_wconf 94' lang='eng'><em>1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 979 703 1387 731">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 979 704 1387 730">
+     <span class='ocr_line' id='line_1_57' title="bbox 979 704 1387 730; baseline 0 -5"><span class='ocrx_word' id='word_1_114' title='bbox 979 704 1264 730; x_wconf 85' lang='eng' dir='ltr'><em>Pseudocyrtolophosis</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1272 704 1387 730; x_wconf 87' lang='eng' dir='ltr'><em>alpestris</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 1396 556 1622 593">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 1396 556 1622 593">
+     <span class='ocr_line' id='line_1_58' title="bbox 1396 556 1622 593; baseline -0.013 -5"><span class='ocrx_word' id='word_1_116' title='bbox 1396 556 1404 588; x_wconf 99' lang='eng' dir='ltr'>I</span> <span class='ocrx_word' id='word_1_117' title='bbox 1415 556 1622 593; x_wconf 89' lang='eng' dir='ltr'><em>Bryophryida</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 1414 752 1726 789">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 1414 752 1726 789">
+     <span class='ocr_line' id='line_1_59' title="bbox 1414 752 1726 789; baseline 0 -8"><span class='ocrx_word' id='word_1_118' title='bbox 1414 752 1706 789; x_wconf 89' lang='eng' dir='ltr'><em>Cyrtolophosidida</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 1722 752 1726 781; x_wconf 99' lang='eng'><strong><em>|</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 1415 967 1723 1004">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 1415 967 1723 1004">
+     <span class='ocr_line' id='line_1_60' title="bbox 1415 967 1723 1004; baseline 0 -8"><span class='ocrx_word' id='word_1_120' title='bbox 1415 967 1723 1004; x_wconf 89' lang='eng' dir='ltr'><em>Bursariomorphida</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 909 1030 1149 1050">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 909 1030 1149 1050">
+     <span class='ocr_line' id='line_1_61' title="bbox 909 1030 1149 1050; baseline 0 0"><span class='ocrx_word' id='word_1_121' title='bbox 909 1030 1012 1050; x_wconf 88' lang='eng' dir='ltr'><em>Bursaria</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 1022 1030 1149 1050; x_wconf 82' lang='eng' dir='ltr'><em>truncate/Ia</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 615 1050 719 1069">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 615 1050 719 1069">
+     <span class='ocr_line' id='line_1_62' title="bbox 615 1050 719 1069; baseline 0 0"><span class='ocrx_word' id='word_1_123' title='bbox 615 1050 719 1069; x_wconf 87' lang='eng'><em>—/62/0.92</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 518 1086 662 1105">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 518 1086 662 1105">
+     <span class='ocr_line' id='line_1_63' title="bbox 518 1086 662 1105; baseline 0 0"><span class='ocrx_word' id='word_1_124' title='bbox 518 1086 662 1105; x_wconf 93' lang='eng'>100/100/1.00</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 448 1180 704 1301">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 448 1180 704 1301">
+     <span class='ocr_line' id='line_1_64' title="bbox 558 1180 701 1199; baseline 0 0"><span class='ocrx_word' id='word_1_125' title='bbox 558 1180 701 1199; x_wconf 29' lang='eng'>100/100/1‘00</span> 
+     </span>
+     <span class='ocr_line' id='line_1_65' title="bbox 542 1216 659 1235; baseline 0 0"><span class='ocrx_word' id='word_1_126' title='bbox 542 1216 659 1235; x_wconf 72' lang='eng'><em>87/76/080</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_66' title="bbox 693 1251 704 1270; baseline 0 0"><span class='ocrx_word' id='word_1_127' title='bbox 693 1251 704 1270; x_wconf 95' lang='eng' dir='ltr'>h</span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 448 1282 592 1301; baseline 0 0"><span class='ocrx_word' id='word_1_128' title='bbox 448 1282 592 1301; x_wconf 90' lang='eng'>100/100/1.00</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 892 1065 1404 1092">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 892 1065 1404 1091">
+     <span class='ocr_line' id='line_1_68' title="bbox 892 1065 1404 1091; baseline 0.004 -6"><span class='ocrx_word' id='word_1_129' title='bbox 892 1065 1057 1091; x_wconf 79' lang='eng' dir='ltr'><em>B/yometopus</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 1066 1065 1168 1091; x_wconf 85' lang='eng' dir='ltr'><em>atypicus</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 1396 1067 1404 1082; x_wconf 95' lang='eng' dir='ltr'><strong>I</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 838 1102 1207 1129">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 838 1102 1207 1128">
+     <span class='ocr_line' id='line_1_69' title="bbox 838 1102 1207 1128; baseline 0 -5"><span class='ocrx_word' id='word_1_132' title='bbox 838 1102 1003 1128; x_wconf 85' lang='eng' dir='ltr'><em>Bryometopus</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 1010 1102 1207 1128; x_wconf 83' lang='eng' dir='ltr'><em>pseudochilodon</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 712 1137 1052 1382">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 712 1137 1052 1382">
+     <span class='ocr_line' id='line_1_70' title="bbox 742 1137 1014 1164; baseline 0 -6"><span class='ocrx_word' id='word_1_134' title='bbox 742 1137 907 1164; x_wconf 83' lang='eng' dir='ltr'><em>Bryometopus</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 915 1137 1014 1163; x_wconf 87' lang='eng' dir='ltr'><em>sphagni</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 736 1174 1009 1201; baseline 0 -6"><span class='ocrx_word' id='word_1_136' title='bbox 736 1174 877 1201; x_wconf 81' lang='eng' dir='ltr'><em>Ottowph/ya</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 887 1175 1009 1201; x_wconf 83' lang='eng' dir='ltr'><em>dragescoi</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_72' title="bbox 745 1210 1052 1236; baseline 0 -5"><span class='ocrx_word' id='word_1_138' title='bbox 745 1210 865 1236; x_wconf 86' lang='eng' dir='ltr'><em>Sorogena</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 874 1210 1052 1231; x_wconf 87' lang='eng' dir='ltr'><em>stoianovitchae</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_73' title="bbox 749 1245 938 1272; baseline 0 -6"><span class='ocrx_word' id='word_1_140' title='bbox 749 1245 896 1272; x_wconf 85' lang='eng' dir='ltr'><em>Platyophrya</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 903 1250 938 1271; x_wconf 83' lang='eng' dir='ltr'><em>sp.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_74' title="bbox 785 1283 1009 1309; baseline 0 -6"><span class='ocrx_word' id='word_1_142' title='bbox 785 1283 931 1309; x_wconf 87' lang='eng' dir='ltr'><em>Platyophrya</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 942 1288 1009 1303; x_wconf 83' lang='eng' dir='ltr'><em>vorax</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_75' title="bbox 715 1317 873 1344; baseline -0.006 -5"><span class='ocrx_word' id='word_1_144' title='bbox 715 1317 831 1344; x_wconf 85' lang='eng' dir='ltr'><em>Sagittaria</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 839 1323 873 1344; x_wconf 91' lang='eng' dir='ltr'><em>sp.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_76' title="bbox 712 1355 954 1382; baseline 0 -6"><span class='ocrx_word' id='word_1_146' title='bbox 712 1355 910 1382; x_wconf 83' lang='eng' dir='ltr'><em>PIatyophrya-Iike</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 919 1360 954 1381; x_wconf 87' lang='eng' dir='ltr'><em>sp.</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 531 1382 897 1417">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 531 1382 897 1417">
+     <span class='ocr_line' id='line_1_77' title="bbox 531 1382 897 1417; baseline 0 -16"><span class='ocrx_word' id='word_1_148' title='bbox 531 1382 675 1401; x_wconf 77' lang='eng'>100/100/100</span> <span class='ocrx_word' id='word_1_149' title='bbox 702 1390 854 1417; x_wconf 65' lang='eng' dir='ltr'><em>Rostmphyra</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 863 1395 897 1416; x_wconf 71' lang='eng' dir='ltr'><em>sp_</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 335 1431 452 1450">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 335 1431 452 1450">
+     <span class='ocr_line' id='line_1_78' title="bbox 335 1431 452 1450; baseline 0 0"><span class='ocrx_word' id='word_1_151' title='bbox 335 1431 452 1450; x_wconf 78' lang='eng'>96/82/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 224 1506 342 1525">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 224 1506 342 1525">
+     <span class='ocr_line' id='line_1_79' title="bbox 224 1506 342 1525; baseline 0 0"><span class='ocrx_word' id='word_1_152' title='bbox 224 1506 303 1525; x_wconf 82' lang='eng'>99/75/1</span> <span class='ocrx_word' id='word_1_153' title='bbox 310 1506 342 1525; x_wconf 91' lang='eng'><em>.00</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 136 1650 358 1677">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 136 1650 358 1677">
+     <span class='ocr_line' id='line_1_80' title="bbox 136 1650 358 1677; baseline 0 -6"><span class='ocrx_word' id='word_1_154' title='bbox 136 1662 201 1666; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_155' title='bbox 217 1650 244 1671; x_wconf 94' lang='eng'>10</span> <span class='ocrx_word' id='word_1_156' title='bbox 254 1650 358 1677; x_wconf 86' lang='eng' dir='ltr'><em>changes</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 705 1428 997 1454">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 705 1428 997 1454">
+     <span class='ocr_line' id='line_1_81' title="bbox 705 1428 997 1454; baseline 0 -6"><span class='ocrx_word' id='word_1_157' title='bbox 705 1428 844 1454; x_wconf 84' lang='eng' dir='ltr'><em>Furgasonia</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 853 1428 997 1448; x_wconf 86' lang='eng' dir='ltr'><em>blochmanni</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 689 1462 960 1489">
+    <p class='ocr_par' dir='ltr' id='par_1_60' title="bbox 689 1462 960 1489">
+     <span class='ocr_line' id='line_1_82' title="bbox 689 1462 960 1489; baseline -0.004 -5"><span class='ocrx_word' id='word_1_159' title='bbox 689 1462 827 1484; x_wconf 78' lang='eng' dir='ltr'><em>Obe/trumia</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 836 1463 960 1489; x_wconf 82' lang='eng' dir='ltr'><em>georgiana</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 421 1573 697 1629">
+    <p class='ocr_par' dir='ltr' id='par_1_61' title="bbox 421 1573 697 1629">
+     <span class='ocr_line' id='line_1_83' title="bbox 535 1573 697 1599; baseline 0 -5"><span class='ocrx_word' id='word_1_161' title='bbox 535 1573 620 1599; x_wconf 89' lang='eng' dir='ltr'><em>Coleps</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 629 1573 697 1594; x_wconf 85' lang='eng' dir='ltr'><em>hirtus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_84' title="bbox 421 1608 606 1629; baseline 0 0"><span class='ocrx_word' id='word_1_163' title='bbox 421 1608 535 1629; x_wconf 87' lang='eng' dir='ltr'><em>Prorodon</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 545 1609 606 1629; x_wconf 81' lang='eng' dir='ltr'><em>teres</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 714 1500 1105 1557">
+    <p class='ocr_par' dir='ltr' id='par_1_62' title="bbox 714 1500 1105 1557">
+     <span class='ocr_line' id='line_1_85' title="bbox 784 1500 1105 1527; baseline 0 -6"><span class='ocrx_word' id='word_1_165' title='bbox 784 1500 941 1521; x_wconf 69' lang='eng' dir='ltr'><em>OrthodoneI/a</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 951 1501 1105 1527; x_wconf 86' lang='eng' dir='ltr'><em>apohamatus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_86' title="bbox 714 1536 1046 1557; baseline 0 -1"><span class='ocrx_word' id='word_1_167' title='bbox 714 1536 956 1557; x_wconf 83' lang='eng' dir='ltr'><em>Pseudomicrothorax</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 964 1536 1046 1557; x_wconf 82' lang='eng' dir='ltr'><em>dub/us</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 1396 1096 1655 1140">
+    <p class='ocr_par' dir='ltr' id='par_1_63' title="bbox 1396 1096 1655 1140">
+     <span class='ocr_line' id='line_1_87' title="bbox 1396 1096 1655 1140; baseline 0.004 -10"><span class='ocrx_word' id='word_1_169' title='bbox 1396 1096 1655 1140; x_wconf 79' lang='eng' dir='ltr'><em>:Bryometopida</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_58' title="bbox 1414 1191 1613 1229">
+    <p class='ocr_par' dir='ltr' id='par_1_64' title="bbox 1414 1191 1613 1229">
+     <span class='ocr_line' id='line_1_88' title="bbox 1414 1191 1613 1229; baseline 0 -8"><span class='ocrx_word' id='word_1_170' title='bbox 1414 1191 1613 1229; x_wconf 89' lang='eng' dir='ltr'><em>Sorogenida</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_59' title="bbox 1396 1300 1737 1372">
+    <p class='ocr_par' dir='ltr' id='par_1_65' title="bbox 1396 1300 1737 1372">
+     <span class='ocr_line' id='line_1_89' title="bbox 1396 1300 1737 1354; baseline 0.003 -10"><span class='ocrx_word' id='word_1_171' title='bbox 1396 1300 1706 1354; x_wconf 77' lang='eng' dir='ltr'><em>:Cyrtolophosidida</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 1722 1317 1737 1345; x_wconf 98' lang='eng' dir='ltr'><strong><em>II</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_90' title="bbox 1396 1357 1404 1372; baseline 0 0"><span class='ocrx_word' id='word_1_173' title='bbox 1396 1357 1404 1372; x_wconf 99' lang='eng' dir='ltr'><strong>I</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_60' title="bbox 1126 1428 1454 1559">
+    <p class='ocr_par' dir='ltr' id='par_1_66' title="bbox 1126 1428 1454 1558">
+     <span class='ocr_line' id='line_1_91' title="bbox 1126 1428 1133 1443; baseline 0 0"><span class='ocrx_word' id='word_1_174' title='bbox 1126 1428 1133 1443; x_wconf 98' lang='eng' dir='ltr'><strong>I</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_92' title="bbox 1126 1481 1454 1529; baseline -0.003 -18"><span class='ocrx_word' id='word_1_175' title='bbox 1126 1485 1133 1529; x_wconf 78' lang='eng'><strong>:</strong></span> <span class='ocrx_word' id='word_1_176' title='bbox 1150 1481 1454 1511; x_wconf 90' lang='eng' dir='ltr'><em>NASSOPHOREA</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_93' title="bbox 1126 1543 1133 1558; baseline 0 0"><span class='ocrx_word' id='word_1_177' title='bbox 1126 1543 1133 1558; x_wconf 98' lang='eng' dir='ltr'><strong>I</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_61' title="bbox 1150 1587 1448 1619">
+    <p class='ocr_par' dir='ltr' id='par_1_67' title="bbox 1150 1588 1448 1618">
+     <span class='ocr_line' id='line_1_94' title="bbox 1150 1588 1448 1618; baseline 0 0"><span class='ocrx_word' id='word_1_178' title='bbox 1150 1588 1448 1618; x_wconf 90' lang='eng' dir='ltr'><em>PROSTOMATEA</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_62' title="bbox 1761 270 1936 307">
+    <p class='ocr_par' dir='ltr' id='par_1_68' title="bbox 1761 270 1936 307">
+     <span class='ocr_line' id='line_1_95' title="bbox 1761 270 1936 307; baseline 0 -8"><span class='ocrx_word' id='word_1_179' title='bbox 1761 270 1936 307; x_wconf 89' lang='eng' dir='ltr'><em>Colpodida</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_63' title="bbox 1977 571 2007 790">
+    <p class='ocr_par' dir='ltr' id='par_1_69' title="bbox 1977 571 2007 790">
+     <span class='ocr_line' id='line_1_96' title="bbox 1977 571 2007 790; textangle 90"><span class='ocrx_word' id='word_1_180' title='bbox 1977 571 2007 790; x_wconf 59' lang='eng' dir='ltr'><em>VEIGOd‘IOO</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000943-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000943-0-000.pbm.png
new file mode 100644
index 00000000..b978a8ee
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000943-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000943-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000943-0-000.pbm.png.hocr
new file mode 100644
index 00000000..349b433e
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000943-0-000.pbm.png.hocr
@@ -0,0 +1,360 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000943-0-000.pbm.png"; bbox 0 0 1243 989; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 35 116 71 136">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 35 116 71 136">
+     <span class='ocr_line' id='line_1_1' title="bbox 35 116 71 136; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 35 116 71 136; x_wconf 88' lang='eng'><em>2%</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 320 69 363 90">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 320 69 363 90">
+     <span class='ocr_line' id='line_1_2' title="bbox 320 69 363 90; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 320 69 363 90; x_wconf 91' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 364 10 407 31">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 364 10 407 31">
+     <span class='ocr_line' id='line_1_3' title="bbox 364 10 407 31; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 364 10 407 31; x_wconf 89' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 415 5 1222 32">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 415 5 1222 32">
+     <span class='ocr_line' id='line_1_4' title="bbox 415 5 1222 32; baseline 0.001 -6"><span class='ocrx_word' id='word_1_4' title='bbox 415 14 440 16; x_wconf 82' lang='eng'><em>—</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 448 5 612 27; x_wconf 86' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 622 5 862 27; x_wconf 86' lang='eng' dir='ltr'><em>dechloracetivorans</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 870 5 947 27; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 957 5 1063 27; x_wconf 85' lang='eng' dir='ltr'><em>700912T</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 1073 5 1222 32; x_wconf 90' lang='eng' dir='ltr'><em>(AF230530)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 368 43 418 45">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 368 43 418 45">
+     <span class='ocr_line' id='line_1_5' title="bbox 368 43 418 45; baseline 0 944"><span class='ocrx_word' id='word_1_10' title='bbox 368 43 418 45; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 329 94 373 96">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 329 94 373 96">
+     <span class='ocr_line' id='line_1_6' title="bbox 329 94 373 96; baseline 0 893"><span class='ocrx_word' id='word_1_11' title='bbox 329 94 373 96; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 296 143 326 164">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 296 143 326 164">
+     <span class='ocr_line' id='line_1_7' title="bbox 296 143 326 164; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 296 143 326 164; x_wconf 88' lang='eng'><strong>88</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 305 175 333 176">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 305 175 333 176">
+     <span class='ocr_line' id='line_1_8' title="bbox 305 175 333 176; baseline 0 813"><span class='ocrx_word' id='word_1_13' title='bbox 305 175 333 176; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 329 94 331 252">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 329 94 331 252">
+     <span class='ocr_line' id='line_1_9' title="bbox 329 94 331 252; baseline 0 737"><span class='ocrx_word' id='word_1_14' title='bbox 329 94 331 252; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 329 250 346 252">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 329 250 346 252">
+     <span class='ocr_line' id='line_1_10' title="bbox 329 250 346 252; baseline 0 737"><span class='ocrx_word' id='word_1_15' title='bbox 329 250 346 252; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 266 261 393 282">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 266 261 393 282">
+     <span class='ocr_line' id='line_1_11' title="bbox 266 261 393 282; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 266 261 296 282; x_wconf 94' lang='eng'>50</span> <span class='ocrx_word' id='word_1_17' title='bbox 349 261 393 282; x_wconf 94' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 291 285 308 286">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 291 285 308 286">
+     <span class='ocr_line' id='line_1_12' title="bbox 291 285 308 286; baseline 0 703"><span class='ocrx_word' id='word_1_18' title='bbox 291 285 308 286; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 344 204 346 298">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 344 204 346 298">
+     <span class='ocr_line' id='line_1_13' title="bbox 344 204 346 298; baseline 0 691"><span class='ocrx_word' id='word_1_19' title='bbox 344 204 346 298; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 368 43 370 142">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 368 43 370 142">
+     <span class='ocr_line' id='line_1_14' title="bbox 368 43 370 142; baseline 0 847"><span class='ocrx_word' id='word_1_20' title='bbox 368 43 370 142; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 346 204 452 206">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 346 204 452 206">
+     <span class='ocr_line' id='line_1_15' title="bbox 346 204 452 206; baseline 0 783"><span class='ocrx_word' id='word_1_21' title='bbox 346 204 452 206; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 413 14 415 78">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 413 14 415 78">
+     <span class='ocr_line' id='line_1_16' title="bbox 413 14 415 78; baseline 0 911"><span class='ocrx_word' id='word_1_22' title='bbox 413 14 415 78; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 344 297 410 298">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 344 297 410 298">
+     <span class='ocr_line' id='line_1_17' title="bbox 344 297 410 298; baseline 0 691"><span class='ocrx_word' id='word_1_23' title='bbox 344 297 410 298; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 252 352 281 373">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 252 352 281 373">
+     <span class='ocr_line' id='line_1_18' title="bbox 252 352 281 373; baseline 0 0"><span class='ocrx_word' id='word_1_24' title='bbox 252 352 281 373; x_wconf 91' lang='eng'><em>77</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 267 387 294 388">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 267 387 294 388">
+     <span class='ocr_line' id='line_1_19' title="bbox 267 387 294 388; baseline 0 601"><span class='ocrx_word' id='word_1_25' title='bbox 267 387 294 388; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 305 174 307 396">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 305 174 307 396">
+     <span class='ocr_line' id='line_1_20' title="bbox 305 174 307 396; baseline 0 593"><span class='ocrx_word' id='word_1_26' title='bbox 305 174 307 396; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 291 284 293 489">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 291 284 293 489">
+     <span class='ocr_line' id='line_1_21' title="bbox 291 284 293 489; baseline 0 500"><span class='ocrx_word' id='word_1_27' title='bbox 291 284 293 489; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 404 268 406 332">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 404 268 406 332">
+     <span class='ocr_line' id='line_1_22' title="bbox 404 268 406 332; baseline 0 657"><span class='ocrx_word' id='word_1_28' title='bbox 404 268 406 332; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 364 456 407 477">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 364 456 407 477">
+     <span class='ocr_line' id='line_1_23' title="bbox 364 456 407 477; baseline 0 0"><span class='ocrx_word' id='word_1_29' title='bbox 364 456 407 477; x_wconf 90' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 415 65 1099 92">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 415 65 1099 92">
+     <span class='ocr_line' id='line_1_24' title="bbox 415 65 1099 92; baseline 0.001 -6"><span class='ocrx_word' id='word_1_30' title='bbox 415 77 446 78; x_wconf 36' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 456 65 625 87; x_wconf 81' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 635 65 812 87; x_wconf 87' lang='eng' dir='ltr'><em>caledoniensis’</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 823 65 900 87; x_wconf 90' lang='eng' dir='ltr'>SEBR</span> <span class='ocrx_word' id='word_1_34' title='bbox 909 65 971 87; x_wconf 91' lang='eng'><em>7250</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 982 65 1099 92; x_wconf 87' lang='eng' dir='ltr'><em>(U53465)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 369 132 1066 159">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 369 132 1066 159">
+     <span class='ocr_line' id='line_1_25' title="bbox 369 132 1066 159; baseline 0.001 -6"><span class='ocrx_word' id='word_1_36' title='bbox 369 141 427 142; x_wconf 39' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 435 132 599 154; x_wconf 88' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 609 132 769 159; x_wconf 87' lang='eng' dir='ltr'><em>aespoeensis</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 779 132 839 154; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 852 132 940 154; x_wconf 88' lang='eng' dir='ltr'><em>10631T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 950 132 1066 159; x_wconf 83' lang='eng' dir='ltr'><em>(X95230)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 458 193 1049 220">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 458 193 1049 220">
+     <span class='ocr_line' id='line_1_26' title="bbox 458 193 1049 220; baseline 0 -6"><span class='ocrx_word' id='word_1_42' title='bbox 458 193 640 214; x_wconf 86' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 650 193 798 214; x_wconf 86' lang='eng' dir='ltr'><em>tunisiensis</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 808 193 891 214; x_wconf 82' lang='eng' dir='ltr'><em>R322T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 900 193 1049 220; x_wconf 88' lang='eng' dir='ltr'><em>(EF577029)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 405 256 1048 283">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 405 256 1048 283">
+     <span class='ocr_line' id='line_1_27' title="bbox 405 256 1048 283; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 405 256 630 277; x_wconf 84' lang='eng' dir='ltr'><em>—Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 639 256 768 283; x_wconf 86' lang='eng' dir='ltr'><em>halophilus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 778 256 838 277; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 849 256 922 277; x_wconf 88' lang='eng' dir='ltr'><em>5663T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 932 256 1048 283; x_wconf 85' lang='eng' dir='ltr'><em>(X99237)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 405 321 1103 348">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 405 321 1103 348">
+     <span class='ocr_line' id='line_1_28' title="bbox 405 321 1103 348; baseline 0 -6"><span class='ocrx_word' id='word_1_51' title='bbox 405 331 444 333; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_52' title='bbox 461 321 630 342; x_wconf 78' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 639 321 785 342; x_wconf 78' lang='eng' dir='ltr'><em>brasiliensis‘</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 797 321 858 342; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 870 321 946 342; x_wconf 88' lang='eng'>15816</span> <span class='ocrx_word' id='word_1_56' title='bbox 956 321 1103 348; x_wconf 87' lang='eng' dir='ltr'><em>(AJ544687)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 424 385 1168 473">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 424 385 1168 473">
+     <span class='ocr_line' id='line_1_29' title="bbox 477 385 1168 412; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 477 385 642 406; x_wconf 87' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 651 385 838 412; x_wconf 82' lang='eng' dir='ltr'><em>hydrothermalis</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 849 385 908 406; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 921 385 1009 406; x_wconf 91' lang='eng' dir='ltr'><em>14728T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1018 385 1168 412; x_wconf 87' lang='eng' dir='ltr'>(AF458778)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 424 445 1019 473; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 424 459 442 461; x_wconf 41' lang='eng'>~</span> <span class='ocrx_word' id='word_1_63' title='bbox 459 445 624 467; x_wconf 82' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 633 446 722 473; x_wconf 86' lang='eng' dir='ltr'><em>gracilis</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 732 445 792 467; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 804 445 893 467; x_wconf 81' lang='eng' dir='ltr'><em>16080T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 902 445 1019 473; x_wconf 86' lang='eng' dir='ltr'><em>(U53464)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 291 488 426 489">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 291 488 426 489">
+     <span class='ocr_line' id='line_1_31' title="bbox 291 488 426 489; baseline 0 500"><span class='ocrx_word' id='word_1_68' title='bbox 291 488 426 489; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 201 515 245 536">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 201 515 245 536">
+     <span class='ocr_line' id='line_1_32' title="bbox 201 515 245 536; baseline 0 0"><span class='ocrx_word' id='word_1_69' title='bbox 201 515 245 536; x_wconf 93' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 4 552 271 553">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 4 552 271 553">
+     <span class='ocr_line' id='line_1_33' title="bbox 4 552 271 553; baseline 0 436"><span class='ocrx_word' id='word_1_70' title='bbox 4 552 271 553; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 4 552 5 968">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 4 552 5 968">
+     <span class='ocr_line' id='line_1_34' title="bbox 4 552 5 968; baseline 0 21"><span class='ocrx_word' id='word_1_71' title='bbox 4 552 5 968; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 289 589 330 609">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 289 589 330 609">
+     <span class='ocr_line' id='line_1_35' title="bbox 289 589 330 609; baseline 0.024 -1"><span class='ocrx_word' id='word_1_72' title='bbox 289 589 330 609; x_wconf 91' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 279 616 357 617">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 279 616 357 617">
+     <span class='ocr_line' id='line_1_36' title="bbox 279 616 357 617; baseline 0 372"><span class='ocrx_word' id='word_1_73' title='bbox 279 616 357 617; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 350 585 352 651">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 350 585 352 651">
+     <span class='ocr_line' id='line_1_37' title="bbox 350 585 352 651; baseline 0 338"><span class='ocrx_word' id='word_1_74' title='bbox 350 585 352 651; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 267 387 269 713">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 267 387 269 713">
+     <span class='ocr_line' id='line_1_38' title="bbox 267 387 269 713; baseline 0 276"><span class='ocrx_word' id='word_1_75' title='bbox 267 387 269 713; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 352 585 458 587">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 352 585 458 587">
+     <span class='ocr_line' id='line_1_39' title="bbox 352 585 458 587; baseline 0 402"><span class='ocrx_word' id='word_1_76' title='bbox 352 585 458 587; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 422 458 424 523">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 422 458 424 523">
+     <span class='ocr_line' id='line_1_40' title="bbox 422 458 424 523; baseline 0 466"><span class='ocrx_word' id='word_1_77' title='bbox 422 458 424 523; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 424 511 1092 538">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 424 511 1092 538">
+     <span class='ocr_line' id='line_1_41' title="bbox 424 511 1092 538; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 424 521 455 523; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_79' title='bbox 468 511 637 533; x_wconf 79' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 647 511 770 538; x_wconf 81' lang='eng' dir='ltr'><em>capillatus’</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 781 511 842 533; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 854 511 930 533; x_wconf 87' lang='eng'><em>14982</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 941 511 1092 538; x_wconf 87' lang='eng' dir='ltr'><em>(AY176773)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 465 574 1139 602">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 465 574 1139 602">
+     <span class='ocr_line' id='line_1_42' title="bbox 465 574 1139 602; baseline 0 -6"><span class='ocrx_word' id='word_1_84' title='bbox 465 574 630 596; x_wconf 87' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 639 575 812 596; x_wconf 87' lang='eng' dir='ltr'><em>indonesiensis</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 822 574 883 596; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 895 574 983 596; x_wconf 88' lang='eng' dir='ltr'><em>15121T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 993 574 1139 602; x_wconf 86' lang='eng' dir='ltr'><em>(AJ621884)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 352 636 1072 663">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 352 636 1072 663">
+     <span class='ocr_line' id='line_1_43' title="bbox 352 636 1072 663; baseline 0 -6"><span class='ocrx_word' id='word_1_89' title='bbox 352 649 465 651; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_90' title='bbox 472 636 637 657; x_wconf 75' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 646 636 770 663; x_wconf 79' lang='eng' dir='ltr'><em>giganteus</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 779 636 839 657; x_wconf 93' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 849 636 912 657; x_wconf 90' lang='eng'>4370</span> <span class='ocrx_word' id='word_1_94' title='bbox 922 636 1072 663; x_wconf 92' lang='eng' dir='ltr'><em>(AF418170)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 267 711 487 714">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 267 711 487 714">
+     <span class='ocr_line' id='line_1_44' title="bbox 267 711 487 714; baseline 0 275"><span class='ocrx_word' id='word_1_95' title='bbox 267 711 487 714; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 236 707 318 743">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 236 707 318 743">
+     <span class='ocr_line' id='line_1_45' title="bbox 236 707 318 743; baseline 0 -14"><span class='ocrx_word' id='word_1_96' title='bbox 236 722 266 743; x_wconf 80' lang='eng' dir='ltr'><em>7O</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 288 707 318 729; x_wconf 88' lang='eng'>95</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 296 742 324 744">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 296 742 324 744">
+     <span class='ocr_line' id='line_1_46' title="bbox 296 742 324 744; baseline 0 245"><span class='ocrx_word' id='word_1_98' title='bbox 296 742 324 744; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 320 712 322 777">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 320 712 322 777">
+     <span class='ocr_line' id='line_1_47' title="bbox 320 712 322 777; baseline 0 212"><span class='ocrx_word' id='word_1_99' title='bbox 320 712 322 777; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 279 615 281 807">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 279 615 281 807">
+     <span class='ocr_line' id='line_1_48' title="bbox 279 615 281 807; baseline 0 182"><span class='ocrx_word' id='word_1_100' title='bbox 279 615 281 807; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 279 805 300 807">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 279 805 300 807">
+     <span class='ocr_line' id='line_1_49' title="bbox 279 805 300 807; baseline 0 182"><span class='ocrx_word' id='word_1_101' title='bbox 279 805 300 807; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 257 823 286 844">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 257 823 286 844">
+     <span class='ocr_line' id='line_1_50' title="bbox 257 823 286 844; baseline 0 0"><span class='ocrx_word' id='word_1_102' title='bbox 257 823 286 844; x_wconf 90' lang='eng'><em>82</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 296 742 298 870">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 296 742 298 870">
+     <span class='ocr_line' id='line_1_51' title="bbox 296 742 298 870; baseline 0 119"><span class='ocrx_word' id='word_1_103' title='bbox 296 742 298 870; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 296 868 330 870">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 296 868 330 870">
+     <span class='ocr_line' id='line_1_52' title="bbox 296 868 330 870; baseline 0 119"><span class='ocrx_word' id='word_1_104' title='bbox 296 868 330 870; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 326 839 328 904">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 326 839 328 904">
+     <span class='ocr_line' id='line_1_53' title="bbox 326 839 328 904; baseline 0 85"><span class='ocrx_word' id='word_1_105' title='bbox 326 839 328 904; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 287 882 316 904">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 287 882 316 904">
+     <span class='ocr_line' id='line_1_54' title="bbox 287 882 316 904; baseline -0.034 0"><span class='ocrx_word' id='word_1_106' title='bbox 287 882 316 904; x_wconf 85' lang='eng'><em>92</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 469 703 1241 919">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 496 703 1141 731">
+     <span class='ocr_line' id='line_1_55' title="bbox 496 703 1141 731; baseline 0 -6"><span class='ocrx_word' id='word_1_107' title='bbox 496 703 665 725; x_wconf 81' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 674 703 838 725; x_wconf 80' lang='eng' dir='ltr'><em>fairﬁeldensis’</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 848 703 925 725; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 935 704 1013 725; x_wconf 91' lang='eng'>70045</span> <span class='ocrx_word' id='word_1_111' title='bbox 1023 703 1141 731; x_wconf 88' lang='eng' dir='ltr'><em>(U42221)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 469 765 1241 857">
+     <span class='ocr_line' id='line_1_56' title="bbox 469 765 1241 792; baseline 0 -5"><span class='ocrx_word' id='word_1_112' title='bbox 469 765 634 787; x_wconf 87' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 644 765 741 792; x_wconf 85' lang='eng' dir='ltr'><em>vulgaris</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 750 765 831 792; x_wconf 87' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 844 765 940 792; x_wconf 89' lang='eng' dir='ltr'><em>vulgaris</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 950 765 1010 787; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1021 765 1079 787; x_wconf 89' lang='eng' dir='ltr'><em>644T</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 1086 765 1241 792; x_wconf 88' lang='eng' dir='ltr'><em>(DQ826728)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 483 830 1194 857; baseline 0 -6"><span class='ocrx_word' id='word_1_119' title='bbox 483 830 648 851; x_wconf 88' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 656 830 859 857; x_wconf 82' lang='eng' dir='ltr'><em>psychrotolerans</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 869 830 929 851; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 941 830 1029 851; x_wconf 81' lang='eng' dir='ltr'><em>19430T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 1039 830 1194 857; x_wconf 85' lang='eng' dir='ltr'><em>(AM418397)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 505 891 1175 919">
+     <span class='ocr_line' id='line_1_58' title="bbox 505 891 1175 919; baseline -0.001 -5"><span class='ocrx_word' id='word_1_124' title='bbox 505 892 670 914; x_wconf 87' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 679 892 812 914; x_wconf 88' lang='eng' dir='ltr'><em>alaskensis</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 830 892 919 914; x_wconf 90' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 931 891 1019 914; x_wconf 87' lang='eng' dir='ltr'><em>13491T</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 1029 892 1175 919; x_wconf 90' lang='eng' dir='ltr'><em>(AJ404226)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 294 957 975 984">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 294 957 975 984">
+     <span class='ocr_line' id='line_1_59' title="bbox 294 957 975 984; baseline 0 -6"><span class='ocrx_word' id='word_1_129' title='bbox 294 957 530 978; x_wconf 83' lang='eng' dir='ltr'><em>Desulfotomaculum</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 539 957 678 984; x_wconf 89' lang='eng' dir='ltr'><em>halophilum</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 688 957 748 978; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 761 957 849 978; x_wconf 80' lang='eng' dir='ltr'><em>11559T</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 858 957 975 984; x_wconf 87' lang='eng' dir='ltr'>(U88891)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000968-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000968-0-000.pbm.png
new file mode 100644
index 00000000..1c962671
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000968-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000968-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000968-0-000.pbm.png.hocr
new file mode 100644
index 00000000..ac47ebf2
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000968-0-000.pbm.png.hocr
@@ -0,0 +1,218 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000968-0-000.pbm.png"; bbox 0 0 994 1292; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 5 818 7 1272">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 5 818 7 1272">
+     <span class='ocr_line' id='line_1_1' title="bbox 5 818 7 1272; baseline 0 20"><span class='ocrx_word' id='word_1_1' title='bbox 5 818 7 1272; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 18 6 64 25">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 18 6 64 25">
+     <span class='ocr_line' id='line_1_2' title="bbox 18 6 64 25; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 18 6 64 25; x_wconf 79' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 31 790 58 809">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 31 790 58 809">
+     <span class='ocr_line' id='line_1_3' title="bbox 31 790 58 809; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 31 790 58 809; x_wconf 88' lang='eng'><em>86</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 69 995 96 1014">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 69 995 96 1014">
+     <span class='ocr_line' id='line_1_4' title="bbox 69 995 96 1014; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 69 995 96 1014; x_wconf 87' lang='eng'><em>52</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 101 927 104 1044">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 101 927 104 1044">
+     <span class='ocr_line' id='line_1_5' title="bbox 101 927 104 1044; baseline 0 248"><span class='ocrx_word' id='word_1_5' title='bbox 101 927 104 1044; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 173 620 213 640">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 173 620 213 640">
+     <span class='ocr_line' id='line_1_6' title="bbox 173 620 213 640; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 173 620 213 640; x_wconf 83' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 347 8 798 35">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 347 8 798 35">
+     <span class='ocr_line' id='line_1_7' title="bbox 347 8 798 35; baseline 0 -5"><span class='ocrx_word' id='word_1_7' title='bbox 347 17 377 19; x_wconf 89' lang='eng'>—</span> <span class='ocrx_word' id='word_1_8' title='bbox 385 10 457 35; x_wconf 84' lang='eng' dir='ltr'><em>Dye/la</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 467 10 581 30; x_wconf 83' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 590 8 650 30; x_wconf 79' lang='eng' dir='ltr'><em>B84T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 658 10 798 35; x_wconf 85' lang='eng' dir='ltr'><em>(AY884571)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 345 17 347 133">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 345 17 347 133">
+     <span class='ocr_line' id='line_1_8' title="bbox 345 17 347 133; baseline 0 1159"><span class='ocrx_word' id='word_1_12' title='bbox 345 17 347 133; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 347 124 732 151">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 347 124 732 151">
+     <span class='ocr_line' id='line_1_9' title="bbox 347 124 732 151; baseline 0 -6"><span class='ocrx_word' id='word_1_13' title='bbox 347 131 380 133; x_wconf 84' lang='eng'>—</span> <span class='ocrx_word' id='word_1_14' title='bbox 389 126 461 146; x_wconf 90' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 472 124 577 146; x_wconf 58' lang='eng' dir='ltr'><em>CSS-BZ&#39;r</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 585 126 732 151; x_wconf 82' lang='eng' dir='ltr'><em>(AM939778)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 302 186 323 188">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 302 186 323 188">
+     <span class='ocr_line' id='line_1_10' title="bbox 302 186 323 188; baseline 0 1104"><span class='ocrx_word' id='word_1_17' title='bbox 302 186 323 188; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 332 236 928 264">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 332 236 928 264">
+     <span class='ocr_line' id='line_1_11' title="bbox 332 236 928 264; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 332 244 404 246; x_wconf 90' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_19' title='bbox 414 239 486 264; x_wconf 88' lang='eng' dir='ltr'><em>Dye/Ia</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 495 239 636 264; x_wconf 85' lang='eng' dir='ltr'><em>ginsengisoli</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 643 238 701 258; x_wconf 86' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 711 236 781 258; x_wconf 79' lang='eng' dir='ltr'><em>3046T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 789 239 928 264; x_wconf 81' lang='eng' dir='ltr'><em>(ABZ45367)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 321 73 323 303">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 321 73 323 303">
+     <span class='ocr_line' id='line_1_12' title="bbox 321 73 323 303; baseline 0 989"><span class='ocrx_word' id='word_1_24' title='bbox 321 73 323 303; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 271 302 332 322">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 271 302 332 322">
+     <span class='ocr_line' id='line_1_13' title="bbox 271 302 332 322; baseline -0.016 0"><span class='ocrx_word' id='word_1_25' title='bbox 271 302 332 322; x_wconf 60' lang='eng'><em>86*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 271 329 304 331">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 271 329 304 331">
+     <span class='ocr_line' id='line_1_14' title="bbox 271 329 304 331; baseline 0 961"><span class='ocrx_word' id='word_1_26' title='bbox 271 329 304 331; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 330 244 332 360">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 330 244 332 360">
+     <span class='ocr_line' id='line_1_15' title="bbox 330 244 332 360; baseline 0 932"><span class='ocrx_word' id='word_1_27' title='bbox 330 244 332 360; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 495 345 993 372">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 495 345 993 372">
+     <span class='ocr_line' id='line_1_16' title="bbox 495 345 993 372; baseline 0 -5"><span class='ocrx_word' id='word_1_28' title='bbox 495 347 600 367; x_wconf 77' lang='eng' dir='ltr'><em>Frateun&#39;a</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 610 347 704 367; x_wconf 75' lang='eng' dir='ltr'><em>aurantia</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 715 347 771 367; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 781 345 851 367; x_wconf 87' lang='eng' dir='ltr'><em>6220T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 858 347 993 372; x_wconf 87' lang='eng' dir='ltr'><em>(AJO10481)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 302 186 304 474">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 302 186 304 474">
+     <span class='ocr_line' id='line_1_17' title="bbox 302 186 304 474; baseline 0 818"><span class='ocrx_word' id='word_1_33' title='bbox 302 186 304 474; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 304 472 388 474">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 304 472 388 474">
+     <span class='ocr_line' id='line_1_18' title="bbox 304 472 388 474; baseline 0 818"><span class='ocrx_word' id='word_1_34' title='bbox 304 472 388 474; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 261 463 809 490">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 261 463 809 490">
+     <span class='ocr_line' id='line_1_19' title="bbox 261 463 809 490; baseline 0 -5"><span class='ocrx_word' id='word_1_35' title='bbox 261 475 273 488; x_wconf 45' lang='eng'><em>*1</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 395 465 467 490; x_wconf 75' lang='eng' dir='ltr'><em>Dye/la</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 473 465 575 490; x_wconf 77' lang='eng' dir='ltr'><em>japan/ca</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 583 463 661 485; x_wconf 82' lang='eng' dir='ltr'><em>XD53T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 669 465 809 490; x_wconf 83' lang='eng' dir='ltr'><em>(AB110498)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 291 585 391 587">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 291 585 391 587">
+     <span class='ocr_line' id='line_1_20' title="bbox 291 585 391 587; baseline 0 705"><span class='ocrx_word' id='word_1_40' title='bbox 291 585 391 587; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 298 578 896 655">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 298 578 896 655">
+     <span class='ocr_line' id='line_1_21' title="bbox 397 578 896 606; baseline 0 -6"><span class='ocrx_word' id='word_1_41' title='bbox 397 580 470 606; x_wconf 84' lang='eng' dir='ltr'><em>Dye/la</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 477 580 604 606; x_wconf 85' lang='eng' dir='ltr'><em>yeojuensis</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 614 578 744 600; x_wconf 83' lang='eng' dir='ltr'><em>R2A16-10T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 752 580 896 605; x_wconf 86' lang='eng' dir='ltr'><em>(DQ181549)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 298 635 325 655; baseline 0 0"><span class='ocrx_word' id='word_1_45' title='bbox 298 635 325 655; x_wconf 90' lang='eng'><em>55</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 273 643 289 665">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 273 643 289 665">
+     <span class='ocr_line' id='line_1_23' title="bbox 273 643 289 665; textangle 90"><span class='ocrx_word' id='word_1_46' title='bbox 276 656 286 665; x_wconf 59' lang='eng' dir='ltr'><strong>X&#39;</strong></span> <span class='ocrx_word' id='word_1_47' title='bbox 273 643 289 646; x_wconf 84' lang='eng'>|</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 289 585 291 700">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 289 585 291 700">
+     <span class='ocr_line' id='line_1_24' title="bbox 289 585 291 700; baseline 0 592"><span class='ocrx_word' id='word_1_48' title='bbox 289 585 291 700; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 482 684 974 743">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 482 684 974 743">
+     <span class='ocr_line' id='line_1_25' title="bbox 490 684 974 706; baseline 0 0"><span class='ocrx_word' id='word_1_49' title='bbox 490 686 674 706; x_wconf 75' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 680 686 859 706; x_wconf 80' lang='eng' dir='ltr'><em>Iindaniclasticus</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 869 684 974 706; x_wconf 88' lang='eng' dir='ltr'><em>RP5557T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 482 718 621 743; baseline 0 -5"><span class='ocrx_word' id='word_1_52' title='bbox 482 718 621 743; x_wconf 82' lang='eng' dir='ltr'><em>(AF039167)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 268 329 274 815">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 268 329 274 815">
+     <span class='ocr_line' id='line_1_27' title="bbox 268 329 274 815; baseline 0 477"><span class='ocrx_word' id='word_1_53' title='bbox 268 329 274 815; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 269 329 275 815">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 269 329 275 815">
+     <span class='ocr_line' id='line_1_28' title="bbox 269 329 275 815; baseline 0 477"><span class='ocrx_word' id='word_1_54' title='bbox 269 329 275 815; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 269 329 276 815">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 269 329 276 815">
+     <span class='ocr_line' id='line_1_29' title="bbox 269 329 276 815; baseline 0 477"><span class='ocrx_word' id='word_1_55' title='bbox 269 329 276 815; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 270 813 357 815">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 270 813 357 815">
+     <span class='ocr_line' id='line_1_30' title="bbox 270 813 357 815; baseline 0 477"><span class='ocrx_word' id='word_1_56' title='bbox 270 813 357 815; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 365 806 851 833">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 365 806 851 833">
+     <span class='ocr_line' id='line_1_31' title="bbox 365 806 851 833; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 365 808 501 827; x_wconf 84' lang='eng' dir='ltr'><em>Fulvimonas</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 510 808 550 827; x_wconf 86' lang='eng' dir='ltr'><em>so/i</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 558 807 612 827; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 624 806 706 827; x_wconf 75' lang='eng' dir='ltr'><em>19981T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 715 808 851 833; x_wconf 86' lang='eng' dir='ltr'><em>(AJ311653)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 266 918 764 945">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 266 918 764 945">
+     <span class='ocr_line' id='line_1_32' title="bbox 266 918 764 945; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 266 921 400 945; x_wconf 81' lang='eng' dir='ltr'><em>Aquimonas</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 410 921 473 940; x_wconf 85' lang='eng' dir='ltr'><em>voraii</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 480 920 569 940; x_wconf 87' lang='eng' dir='ltr'><em>GPTSA</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 578 918 618 940; x_wconf 90' lang='eng' dir='ltr'><em>20T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 627 921 764 945; x_wconf 88' lang='eng' dir='ltr'><em>(AY544768)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 336 1035 847 1062">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 336 1035 847 1062">
+     <span class='ocr_line' id='line_1_33' title="bbox 336 1035 847 1062; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 336 1037 468 1057; x_wconf 85' lang='eng' dir='ltr'><em>Dokdone/la</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 477 1037 591 1057; x_wconf 83' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 601 1035 701 1057; x_wconf 84' lang='eng' dir='ltr'><em>DS—123T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 709 1037 847 1062; x_wconf 85' lang='eng' dir='ltr'><em>(AY987368)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 282 1147 708 1174">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 282 1147 708 1174">
+     <span class='ocr_line' id='line_1_34' title="bbox 282 1147 708 1174; baseline 0 -5"><span class='ocrx_word' id='word_1_71' title='bbox 282 1149 426 1169; x_wconf 84' lang='eng' dir='ltr'><em>Silanimonas</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 434 1150 490 1169; x_wconf 75' lang='eng' dir='ltr'><em>lenta</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 498 1147 563 1169; x_wconf 90' lang='eng' dir='ltr'><em>25-4T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 571 1150 708 1174; x_wconf 85' lang='eng' dir='ltr'><em>(AY557615)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 304 1263 850 1290">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 304 1263 850 1290">
+     <span class='ocr_line' id='line_1_35' title="bbox 304 1263 850 1290; baseline 0 -5"><span class='ocrx_word' id='word_1_75' title='bbox 304 1265 469 1285; x_wconf 81' lang='eng' dir='ltr'><em>Xanthomonas</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 477 1265 606 1290; x_wconf 77' lang='eng' dir='ltr'><em>campestris</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 615 1265 670 1285; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 680 1263 735 1285; x_wconf 80' lang='eng' dir='ltr'><em>568T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 743 1265 850 1290; x_wconf 80' lang='eng' dir='ltr'><em>(X95917)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-000.pbm.png
new file mode 100644
index 00000000..194592c9
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-000.pbm.png.hocr
new file mode 100644
index 00000000..a37c25b8
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-000.pbm.png.hocr
@@ -0,0 +1,102 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000984-0-000.pbm.png"; bbox 0 0 1172 533; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 130 139 171 157">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 130 139 171 157">
+     <span class='ocr_line' id='line_1_1' title="bbox 130 139 171 157; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 130 139 171 157; x_wconf 87' lang='eng'>0.01</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 427 0 1083 241">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 479 0 1083 70">
+     <span class='ocr_line' id='line_1_2' title="bbox 489 0 1083 29; baseline 0.002 -7"><span class='ocrx_word' id='word_1_2' title='bbox 489 11 514 29; x_wconf 75' lang='eng'><em>84</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 558 3 581 22; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 593 3 798 23; x_wconf 84' lang='eng' dir='ltr'><em>histidinolovorans</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 808 2 865 23; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 875 0 963 23; x_wconf 80' lang='eng' dir='ltr'><em>20115T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 972 3 1083 28; x_wconf 91' lang='eng' dir='ltr'><em>(X83406)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 479 43 1003 70; baseline 0 -5"><span class='ocrx_word' id='word_1_8' title='bbox 479 43 503 61; x_wconf 79' lang='eng'>96</span> <span class='ocrx_word' id='word_1_9' title='bbox 536 45 558 65; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 571 45 748 65; x_wconf 82' lang='eng' dir='ltr'><em>nicotinovorans</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 758 45 815 65; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 825 43 882 65; x_wconf 89' lang='eng' dir='ltr'><em>420T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 892 45 1003 70; x_wconf 88' lang='eng' dir='ltr'>(X80743)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 571 85 1056 156">
+     <span class='ocr_line' id='line_1_4' title="bbox 594 85 1056 113; baseline -0.002 -5"><span class='ocrx_word' id='word_1_14' title='bbox 594 88 617 107; x_wconf 97' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 629 87 770 108; x_wconf 87' lang='eng' dir='ltr'><em>ureafaciens</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 781 87 838 108; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 848 85 935 108; x_wconf 78' lang='eng' dir='ltr'><em>20128T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 945 88 1056 113; x_wconf 89' lang='eng' dir='ltr'><em>(X80744)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 571 128 1018 156; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 571 130 594 151; x_wconf 90' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 606 136 732 151; x_wconf 79' lang='eng' dir='ltr'><em>aurescens</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 742 130 800 151; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 810 128 898 151; x_wconf 76' lang='eng' dir='ltr'><em>20116T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 907 130 1018 156; x_wconf 89' lang='eng' dir='ltr'><em>(X83405)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 427 171 1066 241">
+     <span class='ocr_line' id='line_1_6' title="bbox 665 171 1066 199; baseline 0 -6"><span class='ocrx_word' id='word_1_24' title='bbox 665 173 688 193; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 700 173 780 193; x_wconf 77' lang='eng' dir='ltr'><em>citreus</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 791 173 847 193; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 858 171 945 193; x_wconf 86' lang='eng' dir='ltr'><em>20133T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 955 173 1066 199; x_wconf 86' lang='eng' dir='ltr'>(X80737)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 427 214 966 241; baseline 0 -5"><span class='ocrx_word' id='word_1_29' title='bbox 427 225 502 228; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_30' title='bbox 510 216 532 236; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 545 216 751 241; x_wconf 85' lang='eng' dir='ltr'><em>chlorophenolicus</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 758 214 813 236; x_wconf 74' lang='eng' dir='ltr'><em>A—6T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 822 216 966 241; x_wconf 85' lang='eng' dir='ltr'>(AF102267)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 353 8 662 309">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 353 8 662 309">
+     <span class='ocr_line' id='line_1_8' title="bbox 514 8 555 30; baseline 0 503"><span class='ocrx_word' id='word_1_34' title='bbox 514 8 555 30; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 381 42 590 127; baseline 0 0"><span class='ocrx_word' id='word_1_35' title='bbox 381 42 590 127; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 353 127 662 224; baseline 0 -23"><span class='ocrx_word' id='word_1_36' title='bbox 353 127 662 224; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 353 224 392 254; baseline 0 279"><span class='ocrx_word' id='word_1_37' title='bbox 353 224 392 254; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 353 254 395 309; baseline 0 224"><span class='ocrx_word' id='word_1_38' title='bbox 353 254 395 309; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 427 228 429 302">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 427 228 429 302">
+     <span class='ocr_line' id='line_1_13' title="bbox 427 228 429 302; baseline 0 231"><span class='ocrx_word' id='word_1_39' title='bbox 427 228 429 302; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 0 310 516 313">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 0 310 516 313">
+     <span class='ocr_line' id='line_1_14' title="bbox 0 310 516 313; baseline 0 220"><span class='ocrx_word' id='word_1_40' title='bbox 0 310 516 313; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 395 256 1061 455">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 395 256 1061 455">
+     <span class='ocr_line' id='line_1_15' title="bbox 395 256 857 289; baseline -0.002 -10"><span class='ocrx_word' id='word_1_41' title='bbox 395 271 419 289; x_wconf 72' lang='eng'>92</span> <span class='ocrx_word' id='word_1_42' title='bbox 518 258 593 279; x_wconf 91' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 604 256 697 284; x_wconf 82' lang='eng' dir='ltr'><em>Sphe3&#39;r</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 706 258 857 284; x_wconf 85' lang='eng' dir='ltr'>(AM176541)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 425 268 1061 356; baseline 0 -34"><span class='ocrx_word' id='word_1_45' title='bbox 425 268 509 356; x_wconf 42' lang='eng' dir='ltr'><em>EH</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 523 302 546 322; x_wconf 69' lang='eng' dir='ltr'><em>A,</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 557 302 775 327; x_wconf 86' lang='eng' dir='ltr'><em>polychromogenes</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 785 301 842 322; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 853 299 940 322; x_wconf 85' lang='eng' dir='ltr'><em>20136T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 950 302 1061 327; x_wconf 91' lang='eng' dir='ltr'>(X80741)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 450 341 936 370; baseline 0 -6"><span class='ocrx_word' id='word_1_51' title='bbox 450 341 475 358; x_wconf 85' lang='eng'><em>93</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 514 344 537 364; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 549 344 651 370; x_wconf 89' lang='eng' dir='ltr'><em>oxydans</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 661 344 718 364; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 728 342 815 364; x_wconf 82' lang='eng' dir='ltr'><em>20119T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 825 344 936 370; x_wconf 83' lang='eng' dir='ltr'>(X83408)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 481 385 939 413; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 481 387 504 407; x_wconf 72' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 516 387 648 413; x_wconf 85' lang='eng' dir='ltr'><em>globiformis</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 658 387 715 407; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 726 385 813 407; x_wconf 91' lang='eng' dir='ltr'><em>20124T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 823 387 939 412; x_wconf 87' lang='eng' dir='ltr'>(M23411)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 405 426 892 455; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 405 426 442 444; x_wconf 69' lang='eng'>100</span> <span class='ocrx_word' id='word_1_63' title='bbox 470 430 492 449; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 503 435 606 455; x_wconf 84' lang='eng' dir='ltr'><em>pascens</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 616 429 673 450; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 684 427 771 450; x_wconf 89' lang='eng' dir='ltr'><em>20545T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 781 430 892 455; x_wconf 93' lang='eng' dir='ltr'>(X80740)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 667 471 1172 499">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 667 471 1172 499">
+     <span class='ocr_line' id='line_1_20' title="bbox 667 471 1172 499; baseline 0 -5"><span class='ocrx_word' id='word_1_68' title='bbox 667 474 851 499; x_wconf 82' lang='eng' dir='ltr'><em>Mycobacterium</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 861 474 993 499; x_wconf 78' lang='eng' dir='ltr'><em>smegmatis</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1001 474 1075 494; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 1087 471 1172 494; x_wconf 90' lang='eng' dir='ltr'><em>19420T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 3 500 657 502">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 3 500 657 502">
+     <span class='ocr_line' id='line_1_21' title="bbox 3 500 657 502; baseline 0 31"><span class='ocrx_word' id='word_1_72' title='bbox 3 500 657 502; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 666 507 811 533">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 666 507 811 533">
+     <span class='ocr_line' id='line_1_22' title="bbox 666 507 811 533; baseline 0 -6"><span class='ocrx_word' id='word_1_73' title='bbox 666 507 811 533; x_wconf 89' lang='eng' dir='ltr'>(AY457078)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-001.pbm.png
new file mode 100644
index 00000000..296b46d6
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-001.pbm.png.hocr
new file mode 100644
index 00000000..a1310343
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.000984-0-001.pbm.png.hocr
@@ -0,0 +1,148 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.000984-0-001.pbm.png"; bbox 0 0 1148 469; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 378 6 438">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 0 378 6 438">
+     <span class='ocr_line' id='line_1_1' title="bbox 0 378 6 438; baseline 0 31"><span class='ocrx_word' id='word_1_1' title='bbox 0 378 6 438; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 57 43 102 61">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 57 43 102 61">
+     <span class='ocr_line' id='line_1_2' title="bbox 57 43 102 61; baseline -0.022 0"><span class='ocrx_word' id='word_1_2' title='bbox 57 43 102 61; x_wconf 86' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 140 154 165 172">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 140 154 165 172">
+     <span class='ocr_line' id='line_1_3' title="bbox 140 154 165 172; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 140 154 165 172; x_wconf 84' lang='eng'><em>84</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 475 0 1148 175">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 475 0 1148 175">
+     <span class='ocr_line' id='line_1_4' title="bbox 504 0 971 28; baseline 0 -6"><span class='ocrx_word' id='word_1_4' title='bbox 504 3 527 22; x_wconf 96' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 540 3 641 28; x_wconf 85' lang='eng' dir='ltr'><em>oxydans</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 648 2 722 22; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 734 0 819 22; x_wconf 83' lang='eng' dir='ltr'><em>14358T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 828 3 971 28; x_wconf 83' lang='eng' dir='ltr'><em>(AF214789)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 475 37 1056 64; baseline 0 -5"><span class='ocrx_word' id='word_1_9' title='bbox 475 39 498 59; x_wconf 94' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 509 39 726 64; x_wconf 86' lang='eng' dir='ltr'><em>polychromogenes</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 734 39 807 59; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 819 37 904 59; x_wconf 82' lang='eng' dir='ltr'><em>15216T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 914 39 1056 64; x_wconf 91' lang='eng' dir='ltr'><em>(AF214785)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 521 74 859 101; baseline 0 -5"><span class='ocrx_word' id='word_1_14' title='bbox 521 76 596 96; x_wconf 84' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 607 74 699 101; x_wconf 79' lang='eng' dir='ltr'><em>Sphe3T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 709 76 859 101; x_wconf 87' lang='eng' dir='ltr'><em>(AM931439)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 603 110 1093 138; baseline -0.002 -5"><span class='ocrx_word' id='word_1_17' title='bbox 603 113 625 132; x_wconf 90' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 638 118 763 133; x_wconf 84' lang='eng' dir='ltr'><em>aurescens</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 771 113 844 133; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 856 110 941 133; x_wconf 83' lang='eng' dir='ltr'><em>13344T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 951 113 1093 138; x_wconf 85' lang='eng' dir='ltr'><em>(AF214793)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 580 147 1148 175; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 580 149 603 169; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 615 149 818 169; x_wconf 81' lang='eng' dir='ltr'><em>histidinolovorans</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 826 149 899 169; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 911 147 996 169; x_wconf 79' lang='eng' dir='ltr'><em>11442T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1005 149 1148 175; x_wconf 84' lang='eng' dir='ltr'><em>(AF214788)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 347 7 372 24">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 347 7 372 24">
+     <span class='ocr_line' id='line_1_9' title="bbox 347 7 372 24; baseline 0 0"><span class='ocrx_word' id='word_1_27' title='bbox 347 7 372 24; x_wconf 88' lang='eng'>98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 376 11 378 47">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 376 11 378 47">
+     <span class='ocr_line' id='line_1_10' title="bbox 376 11 378 47; baseline 0 422"><span class='ocrx_word' id='word_1_28' title='bbox 376 11 378 47; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 376 47 468 50">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 376 47 468 50">
+     <span class='ocr_line' id='line_1_11' title="bbox 376 47 468 50; baseline 0 419"><span class='ocrx_word' id='word_1_29' title='bbox 376 47 468 50; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 172 25 512 176">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 172 25 512 176">
+     <span class='ocr_line' id='line_1_12' title="bbox 172 25 512 176; baseline 0 0"><span class='ocrx_word' id='word_1_30' title='bbox 172 25 512 176; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 259 121 261 178">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 259 121 261 178">
+     <span class='ocr_line' id='line_1_13' title="bbox 259 121 261 178; baseline 0 291"><span class='ocrx_word' id='word_1_31' title='bbox 259 121 261 178; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 281 158 283 194">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 281 158 283 194">
+     <span class='ocr_line' id='line_1_14' title="bbox 281 158 283 194; baseline 0 275"><span class='ocrx_word' id='word_1_32' title='bbox 281 158 283 194; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 102 176 283 178">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 102 176 283 178">
+     <span class='ocr_line' id='line_1_15' title="bbox 102 176 283 178; baseline 0 291"><span class='ocrx_word' id='word_1_33' title='bbox 102 176 283 178; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 74 227 95 245">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 74 227 95 245">
+     <span class='ocr_line' id='line_1_16' title="bbox 74 227 95 245; baseline -0.048 0"><span class='ocrx_word' id='word_1_34' title='bbox 74 227 95 245; x_wconf 87' lang='eng'><em>51</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 102 176 104 325">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 102 176 104 325">
+     <span class='ocr_line' id='line_1_17' title="bbox 102 176 104 325; baseline 0 144"><span class='ocrx_word' id='word_1_35' title='bbox 102 176 104 325; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 102 323 170 325">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 102 323 170 325">
+     <span class='ocr_line' id='line_1_18' title="bbox 102 323 170 325; baseline 0 144"><span class='ocrx_word' id='word_1_36' title='bbox 102 323 170 325; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 135 331 159 348">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 135 331 159 348">
+     <span class='ocr_line' id='line_1_19' title="bbox 135 331 159 348; baseline 0 0"><span class='ocrx_word' id='word_1_37' title='bbox 135 331 159 348; x_wconf 89' lang='eng'>72</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 168 307 170 343">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 168 307 170 343">
+     <span class='ocr_line' id='line_1_20' title="bbox 168 307 170 343; baseline 0 126"><span class='ocrx_word' id='word_1_38' title='bbox 168 307 170 343; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 168 158 1078 307">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 205 184 1078 285">
+     <span class='ocr_line' id='line_1_21' title="bbox 248 184 1078 212; baseline 0 -6"><span class='ocrx_word' id='word_1_39' title='bbox 248 184 273 201; x_wconf 86' lang='eng'><em>59</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 281 194 581 197; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_41' title='bbox 588 187 611 206; x_wconf 98' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 623 187 764 207; x_wconf 85' lang='eng' dir='ltr'><em>ureafaciens</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 772 187 845 207; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 855 184 926 207; x_wconf 86' lang='eng' dir='ltr'><em>7562T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 936 187 1078 212; x_wconf 87' lang='eng' dir='ltr'><em>(AF214782)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 415 221 897 249; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 415 224 438 243; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 450 223 582 249; x_wconf 87' lang='eng' dir='ltr'><em>globiformis</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 590 223 663 243; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 674 221 745 243; x_wconf 76' lang='eng' dir='ltr'>8010T</span> <span class='ocrx_word' id='word_1_50' title='bbox 754 224 897 248; x_wconf 79' lang='eng' dir='ltr'><em>(AF214780)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 205 257 994 285; baseline 0 -5"><span class='ocrx_word' id='word_1_51' title='bbox 205 257 230 275; x_wconf 75' lang='eng'><em>68</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 528 260 551 280; x_wconf 61' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 562 265 664 285; x_wconf 86' lang='eng' dir='ltr'><em>pascens</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 672 260 745 280; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 757 258 842 280; x_wconf 75' lang='eng' dir='ltr'><em>13346T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 852 260 994 285; x_wconf 86' lang='eng' dir='ltr'><em>(AF214786)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 532 294 1109 396">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 532 294 1109 396">
+     <span class='ocr_line' id='line_1_24' title="bbox 620 294 1109 322; baseline 0 -5"><span class='ocrx_word' id='word_1_57' title='bbox 620 297 643 317; x_wconf 69' lang='eng' dir='ltr'><em>A,</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 655 297 778 317; x_wconf 82' lang='eng' dir='ltr'><em>nicotianae</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 786 297 860 317; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 872 294 956 317; x_wconf 86' lang='eng' dir='ltr'><em>15236T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 966 297 1109 322; x_wconf 87' lang='eng' dir='ltr'><em>(AF214792)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 532 332 1007 359; baseline -0.002 -5"><span class='ocrx_word' id='word_1_62' title='bbox 532 334 555 353; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 567 334 677 354; x_wconf 87' lang='eng' dir='ltr'><em>sulfureus</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 685 334 758 354; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 770 332 855 354; x_wconf 75' lang='eng' dir='ltr'><em>19098T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 864 334 1007 359; x_wconf 86' lang='eng' dir='ltr'><em>(AF214787)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 545 369 990 396; baseline -0.002 -5"><span class='ocrx_word' id='word_1_67' title='bbox 545 371 568 390; x_wconf 94' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 581 371 660 391; x_wconf 76' lang='eng' dir='ltr'><em>citreus</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 668 371 741 391; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 753 369 838 391; x_wconf 79' lang='eng' dir='ltr'><em>11624T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 848 371 990 396; x_wconf 89' lang='eng' dir='ltr'><em>(AF214781)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 620 408 1134 469">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 620 408 1134 469">
+     <span class='ocr_line' id='line_1_27' title="bbox 620 408 1134 436; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 620 410 804 436; x_wconf 80' lang='eng' dir='ltr'><em>Mycobacterium</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 814 410 969 430; x_wconf 73' lang='eng' dir='ltr'><em>mon‘okaense</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 979 410 1022 430; x_wconf 89' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 1034 408 1134 430; x_wconf 79' lang='eng' dir='ltr'><em>105393T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 620 443 764 469; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 620 443 764 469; x_wconf 86' lang='eng' dir='ltr'><em>(AY859691)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-000.pbm.png
new file mode 100644
index 00000000..925c6ac6
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-000.pbm.png.hocr
new file mode 100644
index 00000000..b4c323bb
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-000.pbm.png.hocr
@@ -0,0 +1,377 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001123-0-000.pbm.png"; bbox 0 0 1243 1430; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 115 34 149 50">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 115 34 149 50">
+     <span class='ocr_line' id='line_1_1' title="bbox 115 34 149 50; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 115 34 149 50; x_wconf 88' lang='eng'>1%</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 107 63 157 65">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 107 63 157 65">
+     <span class='ocr_line' id='line_1_2' title="bbox 107 63 157 65; baseline 0 1365"><span class='ocrx_word' id='word_1_2' title='bbox 107 63 157 65; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 349 99 383 116">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 349 99 383 116">
+     <span class='ocr_line' id='line_1_3' title="bbox 349 99 383 116; baseline 0.029 -1"><span class='ocrx_word' id='word_1_3' title='bbox 349 99 383 116; x_wconf 90' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 397 13 496 15">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 397 13 496 15">
+     <span class='ocr_line' id='line_1_4' title="bbox 397 13 496 15; baseline 0 1415"><span class='ocrx_word' id='word_1_4' title='bbox 397 13 496 15; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 503 3 1080 66">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 503 3 1080 66">
+     <span class='ocr_line' id='line_1_5' title="bbox 503 3 965 29; baseline 0 -5"><span class='ocrx_word' id='word_1_5' title='bbox 503 4 523 24; x_wconf 78' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_6' title='bbox 536 4 657 24; x_wconf 82' lang='eng' dir='ltr'>ubonensis</span> <span class='ocrx_word' id='word_1_7' title='bbox 667 4 722 24; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_8' title='bbox 732 3 815 24; x_wconf 88' lang='eng' dir='ltr'>20358T</span> <span class='ocrx_word' id='word_1_9' title='bbox 824 4 965 29; x_wconf 87' lang='eng' dir='ltr'>(AY780511)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 579 40 1080 66; baseline 0 -6"><span class='ocrx_word' id='word_1_10' title='bbox 579 41 600 60; x_wconf 91' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_11' title='bbox 613 41 774 61; x_wconf 77' lang='eng' dir='ltr'>vietnamiensis</span> <span class='ocrx_word' id='word_1_12' title='bbox 783 41 839 61; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_13' title='bbox 851 40 932 61; x_wconf 73' lang='eng' dir='ltr'>10929T</span> <span class='ocrx_word' id='word_1_14' title='bbox 941 41 1080 66; x_wconf 87' lang='eng' dir='ltr'>(AF143774)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 417 68 437 70">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 417 68 437 70">
+     <span class='ocr_line' id='line_1_7' title="bbox 417 68 437 70; baseline 0 1360"><span class='ocrx_word' id='word_1_15' title='bbox 417 68 437 70; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 6 119 397 121">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 6 119 397 121">
+     <span class='ocr_line' id='line_1_8' title="bbox 6 119 397 121; baseline 0 1309"><span class='ocrx_word' id='word_1_16' title='bbox 6 119 397 121; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 6 119 8 1411">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 6 119 8 1411">
+     <span class='ocr_line' id='line_1_9' title="bbox 6 119 8 1411; baseline 0 19"><span class='ocrx_word' id='word_1_17' title='bbox 6 119 8 1411; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 428 123 528 125">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 428 123 528 125">
+     <span class='ocr_line' id='line_1_10' title="bbox 428 123 528 125; baseline 0 1305"><span class='ocrx_word' id='word_1_18' title='bbox 428 123 528 125; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 426 123 428 161">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 426 123 428 161">
+     <span class='ocr_line' id='line_1_11' title="bbox 426 123 428 161; baseline 0 1269"><span class='ocrx_word' id='word_1_19' title='bbox 426 123 428 161; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 428 160 516 161">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 428 160 516 161">
+     <span class='ocr_line' id='line_1_12' title="bbox 428 160 516 161; baseline 0 1269"><span class='ocrx_word' id='word_1_20' title='bbox 428 160 516 161; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 395 13 397 228">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 395 13 397 228">
+     <span class='ocr_line' id='line_1_13' title="bbox 395 13 397 228; baseline 0 1202"><span class='ocrx_word' id='word_1_21' title='bbox 395 13 397 228; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 395 226 417 228">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 395 226 417 228">
+     <span class='ocr_line' id='line_1_14' title="bbox 395 226 417 228; baseline 0 1202"><span class='ocrx_word' id='word_1_22' title='bbox 395 226 417 228; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 415 68 419 349">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 415 68 419 349">
+     <span class='ocr_line' id='line_1_15' title="bbox 415 68 419 349; baseline 0 1081"><span class='ocrx_word' id='word_1_23' title='bbox 415 68 419 349; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 435 50 437 88">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 435 50 437 88">
+     <span class='ocr_line' id='line_1_16' title="bbox 435 50 437 88; baseline 0 1342"><span class='ocrx_word' id='word_1_24' title='bbox 435 50 437 88; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 437 86 519 88">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 437 86 519 88">
+     <span class='ocr_line' id='line_1_17' title="bbox 437 86 519 88; baseline 0 1342"><span class='ocrx_word' id='word_1_25' title='bbox 437 86 519 88; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 433 77 1193 896">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 433 77 1000 250">
+     <span class='ocr_line' id='line_1_18' title="bbox 525 77 951 102; baseline 0 -5"><span class='ocrx_word' id='word_1_26' title='bbox 525 78 546 97; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_27' title='bbox 558 78 644 97; x_wconf 83' lang='eng' dir='ltr'>anthina</span> <span class='ocrx_word' id='word_1_28' title='bbox 655 77 710 97; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_29' title='bbox 720 77 803 97; x_wconf 79' lang='eng' dir='ltr'>20980T</span> <span class='ocrx_word' id='word_1_30' title='bbox 812 78 951 102; x_wconf 87' lang='eng' dir='ltr'>(AF456059)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 534 114 1000 139; baseline 0 -5"><span class='ocrx_word' id='word_1_31' title='bbox 534 114 555 134; x_wconf 90' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_32' title='bbox 566 114 703 134; x_wconf 80' lang='eng' dir='ltr'><em>multivorans</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 713 114 767 134; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_34' title='bbox 779 114 851 134; x_wconf 92' lang='eng'>16660</span> <span class='ocrx_word' id='word_1_35' title='bbox 861 114 1000 139; x_wconf 89' lang='eng' dir='ltr'>(AF143774)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 523 151 940 176; baseline 0 -5"><span class='ocrx_word' id='word_1_36' title='bbox 523 151 543 171; x_wconf 90' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_37' title='bbox 556 151 633 171; x_wconf 86' lang='eng' dir='ltr'><em>do/osa</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 643 151 698 171; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_39' title='bbox 710 151 791 171; x_wconf 86' lang='eng' dir='ltr'>18943T</span> <span class='ocrx_word' id='word_1_40' title='bbox 801 151 940 176; x_wconf 87' lang='eng' dir='ltr'>(AF323971)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 433 187 960 213; baseline -0.004 -3"><span class='ocrx_word' id='word_1_41' title='bbox 433 194 535 210; x_wconf 90' lang='eng'>66—</span> <span class='ocrx_word' id='word_1_42' title='bbox 543 188 564 208; x_wconf 90' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 577 188 668 213; x_wconf 82' lang='eng' dir='ltr'>cepac/a</span> <span class='ocrx_word' id='word_1_44' title='bbox 678 188 733 208; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_45' title='bbox 745 187 811 208; x_wconf 78' lang='eng' dir='ltr'>1222T</span> <span class='ocrx_word' id='word_1_46' title='bbox 820 188 960 213; x_wconf 87' lang='eng' dir='ltr'>(AF143786)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 462 224 994 250; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 462 225 560 244; x_wconf 91' lang='eng' dir='ltr'><em>—B.</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 571 225 687 250; x_wconf 83' lang='eng' dir='ltr'>pyrrocinia</span> <span class='ocrx_word' id='word_1_49' title='bbox 698 225 752 245; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_50' title='bbox 764 224 846 245; x_wconf 75' lang='eng' dir='ltr'>14191T</span> <span class='ocrx_word' id='word_1_51' title='bbox 856 225 994 250; x_wconf 86' lang='eng' dir='ltr'>(AF143794)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 444 261 1165 471">
+     <span class='ocr_line' id='line_1_23' title="bbox 583 261 1111 286; baseline 0 -5"><span class='ocrx_word' id='word_1_52' title='bbox 583 262 604 281; x_wconf 90' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_53' title='bbox 616 262 766 286; x_wconf 78' lang='eng' dir='ltr'>Genocepacia</span> <span class='ocrx_word' id='word_1_54' title='bbox 776 262 813 281; x_wconf 95' lang='eng' dir='ltr'><strong>IIIB</strong></span> <span class='ocrx_word' id='word_1_55' title='bbox 824 261 879 281; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_56' title='bbox 891 262 962 281; x_wconf 93' lang='eng'>16659</span> <span class='ocrx_word' id='word_1_57' title='bbox 972 262 1111 286; x_wconf 88' lang='eng' dir='ltr'>(AF143783)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 553 297 974 323; baseline 0 -5"><span class='ocrx_word' id='word_1_58' title='bbox 553 298 574 318; x_wconf 91' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 586 298 668 318; x_wconf 74' lang='eng' dir='ltr'>stabi/is</span> <span class='ocrx_word' id='word_1_60' title='bbox 677 298 732 318; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_61' title='bbox 744 297 825 318; x_wconf 76' lang='eng' dir='ltr'>14294T</span> <span class='ocrx_word' id='word_1_62' title='bbox 835 298 974 323; x_wconf 87' lang='eng' dir='ltr'>(AF456031)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 455 335 984 360; baseline 0 -5"><span class='ocrx_word' id='word_1_63' title='bbox 455 335 549 355; x_wconf 41' lang='eng'><em>78.</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 561 335 672 355; x_wconf 82' lang='eng' dir='ltr'>semina/is</span> <span class='ocrx_word' id='word_1_65' title='bbox 682 335 737 355; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_66' title='bbox 747 335 830 355; x_wconf 89' lang='eng' dir='ltr'>24067T</span> <span class='ocrx_word' id='word_1_67' title='bbox 839 335 984 360; x_wconf 87' lang='eng' dir='ltr'>(AM748102)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 444 372 1054 397; baseline 0 -5"><span class='ocrx_word' id='word_1_68' title='bbox 444 372 540 392; x_wconf 92' lang='eng' dir='ltr'><em>—B.</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 552 372 701 397; x_wconf 83' lang='eng' dir='ltr'>cenocepacia</span> <span class='ocrx_word' id='word_1_70' title='bbox 712 372 750 392; x_wconf 93' lang='eng' dir='ltr'><strong>IIIC</strong></span> <span class='ocrx_word' id='word_1_71' title='bbox 761 372 815 392; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_72' title='bbox 828 372 899 392; x_wconf 84' lang='eng'>19239</span> <span class='ocrx_word' id='word_1_73' title='bbox 909 372 1054 397; x_wconf 85' lang='eng' dir='ltr'>(AM748105)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 579 408 1165 434; baseline 0 -5"><span class='ocrx_word' id='word_1_74' title='bbox 579 409 600 429; x_wconf 93' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_75' title='bbox 612 409 761 434; x_wconf 83' lang='eng' dir='ltr'>cenocepacia</span> <span class='ocrx_word' id='word_1_76' title='bbox 772 409 810 429; x_wconf 91' lang='eng' dir='ltr'><strong>IIIA</strong></span> <span class='ocrx_word' id='word_1_77' title='bbox 819 409 875 429; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_78' title='bbox 886 408 965 429; x_wconf 79' lang='eng' dir='ltr'>16656T</span> <span class='ocrx_word' id='word_1_79' title='bbox 975 409 1051 434; x_wconf 88' lang='eng' dir='ltr'>(whole</span> <span class='ocrx_word' id='word_1_80' title='bbox 1061 409 1165 434; x_wconf 86' lang='eng' dir='ltr'>genome)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 482 446 1121 471; baseline -0.002 -5"><span class='ocrx_word' id='word_1_81' title='bbox 482 446 612 465; x_wconf 90' lang='eng' dir='ltr'><em>—B.</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 625 446 774 471; x_wconf 80' lang='eng' dir='ltr'>cenocepacia</span> <span class='ocrx_word' id='word_1_83' title='bbox 784 446 823 465; x_wconf 95' lang='eng' dir='ltr'><strong>IIID</strong></span> <span class='ocrx_word' id='word_1_84' title='bbox 834 446 889 466; x_wconf 89' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_85' title='bbox 898 446 967 466; x_wconf 87' lang='eng'>21461</span> <span class='ocrx_word' id='word_1_86' title='bbox 982 446 1121 471; x_wconf 91' lang='eng' dir='ltr'>(AF456021)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 595 482 1018 507">
+     <span class='ocr_line' id='line_1_29' title="bbox 595 482 1018 507; baseline 0 -5"><span class='ocrx_word' id='word_1_87' title='bbox 595 483 615 502; x_wconf 87' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_88' title='bbox 628 482 705 502; x_wconf 86' lang='eng' dir='ltr'><em>diffusa</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 715 482 770 502; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_90' title='bbox 780 482 863 502; x_wconf 87' lang='eng' dir='ltr'>24065T</span> <span class='ocrx_word' id='word_1_91' title='bbox 873 483 1018 507; x_wconf 87' lang='eng' dir='ltr'>(AM748103)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 471 491 1193 896">
+     <span class='ocr_line' id='line_1_30' title="bbox 471 491 959 544; baseline 0 -5"><span class='ocrx_word' id='word_1_92' title='bbox 471 491 649 539; x_wconf 42' lang='eng' dir='ltr'>53—719.].3tens</span> <span class='ocrx_word' id='word_1_93' title='bbox 659 519 713 539; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_94' title='bbox 723 519 804 539; x_wconf 78' lang='eng' dir='ltr'>24064T</span> <span class='ocrx_word' id='word_1_95' title='bbox 813 519 959 544; x_wconf 83' lang='eng' dir='ltr'>(AM922300)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 478 555 1046 581; baseline 0.002 -6"><span class='ocrx_word' id='word_1_96' title='bbox 478 556 618 575; x_wconf 91' lang='eng' dir='ltr'><em>—B.</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 631 556 739 576; x_wconf 82' lang='eng' dir='ltr'><em>ambifaria</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 749 556 804 576; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_99' title='bbox 816 555 898 576; x_wconf 87' lang='eng' dir='ltr'>19182T</span> <span class='ocrx_word' id='word_1_100' title='bbox 907 556 1046 581; x_wconf 83' lang='eng' dir='ltr'>(AF323985)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 480 592 1023 618; baseline 0 -5"><span class='ocrx_word' id='word_1_101' title='bbox 480 601 588 603; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_102' title='bbox 597 593 617 613; x_wconf 90' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_103' title='bbox 630 593 711 613; x_wconf 82' lang='eng' dir='ltr'>arbor/s</span> <span class='ocrx_word' id='word_1_104' title='bbox 720 592 775 613; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_105' title='bbox 785 592 868 613; x_wconf 70' lang='eng' dir='ltr'>24066T</span> <span class='ocrx_word' id='word_1_106' title='bbox 878 593 1023 618; x_wconf 83' lang='eng' dir='ltr'>(AM748095)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 614 618 1193 668; baseline 0 -18"><span class='ocrx_word' id='word_1_107' title='bbox 614 630 635 650; x_wconf 78' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_108' title='bbox 647 630 751 650; x_wconf 74' lang='eng' dir='ltr'>meta/lice</span> <span class='ocrx_word' id='word_1_109' title='bbox 762 630 817 650; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_110' title='bbox 827 629 910 650; x_wconf 79' lang='eng' dir='ltr'>24068T</span> <span class='ocrx_word' id='word_1_111' title='bbox 920 630 1059 655; x_wconf 84' lang='eng' dir='ltr'>(AF456103)</span> <span class='ocrx_word' id='word_1_112' title='bbox 1115 622 1126 646; x_wconf 47' lang='eng'><strong>\</strong></span> <span class='ocrx_word' id='word_1_113' title='bbox 1181 618 1193 668; x_wconf 59' lang='eng'>\</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 565 666 1053 692; baseline -0.002 -5"><span class='ocrx_word' id='word_1_114' title='bbox 565 667 586 686; x_wconf 88' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_115' title='bbox 598 667 749 687; x_wconf 83' lang='eng' dir='ltr'>contaminans</span> <span class='ocrx_word' id='word_1_116' title='bbox 759 667 813 687; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_117' title='bbox 824 666 905 687; x_wconf 81' lang='eng' dir='ltr'>23361T</span> <span class='ocrx_word' id='word_1_118' title='bbox 914 667 1053 692; x_wconf 87' lang='eng' dir='ltr'>(AF456121)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 569 704 1034 728; baseline 0 -5"><span class='ocrx_word' id='word_1_119' title='bbox 569 711 575 713; x_wconf 85' lang='eng'><em>-</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 584 704 605 723; x_wconf 91' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_121' title='bbox 617 704 769 723; x_wconf 69' lang='eng' dir='ltr'>Bantam/Hans</span> <span class='ocrx_word' id='word_1_122' title='bbox 778 704 879 723; x_wconf 87' lang='eng' dir='ltr'>R—20938</span> <span class='ocrx_word' id='word_1_123' title='bbox 889 704 1034 728; x_wconf 86' lang='eng' dir='ltr'>(AM905035)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 574 740 1034 765; baseline 0 -5"><span class='ocrx_word' id='word_1_124' title='bbox 574 740 611 760; x_wconf 42' lang='eng' dir='ltr'>*B,</span> <span class='ocrx_word' id='word_1_125' title='bbox 624 740 775 760; x_wconf 82' lang='eng' dir='ltr'>contaminans</span> <span class='ocrx_word' id='word_1_126' title='bbox 784 740 885 760; x_wconf 84' lang='eng' dir='ltr'>R-13528</span> <span class='ocrx_word' id='word_1_127' title='bbox 895 740 1034 765; x_wconf 82' lang='eng' dir='ltr'>(AF456073)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 585 777 1139 829; baseline 0.002 -33"><span class='ocrx_word' id='word_1_128' title='bbox 585 777 605 796; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_129' title='bbox 617 777 769 797; x_wconf 82' lang='eng' dir='ltr'>contaminans</span> <span class='ocrx_word' id='word_1_130' title='bbox 779 777 879 797; x_wconf 88' lang='eng' dir='ltr'>R-18442</span> <span class='ocrx_word' id='word_1_131' title='bbox 889 777 1034 802; x_wconf 85' lang='eng' dir='ltr'>(AM905034)</span> <span class='ocrx_word' id='word_1_132' title='bbox 1128 786 1139 829; x_wconf 62' lang='eng'>&gt;</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 573 814 1081 896; baseline 0 -63"><span class='ocrx_word' id='word_1_133' title='bbox 573 819 619 896; x_wconf 42' lang='eng' dir='ltr'>E)“</span> <span class='ocrx_word' id='word_1_134' title='bbox 631 814 652 833; x_wconf 94' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_135' title='bbox 664 814 815 833; x_wconf 79' lang='eng' dir='ltr'>contaminans</span> <span class='ocrx_word' id='word_1_136' title='bbox 825 814 925 833; x_wconf 85' lang='eng' dir='ltr'>R-18428</span> <span class='ocrx_word' id='word_1_137' title='bbox 936 814 1081 838; x_wconf 86' lang='eng' dir='ltr'>(AM905037)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 438 215 462 217">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 438 215 462 217">
+     <span class='ocr_line' id='line_1_39' title="bbox 438 215 462 217; baseline 0 1213"><span class='ocrx_word' id='word_1_138' title='bbox 438 215 462 217; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 461 196 462 235">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 461 196 462 235">
+     <span class='ocr_line' id='line_1_40' title="bbox 461 196 462 235; baseline 0 1195"><span class='ocrx_word' id='word_1_139' title='bbox 461 196 462 235; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 436 50 441 299">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 436 50 441 299">
+     <span class='ocr_line' id='line_1_41' title="bbox 436 50 441 299; baseline 0 1131"><span class='ocrx_word' id='word_1_140' title='bbox 436 50 441 299; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 455 307 540 309">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 455 307 540 309">
+     <span class='ocr_line' id='line_1_42' title="bbox 455 307 540 309; baseline 0 1121"><span class='ocrx_word' id='word_1_141' title='bbox 455 307 540 309; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 451 270 456 345">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 451 270 456 345">
+     <span class='ocr_line' id='line_1_43' title="bbox 451 270 456 345; baseline 0 1085"><span class='ocrx_word' id='word_1_142' title='bbox 451 270 456 345; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 444 413 577 673">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 444 413 577 673">
+     <span class='ocr_line' id='line_1_44' title="bbox 444 413 577 552; baseline 0 -44"><span class='ocrx_word' id='word_1_143' title='bbox 444 413 577 552; x_wconf 95' lang='eng' dir='ltr'>    </span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 458 552 480 673; baseline 0 757"><span class='ocrx_word' id='word_1_144' title='bbox 458 552 480 673; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 442 380 444 497">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 442 380 444 497">
+     <span class='ocr_line' id='line_1_46' title="bbox 442 380 444 497; baseline 0 933"><span class='ocrx_word' id='word_1_145' title='bbox 442 380 444 497; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 476 634 607 1356">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 476 653 592 1356">
+     <span class='ocr_line' id='line_1_47' title="bbox 528 653 568 777; baseline 0 -37"><span class='ocrx_word' id='word_1_146' title='bbox 528 653 568 777; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 476 777 573 934; baseline 0 -120"><span class='ocrx_word' id='word_1_147' title='bbox 476 777 573 934; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 476 934 575 961; baseline 0 469"><span class='ocrx_word' id='word_1_148' title='bbox 476 934 575 961; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 476 961 575 1048; baseline 0 -50"><span class='ocrx_word' id='word_1_149' title='bbox 476 961 575 1048; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 528 1048 592 1125; baseline 0 -13"><span class='ocrx_word' id='word_1_150' title='bbox 528 1048 592 1125; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 528 1125 575 1224; baseline 0 0"><span class='ocrx_word' id='word_1_151' title='bbox 528 1125 560 1224; x_wconf 95' lang='eng' dir='ltr'>   </span> <span class='ocrx_word' id='word_1_152' title='bbox 570 1192 575 1224; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 542 1224 560 1274; baseline 0 156"><span class='ocrx_word' id='word_1_153' title='bbox 542 1224 560 1274; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 555 1331 563 1356; baseline 0 74"><span class='ocrx_word' id='word_1_154' title='bbox 555 1331 563 1356; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 1149 779 1168 834">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 1149 779 1168 834">
+     <span class='ocr_line' id='line_1_55' title="bbox 1149 779 1168 834; textangle 90"><span class='ocrx_word' id='word_1_155' title='bbox 1149 779 1168 834; x_wconf 65' lang='eng' dir='ltr'>Hm!</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 540 846 1139 1300">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 540 846 1139 1300">
+     <span class='ocr_line' id='line_1_56' title="bbox 581 846 1063 875; baseline 0 -5"><span class='ocrx_word' id='word_1_156' title='bbox 581 846 604 862; x_wconf 78' lang='eng'>76</span> <span class='ocrx_word' id='word_1_157' title='bbox 628 851 649 870; x_wconf 95' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_158' title='bbox 661 851 812 870; x_wconf 75' lang='eng' dir='ltr'><em>contaminans</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 822 851 907 870; x_wconf 84' lang='eng' dir='ltr'>R-9896</span> <span class='ocrx_word' id='word_1_160' title='bbox 918 851 1063 875; x_wconf 87' lang='eng' dir='ltr'>(AM905036)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 619 887 1107 913; baseline 0 -6"><span class='ocrx_word' id='word_1_161' title='bbox 619 887 641 907; x_wconf 91' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_162' title='bbox 653 887 804 908; x_wconf 71' lang='eng' dir='ltr'>contaminans</span> <span class='ocrx_word' id='word_1_163' title='bbox 813 887 869 908; x_wconf 88' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_164' title='bbox 881 887 951 908; x_wconf 90' lang='eng'>16227</span> <span class='ocrx_word' id='word_1_165' title='bbox 962 887 1107 913; x_wconf 85' lang='eng' dir='ltr'>(AM922301)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 586 924 1073 949; baseline 0 -5"><span class='ocrx_word' id='word_1_166' title='bbox 586 925 606 944; x_wconf 90' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_167' title='bbox 619 925 770 944; x_wconf 74' lang='eng' dir='ltr'><em>contaminans</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 780 924 835 944; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_169' title='bbox 845 925 918 944; x_wconf 89' lang='eng'>23253</span> <span class='ocrx_word' id='word_1_170' title='bbox 928 925 1073 949; x_wconf 81' lang='eng' dir='ltr'>(AM922303)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 581 961 1068 986; baseline 0 -5"><span class='ocrx_word' id='word_1_171' title='bbox 581 961 602 981; x_wconf 88' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_172' title='bbox 614 961 765 981; x_wconf 83' lang='eng' dir='ltr'><em>contaminans</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 775 961 830 981; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_174' title='bbox 840 961 913 981; x_wconf 85' lang='eng'>23255</span> <span class='ocrx_word' id='word_1_175' title='bbox 923 961 1068 986; x_wconf 82' lang='eng' dir='ltr'>(AM922302)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 577 998 967 1023; baseline 0.003 -6"><span class='ocrx_word' id='word_1_176' title='bbox 577 1005 599 1007; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_177' title='bbox 610 998 631 1017; x_wconf 94' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_178' title='bbox 643 998 684 1018; x_wconf 85' lang='eng' dir='ltr'>Iata</span> <span class='ocrx_word' id='word_1_179' title='bbox 695 998 749 1018; x_wconf 87' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_180' title='bbox 759 998 817 1018; x_wconf 87' lang='eng'>6860</span> <span class='ocrx_word' id='word_1_181' title='bbox 828 998 967 1023; x_wconf 86' lang='eng' dir='ltr'>(AF456069)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 584 1034 960 1059; baseline 0 -5"><span class='ocrx_word' id='word_1_182' title='bbox 584 1042 595 1044; x_wconf 90' lang='eng'><em>-</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 603 1035 624 1054; x_wconf 93' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_184' title='bbox 636 1035 678 1054; x_wconf 83' lang='eng' dir='ltr'>lata</span> <span class='ocrx_word' id='word_1_185' title='bbox 688 1034 743 1054; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_186' title='bbox 753 1035 810 1054; x_wconf 89' lang='eng'>6992</span> <span class='ocrx_word' id='word_1_187' title='bbox 821 1035 960 1059; x_wconf 90' lang='eng' dir='ltr'>(AF456008)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 540 1064 1139 1098; baseline 0 -7"><span class='ocrx_word' id='word_1_188' title='bbox 540 1064 551 1080; x_wconf 76' lang='eng'><strong>3</strong></span> <span class='ocrx_word' id='word_1_189' title='bbox 569 1064 580 1080; x_wconf 82' lang='eng'>5</span> <span class='ocrx_word' id='word_1_190' title='bbox 598 1072 619 1091; x_wconf 93' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_191' title='bbox 631 1072 673 1091; x_wconf 78' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 683 1071 738 1091; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_193' title='bbox 748 1072 806 1091; x_wconf 89' lang='eng'>6863</span> <span class='ocrx_word' id='word_1_194' title='bbox 816 1072 955 1096; x_wconf 88' lang='eng' dir='ltr'>(AF456019)</span> <span class='ocrx_word' id='word_1_195' title='bbox 1128 1078 1139 1098; x_wconf 58' lang='eng'><strong><em>&gt;</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 594 1108 1026 1133; baseline 0 -5"><span class='ocrx_word' id='word_1_196' title='bbox 594 1108 615 1128; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_197' title='bbox 627 1108 669 1128; x_wconf 83' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 679 1108 734 1128; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_199' title='bbox 744 1108 827 1128; x_wconf 79' lang='eng' dir='ltr'>22485T</span> <span class='ocrx_word' id='word_1_200' title='bbox 837 1108 913 1133; x_wconf 90' lang='eng' dir='ltr'>(whole</span> <span class='ocrx_word' id='word_1_201' title='bbox 923 1108 1026 1133; x_wconf 91' lang='eng' dir='ltr'>genome)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 549 1140 935 1170; baseline -0.003 -5"><span class='ocrx_word' id='word_1_202' title='bbox 549 1140 559 1156; x_wconf 82' lang='eng'>5</span> <span class='ocrx_word' id='word_1_203' title='bbox 578 1145 599 1164; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_204' title='bbox 610 1145 653 1165; x_wconf 78' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_205' title='bbox 663 1145 718 1165; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_206' title='bbox 728 1145 786 1165; x_wconf 86' lang='eng'>6993</span> <span class='ocrx_word' id='word_1_207' title='bbox 796 1145 935 1170; x_wconf 85' lang='eng' dir='ltr'>(AF456124)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_65' title="bbox 577 1182 945 1207; baseline 0 -5"><span class='ocrx_word' id='word_1_208' title='bbox 577 1182 631 1202; x_wconf 41' lang='eng'><em>*8.</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 643 1182 685 1202; x_wconf 82' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 695 1182 795 1202; x_wconf 88' lang='eng' dir='ltr'>R—18628</span> <span class='ocrx_word' id='word_1_211' title='bbox 806 1182 945 1207; x_wconf 86' lang='eng' dir='ltr'>(AF456087)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_66' title="bbox 577 1219 928 1300; baseline 0 -62"><span class='ocrx_word' id='word_1_212' title='bbox 577 1219 630 1300; x_wconf 35' lang='eng'>{(8.</span> <span class='ocrx_word' id='word_1_213' title='bbox 641 1219 683 1239; x_wconf 80' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_214' title='bbox 694 1219 779 1239; x_wconf 84' lang='eng' dir='ltr'>R-9940</span> <span class='ocrx_word' id='word_1_215' title='bbox 789 1219 928 1244; x_wconf 90' lang='eng' dir='ltr'>(AF456011)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 479 454 482 943">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 479 454 482 943">
+     <span class='ocr_line' id='line_1_67' title="bbox 479 454 482 943; baseline 0 487"><span class='ocrx_word' id='word_1_216' title='bbox 479 454 482 943; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 476 564 482 943">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 476 564 482 943">
+     <span class='ocr_line' id='line_1_68' title="bbox 476 564 482 943; baseline 0 487"><span class='ocrx_word' id='word_1_217' title='bbox 476 564 482 943; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 478 564 484 943">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 478 564 484 943">
+     <span class='ocr_line' id='line_1_69' title="bbox 478 564 484 943; baseline 0 487"><span class='ocrx_word' id='word_1_218' title='bbox 478 564 484 943; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 569 711 574 970">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 569 711 574 970">
+     <span class='ocr_line' id='line_1_70' title="bbox 569 711 574 970; baseline 0 460"><span class='ocrx_word' id='word_1_219' title='bbox 569 711 574 970; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 571 748 574 970">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 571 748 574 970">
+     <span class='ocr_line' id='line_1_71' title="bbox 571 748 574 970; baseline 0 460"><span class='ocrx_word' id='word_1_220' title='bbox 571 748 574 970; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 1115 970 1237 1054">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 1115 970 1237 1054">
+     <span class='ocr_line' id='line_1_72' title="bbox 1115 970 1126 1010; textangle 90"><span class='ocrx_word' id='word_1_221' title='bbox 1115 970 1126 1010; x_wconf 61' lang='eng' dir='ltr'>J\</span> 
+     </span>
+     <span class='ocr_line' id='line_1_73' title="bbox 1195 982 1205 1046; textangle 90"><span class='ocrx_word' id='word_1_222' title='bbox 1195 982 1205 1046; x_wconf 63' lang='eng' dir='ltr'><strong>V</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_74' title="bbox 1217 974 1237 1054; textangle 90"><span class='ocrx_word' id='word_1_223' title='bbox 1217 974 1237 1054; x_wconf 61' lang='eng' dir='ltr'>MUOXQL</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 575 1005 577 1062">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 575 1005 577 1062">
+     <span class='ocr_line' id='line_1_75' title="bbox 575 1005 577 1062; baseline 0 368"><span class='ocrx_word' id='word_1_224' title='bbox 575 1005 577 1062; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 1149 1061 1168 1121">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 1149 1061 1168 1121">
+     <span class='ocr_line' id='line_1_76' title="bbox 1149 1061 1168 1121; textangle 90"><span class='ocrx_word' id='word_1_225' title='bbox 1149 1061 1168 1121; x_wconf 50' lang='eng'>&quot;#391</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 1115 1166 1126 1202">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 1115 1166 1126 1202">
+     <span class='ocr_line' id='line_1_77' title="bbox 1115 1166 1126 1202; textangle 90"><span class='ocrx_word' id='word_1_226' title='bbox 1115 1166 1126 1202; x_wconf 64' lang='eng' dir='ltr'>JK</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 560 1200 570 1216">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 560 1200 570 1216">
+     <span class='ocr_line' id='line_1_78' title="bbox 560 1200 570 1216; baseline 0 0"><span class='ocrx_word' id='word_1_227' title='bbox 560 1200 570 1216; x_wconf 85' lang='eng'>3</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 575 1189 577 1255">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 575 1189 577 1255">
+     <span class='ocr_line' id='line_1_79' title="bbox 575 1189 577 1255; baseline 0 -39"><span class='ocrx_word' id='word_1_228' title='bbox 575 1189 577 1255; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 528 1256 1193 1410">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 528 1256 1193 1410">
+     <span class='ocr_line' id='line_1_80' title="bbox 624 1256 943 1280; baseline 0 -5"><span class='ocrx_word' id='word_1_229' title='bbox 624 1256 644 1275; x_wconf 95' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_230' title='bbox 656 1256 698 1275; x_wconf 82' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_231' title='bbox 708 1256 789 1275; x_wconf 85' lang='eng' dir='ltr'>R-3211</span> <span class='ocrx_word' id='word_1_232' title='bbox 803 1256 943 1280; x_wconf 88' lang='eng' dir='ltr'>(AF456078)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_81' title="bbox 528 1283 1139 1317; baseline 0 -5"><span class='ocrx_word' id='word_1_233' title='bbox 528 1295 550 1312; x_wconf 85' lang='eng'>53</span> <span class='ocrx_word' id='word_1_234' title='bbox 577 1288 600 1304; x_wconf 81' lang='eng'>50</span> <span class='ocrx_word' id='word_1_235' title='bbox 615 1293 636 1312; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_236' title='bbox 648 1293 690 1312; x_wconf 84' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_237' title='bbox 700 1293 800 1312; x_wconf 81' lang='eng' dir='ltr'>R-23139</span> <span class='ocrx_word' id='word_1_238' title='bbox 811 1293 956 1317; x_wconf 85' lang='eng' dir='ltr'>(AM905032)</span> <span class='ocrx_word' id='word_1_239' title='bbox 1128 1283 1139 1308; x_wconf 69' lang='eng'>&gt;</span> 
+     </span>
+     <span class='ocr_line' id='line_1_82' title="bbox 565 1329 985 1354; baseline 0 -5"><span class='ocrx_word' id='word_1_240' title='bbox 565 1336 600 1338; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_241' title='bbox 614 1329 635 1349; x_wconf 74' lang='eng'>8.</span> <span class='ocrx_word' id='word_1_242' title='bbox 646 1329 688 1349; x_wconf 79' lang='eng' dir='ltr'>lata</span> <span class='ocrx_word' id='word_1_243' title='bbox 699 1329 753 1349; x_wconf 89' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_244' title='bbox 765 1329 837 1349; x_wconf 83' lang='eng'>14095</span> <span class='ocrx_word' id='word_1_245' title='bbox 847 1329 985 1354; x_wconf 89' lang='eng' dir='ltr'>(AF456016)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_83' title="bbox 565 1360 1193 1410; baseline 0.003 -25"><span class='ocrx_word' id='word_1_246' title='bbox 565 1372 600 1374; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_247' title='bbox 608 1366 629 1385; x_wconf 93' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_248' title='bbox 641 1366 683 1386; x_wconf 84' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_249' title='bbox 693 1366 793 1386; x_wconf 89' lang='eng' dir='ltr'>R-15816</span> <span class='ocrx_word' id='word_1_250' title='bbox 803 1366 948 1391; x_wconf 82' lang='eng' dir='ltr'>(AM905033)</span> <span class='ocrx_word' id='word_1_251' title='bbox 1181 1360 1193 1410; x_wconf 61' lang='eng'><em>/</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 1149 1265 1168 1329">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 1149 1265 1168 1329">
+     <span class='ocr_line' id='line_1_84' title="bbox 1149 1265 1168 1329; textangle 90"><span class='ocrx_word' id='word_1_252' title='bbox 1149 1265 1168 1329; x_wconf 66' lang='eng' dir='ltr'>||H7091</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 1192 656 1195 1372">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 1192 656 1195 1372">
+     <span class='ocr_line' id='line_1_85' title="bbox 1192 656 1195 1372; baseline 0 58"><span class='ocrx_word' id='word_1_253' title='bbox 1192 656 1195 1372; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 563 1336 565 1374">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 563 1336 565 1374">
+     <span class='ocr_line' id='line_1_86' title="bbox 563 1336 565 1374; baseline 0 56"><span class='ocrx_word' id='word_1_254' title='bbox 563 1336 565 1374; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 1126 640 1128 1392">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 1126 640 1128 1392">
+     <span class='ocr_line' id='line_1_87' title="bbox 1126 640 1128 1392; baseline 0 38"><span class='ocrx_word' id='word_1_255' title='bbox 1126 640 1128 1392; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 136 1402 610 1427">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 136 1402 610 1427">
+     <span class='ocr_line' id='line_1_88' title="bbox 136 1402 610 1427; baseline 0 -5"><span class='ocrx_word' id='word_1_256' title='bbox 136 1403 157 1422; x_wconf 93' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_257' title='bbox 168 1408 307 1422; x_wconf 76' lang='eng' dir='ltr'>xenovorans</span> <span class='ocrx_word' id='word_1_258' title='bbox 316 1403 371 1422; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_259' title='bbox 381 1402 464 1422; x_wconf 83' lang='eng' dir='ltr'>21463T</span> <span class='ocrx_word' id='word_1_260' title='bbox 474 1403 610 1427; x_wconf 86' lang='eng' dir='ltr'>(AJ544489)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-003.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-003.pbm.png
new file mode 100644
index 00000000..f814edc6
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-003.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-003.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-003.pbm.png.hocr
new file mode 100644
index 00000000..86ec50a0
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001123-0-003.pbm.png.hocr
@@ -0,0 +1,270 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001123-0-003.pbm.png"; bbox 0 0 758 623; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 26 97 54 111">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 26 97 54 111">
+     <span class='ocr_line' id='line_1_1' title="bbox 26 97 54 111; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 26 97 54 111; x_wconf 85' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 152 63 181 78">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 152 63 181 78">
+     <span class='ocr_line' id='line_1_2' title="bbox 152 63 181 78; baseline 0.034 -1"><span class='ocrx_word' id='word_1_2' title='bbox 152 63 181 78; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 331 3 757 70">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 331 3 757 70">
+     <span class='ocr_line' id='line_1_3' title="bbox 331 3 757 31; baseline 0 -6"><span class='ocrx_word' id='word_1_3' title='bbox 331 4 483 31; x_wconf 84' lang='eng' dir='ltr'><em>Cupriavidus</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 492 4 665 25; x_wconf 87' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 674 3 757 25; x_wconf 80' lang='eng' dir='ltr'><em>CH34T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 339 48 680 70; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 339 60 384 62; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_7' title='bbox 395 49 418 70; x_wconf 93' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 429 54 579 70; x_wconf 88' lang='eng' dir='ltr'><em>xenovorans</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 589 48 680 70; x_wconf 87' lang='eng' dir='ltr'><em>LB400T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 153 82 339 84">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 153 82 339 84">
+     <span class='ocr_line' id='line_1_5' title="bbox 153 82 339 84; baseline 0 539"><span class='ocrx_word' id='word_1_10' title='bbox 153 82 339 84; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 20 117 155 119">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 20 117 155 119">
+     <span class='ocr_line' id='line_1_6' title="bbox 20 117 155 119; baseline 0 504"><span class='ocrx_word' id='word_1_11' title='bbox 20 117 155 119; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 4 15 6 215">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 4 15 6 215">
+     <span class='ocr_line' id='line_1_7' title="bbox 4 15 6 215; baseline 0 408"><span class='ocrx_word' id='word_1_12' title='bbox 4 15 6 215; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 4 213 22 215">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 4 213 22 215">
+     <span class='ocr_line' id='line_1_8' title="bbox 4 213 22 215; baseline 0 408"><span class='ocrx_word' id='word_1_13' title='bbox 4 213 22 215; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 20 117 22 312">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 20 117 22 312">
+     <span class='ocr_line' id='line_1_9' title="bbox 20 117 22 312; baseline 0 311"><span class='ocrx_word' id='word_1_14' title='bbox 20 117 22 312; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 159 214 187 228">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 159 214 187 228">
+     <span class='ocr_line' id='line_1_10' title="bbox 159 214 187 228; baseline 0 0"><span class='ocrx_word' id='word_1_15' title='bbox 159 214 187 228; x_wconf 88' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 337 60 339 107">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 337 60 339 107">
+     <span class='ocr_line' id='line_1_11' title="bbox 337 60 339 107; baseline 0 516"><span class='ocrx_word' id='word_1_16' title='bbox 337 60 339 107; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 339 91 674 119">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 339 91 674 119">
+     <span class='ocr_line' id='line_1_12' title="bbox 339 91 674 119; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 339 92 410 113; x_wconf 93' lang='eng' dir='ltr'><em>—B.</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 421 92 587 119; x_wconf 86' lang='eng' dir='ltr'><em>phytofirmans</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 597 91 674 113; x_wconf 88' lang='eng' dir='ltr'><em>PsJNT</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 155 139 542 167">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 155 139 542 167">
+     <span class='ocr_line' id='line_1_13' title="bbox 155 139 542 167; baseline 0 -6"><span class='ocrx_word' id='word_1_20' title='bbox 155 151 239 153; x_wconf 95' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_21' title='bbox 246 140 269 161; x_wconf 93' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 280 140 414 167; x_wconf 83' lang='eng' dir='ltr'><em>phymatum</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 424 139 542 161; x_wconf 88' lang='eng' dir='ltr'><em>STM815T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 289 187 609 209">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 289 187 609 209">
+     <span class='ocr_line' id='line_1_14' title="bbox 289 187 609 209; baseline 0 0"><span class='ocrx_word' id='word_1_24' title='bbox 289 188 344 209; x_wconf 94' lang='eng' dir='ltr'><em>—B.</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 357 188 524 209; x_wconf 84' lang='eng' dir='ltr'><em>thai/andensis</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 534 187 609 209; x_wconf 74' lang='eng' dir='ltr'><em>E264T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 153 232 289 234">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 153 232 289 234">
+     <span class='ocr_line' id='line_1_15' title="bbox 153 232 289 234; baseline 0 389"><span class='ocrx_word' id='word_1_27' title='bbox 153 232 289 234; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 20 311 154 313">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 20 311 154 313">
+     <span class='ocr_line' id='line_1_16' title="bbox 20 311 154 313; baseline 0 310"><span class='ocrx_word' id='word_1_28' title='bbox 20 311 154 313; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 24 318 53 333">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 24 318 53 333">
+     <span class='ocr_line' id='line_1_17' title="bbox 24 318 53 333; baseline 0.034 -1"><span class='ocrx_word' id='word_1_29' title='bbox 24 318 53 333; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 88 443 111 457">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 88 443 111 457">
+     <span class='ocr_line' id='line_1_18' title="bbox 88 443 111 457; baseline 0 0"><span class='ocrx_word' id='word_1_30' title='bbox 88 443 111 457; x_wconf 88' lang='eng'><em>0.1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 152 82 155 390">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 152 82 155 390">
+     <span class='ocr_line' id='line_1_19' title="bbox 152 82 155 390; baseline 0 233"><span class='ocrx_word' id='word_1_31' title='bbox 152 82 155 390; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 152 388 230 390">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 152 388 230 390">
+     <span class='ocr_line' id='line_1_20' title="bbox 152 388 230 390; baseline 0 233"><span class='ocrx_word' id='word_1_32' title='bbox 152 388 230 390; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 151 398 179 412">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 151 398 179 412">
+     <span class='ocr_line' id='line_1_21' title="bbox 151 398 179 412; baseline 0 0"><span class='ocrx_word' id='word_1_33' title='bbox 151 398 179 412; x_wconf 85' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 228 336 230 444">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 228 336 230 444">
+     <span class='ocr_line' id='line_1_22' title="bbox 228 336 230 444; baseline 0 179"><span class='ocrx_word' id='word_1_34' title='bbox 228 336 230 444; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 255 432 286 452">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 255 432 286 452">
+     <span class='ocr_line' id='line_1_23' title="bbox 255 432 286 452; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 255 432 286 452; x_wconf 70' lang='eng'><em>109</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 228 442 249 444">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 228 442 249 444">
+     <span class='ocr_line' id='line_1_24' title="bbox 228 442 249 444; baseline 0 179"><span class='ocrx_word' id='word_1_36' title='bbox 228 442 249 444; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 214 450 242 464">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 214 450 242 464">
+     <span class='ocr_line' id='line_1_25' title="bbox 214 450 242 464; baseline 0 0"><span class='ocrx_word' id='word_1_37' title='bbox 214 450 242 464; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 287 198 289 268">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 287 198 289 268">
+     <span class='ocr_line' id='line_1_26' title="bbox 287 198 289 268; baseline 0 355"><span class='ocrx_word' id='word_1_38' title='bbox 287 198 289 268; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 287 231 632 299">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 287 231 632 299">
+     <span class='ocr_line' id='line_1_27' title="bbox 289 231 632 291; baseline 0 -39"><span class='ocrx_word' id='word_1_39' title='bbox 289 243 333 291; x_wconf 36' lang='eng'><em>4[</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 341 231 364 252; x_wconf 90' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 375 231 546 257; x_wconf 87' lang='eng' dir='ltr'><em>pseudomal/ei</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 556 231 632 253; x_wconf 87' lang='eng' dir='ltr'>1710b</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 287 274 624 299; baseline 0 -1"><span class='ocrx_word' id='word_1_43' title='bbox 287 274 316 289; x_wconf 65' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 339 277 362 298; x_wconf 94' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 374 277 450 299; x_wconf 86' lang='eng' dir='ltr'><em>mal/ei</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 459 277 535 299; x_wconf 93' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 548 277 624 299; x_wconf 87' lang='eng'><em>10247</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 289 325 652 347">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 289 325 652 347">
+     <span class='ocr_line' id='line_1_29' title="bbox 289 325 652 347; baseline 0 0"><span class='ocrx_word' id='word_1_48' title='bbox 289 326 312 347; x_wconf 63' lang='eng' dir='ltr'><em>B,</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 324 326 471 347; x_wconf 83' lang='eng' dir='ltr'><em>multivorans</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 478 325 552 347; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 565 325 652 347; x_wconf 79' lang='eng' dir='ltr'><em>17616T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 249 369 555 392">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 249 369 555 392">
+     <span class='ocr_line' id='line_1_30' title="bbox 249 369 555 392; baseline 0.003 -1"><span class='ocrx_word' id='word_1_52' title='bbox 249 381 307 383; x_wconf 98' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_53' title='bbox 313 370 336 391; x_wconf 92' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 349 370 432 392; x_wconf 85' lang='eng' dir='ltr'><em>dolosa</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 440 369 555 392; x_wconf 88' lang='eng' dir='ltr'><em>AU0158T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 288 418 595 440">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 288 418 595 440">
+     <span class='ocr_line' id='line_1_31' title="bbox 288 418 595 440; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 288 427 331 429; x_wconf 94' lang='eng'>—</span> <span class='ocrx_word' id='word_1_57' title='bbox 338 419 361 440; x_wconf 93' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 373 418 489 440; x_wconf 84' lang='eng' dir='ltr'><em>ambifan&#39;a</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 496 418 595 440; x_wconf 74' lang='eng' dir='ltr'><em>AMMDT</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 286 427 288 475">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 286 427 288 475">
+     <span class='ocr_line' id='line_1_32' title="bbox 286 427 288 475; baseline 0 148"><span class='ocrx_word' id='word_1_60' title='bbox 286 427 288 475; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 247 381 249 504">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 247 381 249 504">
+     <span class='ocr_line' id='line_1_33' title="bbox 247 381 249 504; baseline 0 119"><span class='ocrx_word' id='word_1_61' title='bbox 247 381 249 504; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 247 502 274 504">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 247 502 274 504">
+     <span class='ocr_line' id='line_1_34' title="bbox 247 502 274 504; baseline 0 119"><span class='ocrx_word' id='word_1_62' title='bbox 247 502 274 504; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 239 510 268 524">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 239 510 268 524">
+     <span class='ocr_line' id='line_1_35' title="bbox 239 510 268 524; baseline 0 0"><span class='ocrx_word' id='word_1_63' title='bbox 239 510 268 524; x_wconf 85' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 272 451 274 556">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 272 451 274 556">
+     <span class='ocr_line' id='line_1_36' title="bbox 272 451 274 556; baseline 0 67"><span class='ocrx_word' id='word_1_64' title='bbox 272 451 274 556; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 288 463 632 535">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 288 463 632 535">
+     <span class='ocr_line' id='line_1_37' title="bbox 288 463 611 484; baseline 0 0"><span class='ocrx_word' id='word_1_65' title='bbox 288 473 350 475; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_66' title='bbox 357 464 380 484; x_wconf 71' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 393 464 566 484; x_wconf 80' lang='eng' dir='ltr'><em>vietnamiensis</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 575 463 611 484; x_wconf 90' lang='eng' dir='ltr'><em>G4</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 296 507 632 535; baseline 0.003 -6"><span class='ocrx_word' id='word_1_69' title='bbox 296 519 331 521; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_70' title='bbox 339 508 362 529; x_wconf 94' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 374 508 534 535; x_wconf 85' lang='eng' dir='ltr'><em>cenocepacia</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 544 507 632 530; x_wconf 81' lang='eng' dir='ltr'><em>J2315T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 272 554 296 556">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 272 554 296 556">
+     <span class='ocr_line' id='line_1_39' title="bbox 272 554 296 556; baseline 0 67"><span class='ocrx_word' id='word_1_73' title='bbox 272 554 296 556; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 262 560 290 574">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 262 560 290 574">
+     <span class='ocr_line' id='line_1_40' title="bbox 262 560 290 574; baseline 0 0"><span class='ocrx_word' id='word_1_74' title='bbox 262 560 290 574; x_wconf 88' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 295 520 296 589">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 295 520 296 589">
+     <span class='ocr_line' id='line_1_41' title="bbox 295 520 296 589; baseline 0 34"><span class='ocrx_word' id='word_1_75' title='bbox 295 520 296 589; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 288 552 657 619">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 288 552 657 619">
+     <span class='ocr_line' id='line_1_42' title="bbox 324 552 501 574; baseline 0 0"><span class='ocrx_word' id='word_1_76' title='bbox 324 565 344 567; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_77' title='bbox 350 553 376 574; x_wconf 95' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 387 553 435 574; x_wconf 75' lang='eng' dir='ltr'><em>[are</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 445 552 501 574; x_wconf 78' lang='eng' dir='ltr'><em>383T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 288 593 657 619; baseline 0 0"><span class='ocrx_word' id='word_1_80' title='bbox 288 593 317 608; x_wconf 63' lang='eng'><em>10°</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 324 611 346 613; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_82' title='bbox 354 597 379 619; x_wconf 92' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 391 597 567 619; x_wconf 85' lang='eng' dir='ltr'><em>contaminans</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 577 597 657 619; x_wconf 91' lang='eng' dir='ltr'><em>SAR-1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 295 588 324 590">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 295 588 324 590">
+     <span class='ocr_line' id='line_1_44' title="bbox 295 588 324 590; baseline 0 33"><span class='ocrx_word' id='word_1_85' title='bbox 295 588 324 590; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 322 565 324 613">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 322 565 324 613">
+     <span class='ocr_line' id='line_1_45' title="bbox 322 565 324 613; baseline 0 10"><span class='ocrx_word' id='word_1_86' title='bbox 322 565 324 613; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-003.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-003.pbm.png
new file mode 100644
index 00000000..298d11f5
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-003.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-003.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-003.pbm.png.hocr
new file mode 100644
index 00000000..3d81d54c
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-003.pbm.png.hocr
@@ -0,0 +1,268 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001149-0-003.pbm.png"; bbox 0 0 2012 2610; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 1172 36 1404 68">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 1172 36 1404 68">
+     <span class='ocr_line' id='line_1_1' title="bbox 1172 36 1404 68; baseline 0.004 -6"><span class='ocrx_word' id='word_1_1' title='bbox 1172 42 1191 62; x_wconf 94' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_2' title='bbox 1202 42 1338 68; x_wconf 79' lang='eng' dir='ltr'><strong><em>pyrrhocoris</em></strong></span> <span class='ocrx_word' id='word_1_3' title='bbox 1372 36 1404 68; x_wconf 78' lang='eng' dir='ltr'><strong>n</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 1096 148 1344 181">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 1096 148 1344 181">
+     <span class='ocr_line' id='line_1_2' title="bbox 1096 148 1344 181; baseline 0 -7"><span class='ocrx_word' id='word_1_4' title='bbox 1096 154 1115 174; x_wconf 92' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_5' title='bbox 1125 154 1249 179; x_wconf 75' lang='eng' dir='ltr'><em>pod/ipaevi</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1259 159 1273 169; x_wconf 99' lang='eng'><strong>=</strong></span> <span class='ocrx_word' id='word_1_7' title='bbox 1296 148 1344 181; x_wconf 69' lang='eng' dir='ltr'><strong>m</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 1075 190 1746 202">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 1075 116 1746 223">
+     <span class='ocr_line' id='line_1_3' title="bbox 1075 116 1577 202; baseline 0.002 -70"><span class='ocrx_word' id='word_1_8' title='bbox 1075 116 1577 202; x_wconf 67' lang='eng' dir='ltr'><strong><em>:la...o..oou...o.anuaxenic59L]</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 1221 190 1746 223; baseline 0.006 -8"><span class='ocrx_word' id='word_1_9' title='bbox 1221 190 1460 223; x_wconf 64' lang='eng' dir='ltr'><strong><em>jun-uuua</em></strong></span> <span class='ocrx_word' id='word_1_10' title='bbox 1478 197 1629 223; x_wconf 87' lang='eng' dir='ltr'><strong><em>=L.jaderae</em></strong></span> <span class='ocrx_word' id='word_1_11' title='bbox 1645 202 1746 222; x_wconf 87' lang='eng' dir='ltr'><strong><em>sp.nov.</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 1186 286 1374 312">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 1186 286 1374 312">
+     <span class='ocr_line' id='line_1_5' title="bbox 1186 286 1374 312; baseline 0 -5"><span class='ocrx_word' id='word_1_12' title='bbox 1186 286 1316 307; x_wconf 87' lang='eng' dir='ltr'><strong><em>Wallaceina</em></strong></span> <span class='ocrx_word' id='word_1_13' title='bbox 1325 291 1374 312; x_wconf 87' lang='eng' dir='ltr'><strong><em>spp.</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 1053 371 1518 397">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 1053 371 1518 397">
+     <span class='ocr_line' id='line_1_6' title="bbox 1053 371 1518 397; baseline 0 -5"><span class='ocrx_word' id='word_1_14' title='bbox 1053 372 1431 397; x_wconf 79' lang='eng' dir='ltr'><strong><em>...................Leptomonas</em></strong></span> <span class='ocrx_word' id='word_1_15' title='bbox 1441 376 1474 397; x_wconf 85' lang='eng' dir='ltr'><strong><em>Sp.</em></strong></span> <span class='ocrx_word' id='word_1_16' title='bbox 1485 371 1518 392; x_wconf 95' lang='eng' dir='ltr'><strong><em>C4</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 1321 460 1524 529">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 1321 460 1524 529">
+     <span class='ocr_line' id='line_1_7' title="bbox 1325 460 1454 495; baseline 0 0"><span class='ocrx_word' id='word_1_17' title='bbox 1325 460 1454 495; x_wconf 95' lang='eng' dir='ltr'><strong><em>      </em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 1321 495 1524 529; baseline 0 0"><span class='ocrx_word' id='word_1_18' title='bbox 1321 495 1350 529; x_wconf 95' lang='eng' dir='ltr'><strong><em>  </em></strong></span> <span class='ocrx_word' id='word_1_19' title='bbox 1448 495 1454 496; x_wconf 95' lang='eng' dir='ltr'><strong><em> </em></strong></span> <span class='ocrx_word' id='word_1_20' title='bbox 1469 496 1524 529; x_wconf 95' lang='eng' dir='ltr'><strong><em> </em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 1036 427 1763 492">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 1371 427 1763 460">
+     <span class='ocr_line' id='line_1_9' title="bbox 1371 427 1763 460; baseline -0.003 -6"><span class='ocrx_word' id='word_1_21' title='bbox 1371 427 1419 460; x_wconf 62' lang='eng' dir='ltr'><strong>m</strong></span> <span class='ocrx_word' id='word_1_22' title='bbox 1429 439 1443 448; x_wconf 98' lang='eng'>=</span> <span class='ocrx_word' id='word_1_23' title='bbox 1452 433 1474 453; x_wconf 97' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_24' title='bbox 1485 438 1645 459; x_wconf 87' lang='eng' dir='ltr'><strong><em>neopamerae</em></strong></span> <span class='ocrx_word' id='word_1_25' title='bbox 1662 439 1699 459; x_wconf 89' lang='eng' dir='ltr'><strong><em>sp.</em></strong></span> <span class='ocrx_word' id='word_1_26' title='bbox 1710 438 1763 454; x_wconf 91' lang='eng' dir='ltr'><strong><em>nov.</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 1176 465 1946 559">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 1176 465 1946 559">
+     <span class='ocr_line' id='line_1_10' title="bbox 1454 465 1747 486; baseline 0.02 -5"><span class='ocrx_word' id='word_1_27' title='bbox 1454 475 1573 481; x_wconf 0' lang='eng'><strong><em></em></strong></span> <span class='ocrx_word' id='word_1_28' title='bbox 1582 465 1607 485; x_wconf 75' lang='eng' dir='ltr'><strong><em>‘B.</em></strong></span> <span class='ocrx_word' id='word_1_29' title='bbox 1619 465 1747 486; x_wconf 89' lang='eng' dir='ltr'><em>miridarum’</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 1176 499 1908 534; baseline 0.007 -5"><span class='ocrx_word' id='word_1_30' title='bbox 1176 510 1194 530; x_wconf 94' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_31' title='bbox 1206 509 1310 530; x_wconf 85' lang='eng' dir='ltr'><em>bifurcata</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1746 531 1749 534; x_wconf 73' lang='eng'><strong><em>.</em></strong></span> <span class='ocrx_word' id='word_1_33' title='bbox 1906 531 1908 534; x_wconf 92' lang='eng'><strong><em>.</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 1257 531 1946 559; baseline 0.007 -12"><span class='ocrx_word' id='word_1_34' title='bbox 1257 533 1273 559; x_wconf 70' lang='eng' dir='ltr'><strong>j</strong></span> <span class='ocrx_word' id='word_1_35' title='bbox 1298 539 1549 545; x_wconf 0' lang='eng'><strong></strong></span> <span class='ocrx_word' id='word_1_36' title='bbox 1571 531 1593 552; x_wconf 71' lang='eng' dir='ltr'><strong><em>C.</em></strong></span> <span class='ocrx_word' id='word_1_37' title='bbox 1604 531 1615 551; x_wconf 85' lang='eng' dir='ltr'><strong><em>l.</em></strong></span> <span class='ocrx_word' id='word_1_38' title='bbox 1627 531 1774 557; x_wconf 78' lang='eng' dir='ltr'><strong><em>thermophI/a,</em></strong></span> <span class='ocrx_word' id='word_1_39' title='bbox 1786 531 1815 552; x_wconf 70' lang='eng' dir='ltr'><strong><em>‘C,</em></strong></span> <span class='ocrx_word' id='word_1_40' title='bbox 1827 531 1946 557; x_wconf 68' lang='eng' dir='ltr'><strong><em>deaneI’U)</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 1283 562 1361 606">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 1283 562 1361 606">
+     <span class='ocr_line' id='line_1_13' title="bbox 1283 562 1361 606; baseline 0 -6"><span class='ocrx_word' id='word_1_41' title='bbox 1283 562 1361 606; x_wconf 66' lang='eng' dir='ltr'>Jill</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 1278 604 1834 975">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 1278 604 1834 975">
+     <span class='ocr_line' id='line_1_14' title="bbox 1395 604 1621 679; baseline 0 -34"><span class='ocrx_word' id='word_1_42' title='bbox 1395 604 1411 679; x_wconf 69' lang='eng'>]</span> <span class='ocrx_word' id='word_1_43' title='bbox 1436 625 1621 645; x_wconf 84' lang='eng' dir='ltr'><strong><em>Paraleishmania</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 1658 661 1834 737; baseline 0 -28"><span class='ocrx_word' id='word_1_44' title='bbox 1658 661 1675 737; x_wconf 70' lang='eng'>]</span> <span class='ocrx_word' id='word_1_45' title='bbox 1696 689 1715 709; x_wconf 90' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_46' title='bbox 1727 689 1834 715; x_wconf 85' lang='eng' dir='ltr'><em>(Viannia)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 1394 765 1582 791; baseline 0.005 -6"><span class='ocrx_word' id='word_1_47' title='bbox 1394 765 1413 785; x_wconf 94' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_48' title='bbox 1426 765 1582 791; x_wconf 84' lang='eng' dir='ltr'><strong><em>(Leishmania)</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 1278 827 1513 885; baseline 0 -20"><span class='ocrx_word' id='word_1_49' title='bbox 1278 827 1294 885; x_wconf 64' lang='eng' dir='ltr'>J</span> <span class='ocrx_word' id='word_1_50' title='bbox 1311 845 1330 865; x_wconf 93' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_51' title='bbox 1342 845 1437 865; x_wconf 74' lang='eng' dir='ltr'><strong><em>farce/es</em></strong></span> <span class='ocrx_word' id='word_1_52' title='bbox 1447 851 1460 859; x_wconf 96' lang='eng'><em>=</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1480 838 1513 871; x_wconf 73' lang='eng' dir='ltr'><strong>n</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 1405 880 1474 975; baseline 0 -30"><span class='ocrx_word' id='word_1_54' title='bbox 1405 880 1474 975; x_wconf 68' lang='eng' dir='ltr'><strong><em>]m</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 1158 970 2009 1065">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 1158 970 2009 1065">
+     <span class='ocr_line' id='line_1_19' title="bbox 1233 978 1344 998; baseline 0 0"><span class='ocrx_word' id='word_1_55' title='bbox 1233 978 1251 998; x_wconf 72' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_56' title='bbox 1264 983 1320 998; x_wconf 86' lang='eng' dir='ltr'><strong><em>acus</em></strong></span> <span class='ocrx_word' id='word_1_57' title='bbox 1331 984 1344 992; x_wconf 96' lang='eng'><em>=</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 1202 970 2009 1032; baseline 0 -13"><span class='ocrx_word' id='word_1_58' title='bbox 1202 970 1218 1008; x_wconf 73' lang='eng' dir='ltr'>:l</span> <span class='ocrx_word' id='word_1_59' title='bbox 1335 1024 1344 1032; x_wconf 60' lang='eng'><em>.</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 1352 971 1399 1032; x_wconf 53' lang='eng' dir='ltr'><strong><em>Eu.</em></strong></span> <span class='ocrx_word' id='word_1_61' title='bbox 1493 980 1596 1032; x_wconf 37' lang='eng' dir='ltr'><strong><em>Iggy.</em></strong></span> <span class='ocrx_word' id='word_1_62' title='bbox 1608 999 1687 1019; x_wconf 91' lang='eng' dir='ltr'><strong>127AL</strong></span> <span class='ocrx_word' id='word_1_63' title='bbox 1696 1004 1710 1014; x_wconf 99' lang='eng'><strong>=</strong></span> <span class='ocrx_word' id='word_1_64' title='bbox 1722 999 1745 1019; x_wconf 91' lang='eng' dir='ltr'><strong><em>C.</em></strong></span> <span class='ocrx_word' id='word_1_65' title='bbox 1756 999 1899 1019; x_wconf 86' lang='eng' dir='ltr'><strong><em>abscondita</em></strong></span> <span class='ocrx_word' id='word_1_66' title='bbox 1908 1004 1946 1024; x_wconf 92' lang='eng' dir='ltr'><strong><em>sp.</em></strong></span> <span class='ocrx_word' id='word_1_67' title='bbox 1957 1004 2009 1019; x_wconf 92' lang='eng' dir='ltr'><strong><em>nov.</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 1158 1029 1988 1065; baseline 0.001 -16"><span class='ocrx_word' id='word_1_68' title='bbox 1158 1056 1167 1065; x_wconf 58' lang='eng'><em>.</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1176 1056 1185 1065; x_wconf 54' lang='eng'>.</span> <span class='ocrx_word' id='word_1_70' title='bbox 1193 1056 1202 1065; x_wconf 58' lang='eng'>.</span> <span class='ocrx_word' id='word_1_71' title='bbox 1211 1056 1220 1065; x_wconf 59' lang='eng'><em>.</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1227 1033 1326 1065; x_wconf 52' lang='eng'><strong><em>331::</em></strong></span> <span class='ocrx_word' id='word_1_73' title='bbox 1547 1034 1598 1050; x_wconf 76' lang='eng' dir='ltr'><strong><em>.ax.</em></strong></span> <span class='ocrx_word' id='word_1_74' title='bbox 1610 1029 1688 1050; x_wconf 86' lang='eng' dir='ltr'>119YS</span> <span class='ocrx_word' id='word_1_75' title='bbox 1698 1035 1712 1044; x_wconf 99' lang='eng'>=</span> <span class='ocrx_word' id='word_1_76' title='bbox 1724 1029 1747 1050; x_wconf 89' lang='eng' dir='ltr'><strong><em>C.</em></strong></span> <span class='ocrx_word' id='word_1_77' title='bbox 1757 1029 1879 1055; x_wconf 86' lang='eng' dir='ltr'><strong><em>insperata</em></strong></span> <span class='ocrx_word' id='word_1_78' title='bbox 1887 1034 1925 1055; x_wconf 88' lang='eng' dir='ltr'><strong><em>sp.</em></strong></span> <span class='ocrx_word' id='word_1_79' title='bbox 1936 1034 1988 1050; x_wconf 90' lang='eng' dir='ltr'><strong><em>nov.</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 1335 1051 1547 1065">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 1335 1051 1547 1065">
+     <span class='ocr_line' id='line_1_22' title="bbox 1335 1051 1547 1065; baseline 0 1545"><span class='ocrx_word' id='word_1_80' title='bbox 1335 1051 1547 1065; x_wconf 95' lang='eng' dir='ltr'><strong><em> </em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 1356 1056 1972 1220">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 1356 1056 1972 1220">
+     <span class='ocr_line' id='line_1_23' title="bbox 1529 1056 1972 1086; baseline -0.002 -5"><span class='ocrx_word' id='word_1_81' title='bbox 1529 1056 1538 1065; x_wconf 67' lang='eng'><strong>&#39;</strong></span> <span class='ocrx_word' id='word_1_82' title='bbox 1547 1056 1557 1065; x_wconf 66' lang='eng'><strong><em>&#39;</em></strong></span> <span class='ocrx_word' id='word_1_83' title='bbox 1564 1066 1599 1081; x_wconf 87' lang='eng' dir='ltr'><strong><em>ax.</em></strong></span> <span class='ocrx_word' id='word_1_84' title='bbox 1611 1060 1679 1081; x_wconf 86' lang='eng'><strong>128$|</strong></span> <span class='ocrx_word' id='word_1_85' title='bbox 1689 1066 1703 1075; x_wconf 99' lang='eng'><strong>=</strong></span> <span class='ocrx_word' id='word_1_86' title='bbox 1715 1060 1738 1081; x_wconf 91' lang='eng' dir='ltr'><strong><em>C.</em></strong></span> <span class='ocrx_word' id='word_1_87' title='bbox 1748 1061 1862 1086; x_wconf 84' lang='eng' dir='ltr'><strong><em>permixta</em></strong></span> <span class='ocrx_word' id='word_1_88' title='bbox 1871 1066 1908 1086; x_wconf 84' lang='eng' dir='ltr'><strong><em>sp.</em></strong></span> <span class='ocrx_word' id='word_1_89' title='bbox 1920 1066 1972 1081; x_wconf 89' lang='eng' dir='ltr'><strong><em>nov.</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 1356 1069 1485 1138; baseline 0 -23"><span class='ocrx_word' id='word_1_90' title='bbox 1356 1069 1372 1138; x_wconf 76' lang='eng'>]</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 1437 1129 1655 1155; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 1437 1129 1459 1149; x_wconf 93' lang='eng' dir='ltr'><strong><em>C.</em></strong></span> <span class='ocrx_word' id='word_1_92' title='bbox 1470 1129 1655 1155; x_wconf 80' lang='eng' dir='ltr'><strong><em>acanthocepha/i</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 1438 1165 1669 1190; baseline 0 -5"><span class='ocrx_word' id='word_1_93' title='bbox 1438 1165 1641 1190; x_wconf 78' lang='eng' dir='ltr'><strong><em>‘Leptomonas’sp.</em></strong></span> <span class='ocrx_word' id='word_1_94' title='bbox 1654 1165 1669 1185; x_wconf 91' lang='eng' dir='ltr'>P</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 1440 1199 1602 1220; baseline 0 0"><span class='ocrx_word' id='word_1_95' title='bbox 1440 1199 1462 1220; x_wconf 91' lang='eng' dir='ltr'><strong><em>C.</em></strong></span> <span class='ocrx_word' id='word_1_96' title='bbox 1474 1199 1602 1220; x_wconf 83' lang='eng' dir='ltr'><strong><em>fascicu/ata</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 1443 1231 1492 1308">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 1444 1276 1492 1308">
+     <span class='ocr_line' id='line_1_28' title="bbox 1444 1276 1492 1308; baseline 0 0"><span class='ocrx_word' id='word_1_97' title='bbox 1444 1276 1492 1308; x_wconf 70' lang='eng' dir='ltr'><strong><em>E</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 1371 1458 1718 1517">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 1371 1458 1718 1517">
+     <span class='ocr_line' id='line_1_29' title="bbox 1371 1458 1718 1483; baseline 0 -5"><span class='ocrx_word' id='word_1_98' title='bbox 1371 1458 1392 1478; x_wconf 92' lang='eng' dir='ltr'><strong><em>B.</em></strong></span> <span class='ocrx_word' id='word_1_99' title='bbox 1405 1458 1519 1478; x_wconf 76' lang='eng' dir='ltr'><strong><em>triatomae</em></strong></span> <span class='ocrx_word' id='word_1_100' title='bbox 1530 1470 1538 1472; x_wconf 99' lang='eng'>-</span> <span class='ocrx_word' id='word_1_101' title='bbox 1547 1458 1568 1478; x_wconf 94' lang='eng' dir='ltr'><strong><em>B.</em></strong></span> <span class='ocrx_word' id='word_1_102' title='bbox 1580 1458 1718 1483; x_wconf 82' lang='eng' dir='ltr'><strong><em>leptocoridis</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 1371 1491 1696 1517; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 1371 1491 1434 1511; x_wconf 84' lang='eng' dir='ltr'><strong><em>clade</em></strong></span> <span class='ocrx_word' id='word_1_104' title='bbox 1444 1491 1549 1517; x_wconf 90' lang='eng' dir='ltr'><strong><em>including</em></strong></span> <span class='ocrx_word' id='word_1_105' title='bbox 1559 1491 1629 1517; x_wconf 79' lang='eng' dir='ltr'><strong><em>typing</em></strong></span> <span class='ocrx_word' id='word_1_106' title='bbox 1641 1491 1696 1511; x_wconf 80' lang='eng' dir='ltr'><strong><em>units</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 948 1533 1657 1563">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 948 1533 1657 1563">
+     <span class='ocr_line' id='line_1_31' title="bbox 948 1533 1657 1563; baseline 0.001 -1"><span class='ocrx_word' id='word_1_107' title='bbox 948 1556 1076 1562; x_wconf 0' lang='eng'><strong><em></em></strong></span> <span class='ocrx_word' id='word_1_108' title='bbox 1089 1543 1111 1563; x_wconf 82' lang='eng' dir='ltr'><strong><em>B.</em></strong></span> <span class='ocrx_word' id='word_1_109' title='bbox 1123 1543 1236 1563; x_wconf 74' lang='eng' dir='ltr'><strong><em>triatomae</em></strong></span> <span class='ocrx_word' id='word_1_110' title='bbox 1379 1533 1439 1557; x_wconf 63' lang='eng'><strong><em>9&#39;17&#39;</em></strong></span> <span class='ocrx_word' id='word_1_111' title='bbox 1451 1533 1526 1557; x_wconf 44' lang='eng'><strong>1943&#39;</strong></span> <span class='ocrx_word' id='word_1_112' title='bbox 1536 1533 1572 1557; x_wconf 60' lang='eng'><strong><em>25&#39;</em></strong></span> <span class='ocrx_word' id='word_1_113' title='bbox 1582 1533 1657 1557; x_wconf 57' lang='eng'><strong><em>28&#39;30’</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 1366 1522 1679 1596">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 1366 1522 1679 1596">
+     <span class='ocr_line' id='line_1_32' title="bbox 1366 1522 1679 1596; baseline 0 1014"><span class='ocrx_word' id='word_1_114' title='bbox 1366 1522 1679 1596; x_wconf 95' lang='eng' dir='ltr'><strong><em> </em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 1380 1566 1639 1590">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 1380 1566 1639 1590">
+     <span class='ocr_line' id='line_1_33' title="bbox 1380 1566 1639 1590; baseline -0.004 -4"><span class='ocrx_word' id='word_1_115' title='bbox 1380 1566 1415 1589; x_wconf 85' lang='eng'><strong><em>33,</em></strong></span> <span class='ocrx_word' id='word_1_116' title='bbox 1426 1566 1461 1589; x_wconf 86' lang='eng'><strong><em>34,</em></strong></span> <span class='ocrx_word' id='word_1_117' title='bbox 1472 1566 1507 1589; x_wconf 83' lang='eng'><strong><em>37,</em></strong></span> <span class='ocrx_word' id='word_1_118' title='bbox 1518 1566 1553 1590; x_wconf 83' lang='eng'><strong><em>39,</em></strong></span> <span class='ocrx_word' id='word_1_119' title='bbox 1564 1566 1600 1590; x_wconf 74' lang='eng'><strong>44,</strong></span> <span class='ocrx_word' id='word_1_120' title='bbox 1610 1566 1639 1586; x_wconf 93' lang='eng'><strong><em>45</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 937 1597 1277 1621">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 937 1597 1277 1621">
+     <span class='ocr_line' id='line_1_34' title="bbox 937 1597 1277 1621; baseline -0.009 -1"><span class='ocrx_word' id='word_1_121' title='bbox 937 1612 1087 1621; x_wconf 84' lang='eng'><strong><em>.........</em></strong></span> <span class='ocrx_word' id='word_1_122' title='bbox 1105 1597 1277 1618; x_wconf 84' lang='eng' dir='ltr'><strong><em>env.127AL-A</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 990 1635 1236 1655">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 990 1635 1236 1655">
+     <span class='ocr_line' id='line_1_35' title="bbox 990 1635 1236 1655; baseline 0 0"><span class='ocrx_word' id='word_1_123' title='bbox 990 1635 1236 1655; x_wconf 78' lang='eng' dir='ltr'><strong><em>-------env.59Ll</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 981 1759 1273 1827">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 981 1759 1273 1827">
+     <span class='ocr_line' id='line_1_36' title="bbox 981 1759 1199 1779; baseline 0 0"><span class='ocrx_word' id='word_1_124' title='bbox 981 1767 990 1776; x_wconf 78' lang='eng'><strong>-</strong></span> <span class='ocrx_word' id='word_1_125' title='bbox 999 1767 1008 1776; x_wconf 71' lang='eng' dir='ltr'><strong>o</strong></span> <span class='ocrx_word' id='word_1_126' title='bbox 1017 1767 1026 1776; x_wconf 68' lang='eng' dir='ltr'><strong><em>o</em></strong></span> <span class='ocrx_word' id='word_1_127' title='bbox 1035 1767 1044 1776; x_wconf 74' lang='eng'><strong>-</strong></span> <span class='ocrx_word' id='word_1_128' title='bbox 1052 1759 1199 1779; x_wconf 70' lang='eng' dir='ltr'><strong><em>aenv.1288l</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 1101 1806 1273 1827; baseline 0 -1"><span class='ocrx_word' id='word_1_129' title='bbox 1101 1812 1153 1827; x_wconf 85' lang='eng' dir='ltr'><strong><em>env.</em></strong></span> <span class='ocrx_word' id='word_1_130' title='bbox 1165 1806 1273 1826; x_wconf 91' lang='eng' dir='ltr'><strong><em>127AL-B</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 1008 1824 1590 1897">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 1121 1846 1590 1897">
+     <span class='ocr_line' id='line_1_38' title="bbox 1126 1846 1515 1877; baseline 0 -11"><span class='ocrx_word' id='word_1_131' title='bbox 1126 1846 1155 1866; x_wconf 89' lang='eng' dir='ltr'><strong><em>.B.</em></strong></span> <span class='ocrx_word' id='word_1_132' title='bbox 1166 1846 1304 1872; x_wconf 80' lang='eng' dir='ltr'><strong><em>Ieptocoridis</em></strong></span> <span class='ocrx_word' id='word_1_133' title='bbox 1364 1861 1418 1877; x_wconf 49' lang='eng' dir='ltr'><strong><em>em,</em></strong></span> <span class='ocrx_word' id='word_1_134' title='bbox 1436 1855 1515 1876; x_wconf 78' lang='eng' dir='ltr'><strong><em>119YS</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 1121 1864 1590 1897; baseline 0 -20"><span class='ocrx_word' id='word_1_135' title='bbox 1121 1868 1325 1877; x_wconf 63' lang='eng'><strong>00-00-000...</strong></span> <span class='ocrx_word' id='word_1_136' title='bbox 1351 1868 1360 1877; x_wconf 66' lang='eng'><strong><em>0</em></strong></span> <span class='ocrx_word' id='word_1_137' title='bbox 1420 1872 1424 1876; x_wconf 88' lang='eng'><strong><em>.</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 1033 1860 1123 1877">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 1033 1860 1123 1877">
+     <span class='ocr_line' id='line_1_40' title="bbox 1033 1860 1123 1877; baseline 0 733"><span class='ocrx_word' id='word_1_138' title='bbox 1033 1860 1123 1877; x_wconf 95' lang='eng' dir='ltr'><strong><em> </em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 1057 1903 1457 1910">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 1057 1903 1457 1910">
+     <span class='ocr_line' id='line_1_41' title="bbox 1057 1903 1457 1910; baseline 0 0"><span class='ocrx_word' id='word_1_139' title='bbox 1057 1903 1080 1910; x_wconf 95' lang='eng' dir='ltr'><strong><em> </em></strong></span> <span class='ocrx_word' id='word_1_140' title='bbox 1433 1903 1457 1910; x_wconf 95' lang='eng' dir='ltr'><strong><em> </em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 962 1886 1891 1912">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 962 1886 1891 1912">
+     <span class='ocr_line' id='line_1_42' title="bbox 962 1886 1891 1912; baseline -0.001 -2"><span class='ocrx_word' id='word_1_141' title='bbox 962 1903 1051 1910; x_wconf 0' lang='eng'><strong><em></em></strong></span> <span class='ocrx_word' id='word_1_142' title='bbox 1080 1891 1428 1910; x_wconf 87' lang='eng'><strong><em>................:::::.::::::::</em></strong></span> <span class='ocrx_word' id='word_1_143' title='bbox 1457 1891 1597 1910; x_wconf 85' lang='eng'><strong><em>:::::::&#39;.....</em></strong></span> <span class='ocrx_word' id='word_1_144' title='bbox 1606 1886 1785 1912; x_wconf 78' lang='eng' dir='ltr'><strong><em>Herpetomonas</em></strong></span> <span class='ocrx_word' id='word_1_145' title='bbox 1794 1891 1827 1912; x_wconf 88' lang='eng' dir='ltr'><strong><em>sp.</em></strong></span> <span class='ocrx_word' id='word_1_146' title='bbox 1838 1886 1891 1906; x_wconf 93' lang='eng' dir='ltr'><strong><em>Tom</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 1160 1924 1897 2008">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 1262 1924 1897 2008">
+     <span class='ocr_line' id='line_1_43' title="bbox 1262 1924 1897 2008; baseline 0 -46"><span class='ocrx_word' id='word_1_147' title='bbox 1262 1935 1280 2008; x_wconf 59' lang='eng'>1</span> <span class='ocrx_word' id='word_1_148' title='bbox 1754 1942 1773 1962; x_wconf 97' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_149' title='bbox 1785 1942 1897 1967; x_wconf 83' lang='eng' dir='ltr'><strong><em>seymouri</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 1278 1963 1640 2020">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 1278 1963 1640 2020">
+     <span class='ocr_line' id='line_1_44' title="bbox 1287 1963 1640 1989; baseline 0 -6"><span class='ocrx_word' id='word_1_150' title='bbox 1287 1963 1310 1983; x_wconf 96' lang='eng' dir='ltr'><strong><em>H.</em></strong></span> <span class='ocrx_word' id='word_1_151' title='bbox 1322 1968 1455 1987; x_wconf 78' lang='eng' dir='ltr'><strong><em>muscarum,</em></strong></span> <span class='ocrx_word' id='word_1_152' title='bbox 1466 1963 1490 1983; x_wconf 97' lang='eng' dir='ltr'><strong><em>H.</em></strong></span> <span class='ocrx_word' id='word_1_153' title='bbox 1502 1963 1640 1989; x_wconf 83' lang='eng' dir='ltr'><strong><em>megaseliae</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 1278 1995 1462 2020; baseline 0 -5"><span class='ocrx_word' id='word_1_154' title='bbox 1278 2002 1319 2008; x_wconf 0' lang='eng'><strong><em></em></strong></span> <span class='ocrx_word' id='word_1_155' title='bbox 1333 1995 1356 2015; x_wconf 95' lang='eng' dir='ltr'><strong><em>H.</em></strong></span> <span class='ocrx_word' id='word_1_156' title='bbox 1367 1995 1462 2020; x_wconf 88' lang='eng' dir='ltr'><em>pessoai</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 1117 2013 1134 2039">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 1117 2013 1134 2039">
+     <span class='ocr_line' id='line_1_46' title="bbox 1117 2013 1134 2039; baseline 0 0"><span class='ocrx_word' id='word_1_157' title='bbox 1117 2013 1134 2039; x_wconf 76' lang='eng'>3</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 1091 2039 1658 2118">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 1091 2039 1658 2118">
+     <span class='ocr_line' id='line_1_47' title="bbox 1091 2039 1658 2085; baseline 0 -6"><span class='ocrx_word' id='word_1_158' title='bbox 1091 2039 1135 2072; x_wconf 57' lang='eng' dir='ltr'><strong><em>P—</em></strong></span> <span class='ocrx_word' id='word_1_159' title='bbox 1172 2059 1195 2079; x_wconf 71' lang='eng' dir='ltr'><strong><em>H.</em></strong></span> <span class='ocrx_word' id='word_1_160' title='bbox 1207 2059 1309 2083; x_wconf 79' lang='eng' dir='ltr'><em>roitmani,</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 1320 2059 1499 2085; x_wconf 82' lang='eng' dir='ltr'><strong><em>Herpetomonas</em></strong></span> <span class='ocrx_word' id='word_1_162' title='bbox 1508 2064 1541 2085; x_wconf 87' lang='eng' dir='ltr'><strong><em>sp.</em></strong></span> <span class='ocrx_word' id='word_1_163' title='bbox 1552 2059 1658 2083; x_wconf 76' lang='eng' dir='ltr'><strong><em>TCCZ63,</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 1172 2091 1543 2118; baseline 0 -6"><span class='ocrx_word' id='word_1_164' title='bbox 1172 2091 1201 2113; x_wconf 88' lang='eng' dir='ltr'><strong><em>‘C.</em></strong></span> <span class='ocrx_word' id='word_1_165' title='bbox 1213 2092 1374 2118; x_wconf 71' lang='eng' dir='ltr'><strong><em>oncopelti’al),</em></strong></span> <span class='ocrx_word' id='word_1_166' title='bbox 1387 2091 1409 2113; x_wconf 92' lang='eng' dir='ltr'><strong><em>C.</em></strong></span> <span class='ocrx_word' id='word_1_167' title='bbox 1421 2092 1503 2112; x_wconf 85' lang='eng' dir='ltr'><strong><em>deanei</em></strong></span> <span class='ocrx_word' id='word_1_168' title='bbox 1512 2092 1543 2118; x_wconf 90' lang='eng' dir='ltr'><strong><em>(II)</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 1097 2135 1450 2213">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 1345 2135 1423 2169">
+     <span class='ocr_line' id='line_1_49' title="bbox 1345 2135 1423 2169; baseline 0.026 -2"><span class='ocrx_word' id='word_1_169' title='bbox 1345 2135 1423 2169; x_wconf 76' lang='eng' dir='ltr'>J</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 1137 2208 1749 2254">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 1137 2208 1749 2254">
+     <span class='ocr_line' id='line_1_50' title="bbox 1242 2208 1749 2228; baseline 0 -6"><span class='ocrx_word' id='word_1_170' title='bbox 1242 2208 1580 2228; x_wconf 0' lang='eng'></span> <span class='ocrx_word' id='word_1_171' title='bbox 1592 2208 1749 2228; x_wconf 63' lang='eng' dir='ltr'><strong><em>costaricensis</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 1137 2234 1290 2254; baseline 0 0"><span class='ocrx_word' id='word_1_172' title='bbox 1137 2234 1156 2254; x_wconf 97' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_173' title='bbox 1168 2234 1290 2254; x_wconf 87' lang='eng' dir='ltr'><em>col/osoma</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 1010 2279 1218 2304">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 1010 2279 1218 2304">
+     <span class='ocr_line' id='line_1_52' title="bbox 1010 2279 1218 2304; baseline 0 -5"><span class='ocrx_word' id='word_1_174' title='bbox 1010 2279 1161 2304; x_wconf 82' lang='eng' dir='ltr'><strong><em>Phytomonas</em></strong></span> <span class='ocrx_word' id='word_1_175' title='bbox 1170 2284 1218 2304; x_wconf 90' lang='eng' dir='ltr'>spp.</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 1067 2341 1520 2381">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 1067 2341 1520 2381">
+     <span class='ocr_line' id='line_1_53' title="bbox 1067 2341 1520 2381; baseline 0 -20"><span class='ocrx_word' id='word_1_176' title='bbox 1067 2341 1088 2361; x_wconf 94' lang='eng' dir='ltr'><strong><em>B.</em></strong></span> <span class='ocrx_word' id='word_1_177' title='bbox 1101 2341 1173 2361; x_wconf 84' lang='eng' dir='ltr'><strong><em>culicis</em></strong></span> <span class='ocrx_word' id='word_1_178' title='bbox 1473 2348 1520 2381; x_wconf 67' lang='eng' dir='ltr'><em>m</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 898 2387 1543 2417">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 898 2387 1543 2417">
+     <span class='ocr_line' id='line_1_54' title="bbox 898 2387 1543 2417; baseline -0.005 -4"><span class='ocrx_word' id='word_1_179' title='bbox 898 2387 1442 2417; x_wconf 66' lang='eng' dir='ltr'><strong><em>.........Q.¢n.qopelti.(|)........-Leptomonas</em></strong></span> <span class='ocrx_word' id='word_1_180' title='bbox 1451 2396 1484 2417; x_wconf 84' lang='eng' dir='ltr'><strong><em>sp.</em></strong></span> <span class='ocrx_word' id='word_1_181' title='bbox 1496 2391 1543 2411; x_wconf 77' lang='eng' dir='ltr'>me</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 1274 2464 1629 2517">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 1274 2464 1629 2517">
+     <span class='ocr_line' id='line_1_55' title="bbox 1274 2464 1362 2484; baseline 0 0"><span class='ocrx_word' id='word_1_182' title='bbox 1274 2464 1292 2484; x_wconf 92' lang='eng' dir='ltr'><strong><em>T.</em></strong></span> <span class='ocrx_word' id='word_1_183' title='bbox 1305 2464 1362 2484; x_wconf 87' lang='eng' dir='ltr'><em>cruzi</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 1408 2491 1629 2517; baseline 0 -6"><span class='ocrx_word' id='word_1_184' title='bbox 1408 2491 1571 2517; x_wconf 88' lang='eng' dir='ltr'><strong><em>Trypanosoma</em></strong></span> <span class='ocrx_word' id='word_1_185' title='bbox 1581 2496 1629 2517; x_wconf 87' lang='eng' dir='ltr'><strong><em>spp.</em></strong></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-004.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-004.pbm.png
new file mode 100644
index 00000000..e5d3ee4a
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-004.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-004.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-004.pbm.png.hocr
new file mode 100644
index 00000000..8f92c34e
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-004.pbm.png.hocr
@@ -0,0 +1,172 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001149-0-004.pbm.png"; bbox 0 0 1302 1528; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 248 0 1302 12">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 248 0 1302 12">
+     <span class='ocr_line' id='line_1_1' title="bbox 248 0 1302 12; baseline 0 1516"><span class='ocrx_word' id='word_1_1' title='bbox 248 0 1302 12; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 671 21 944 83">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 671 21 944 83">
+     <span class='ocr_line' id='line_1_2' title="bbox 682 21 944 45; baseline 0 -5"><span class='ocrx_word' id='word_1_2' title='bbox 682 21 820 45; x_wconf 82' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 827 21 944 45; x_wconf 84' lang='eng' dir='ltr'><em>pod/ipaevi</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 671 59 940 83; baseline 0 -5"><span class='ocrx_word' id='word_1_4' title='bbox 671 59 719 78; x_wconf 85' lang='eng' dir='ltr'><em>59L|</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 728 64 741 73; x_wconf 99' lang='eng'><strong><em>=</em></strong></span> <span class='ocrx_word' id='word_1_6' title='bbox 750 59 769 78; x_wconf 95' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 779 59 806 78; x_wconf 92' lang='eng' dir='ltr'><em>cf.</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 814 59 940 83; x_wconf 86' lang='eng' dir='ltr'><em>podlipaevi</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 401 75 1181 226">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 401 75 1181 226">
+     <span class='ocr_line' id='line_1_4' title="bbox 502 75 1181 132; baseline 0 -16"><span class='ocrx_word' id='word_1_9' title='bbox 502 75 615 97; x_wconf 70' lang='eng'><em>95/80/87</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 696 97 757 116; x_wconf 87' lang='eng' dir='ltr'><em>34EC</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 767 102 779 111; x_wconf 99' lang='eng'>=</span> <span class='ocrx_word' id='word_1_12' title='bbox 788 97 808 116; x_wconf 95' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 813 97 905 121; x_wconf 88' lang='eng' dir='ltr'><em>jaderae</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 913 102 947 121; x_wconf 88' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 958 102 1006 116; x_wconf 88' lang='eng' dir='ltr'><em>nov.</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 1140 101 1181 132; x_wconf 0' lang='eng'><em></em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 452 133 1117 185; baseline 0 0"><span class='ocrx_word' id='word_1_17' title='bbox 452 147 564 169; x_wconf 74' lang='eng'><em>96/98/98</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 653 167 680 185; x_wconf 86' lang='eng' dir='ltr'><em>Le</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 696 133 829 185; x_wconf 59' lang='eng' dir='ltr'><em>tomo7nsaZRs:</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 839 133 1016 185; x_wconf 50' lang='eng' dir='ltr'><em>:Lerfpame’ae</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1024 138 1058 156; x_wconf 47' lang='eng' dir='ltr'><em>sp-</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 1068 138 1117 151; x_wconf 39' lang='eng' dir='ltr'><em>nov.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 401 171 908 205; baseline 0.004 -2"><span class='ocrx_word' id='word_1_23' title='bbox 401 181 514 203; x_wconf 84' lang='eng'><em>66/56/62</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 680 171 694 190; x_wconf 73' lang='eng' dir='ltr'><em>p</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 826 172 840 190; x_wconf 67' lang='eng' dir='ltr'><em>y</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 906 202 908 205; x_wconf 71' lang='eng'>,</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 648 202 920 226; baseline 0 -5"><span class='ocrx_word' id='word_1_27' title='bbox 648 202 787 226; x_wconf 78' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 794 202 920 226; x_wconf 84' lang='eng' dir='ltr'><em>pyrrhocor/s</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 586 234 1050 291">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 586 234 1050 291">
+     <span class='ocr_line' id='line_1_8' title="bbox 586 234 1032 257; baseline 0 -5"><span class='ocrx_word' id='word_1_29' title='bbox 586 234 660 252; x_wconf 88' lang='eng' dir='ltr'><em>127AL</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 669 239 682 248; x_wconf 99' lang='eng'><strong>=</strong></span> <span class='ocrx_word' id='word_1_31' title='bbox 692 234 792 252; x_wconf 79' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 800 234 932 252; x_wconf 82' lang='eng' dir='ltr'><em>abscondita</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 940 239 974 257; x_wconf 93' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 984 239 1032 252; x_wconf 89' lang='eng' dir='ltr'><em>nov.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 848 268 1050 291; baseline 0 -5"><span class='ocrx_word' id='word_1_35' title='bbox 848 268 977 286; x_wconf 81' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 986 268 1050 291; x_wconf 82' lang='eng' dir='ltr'><em>major</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 275 306 1187 599">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 275 306 1187 599">
+     <span class='ocr_line' id='line_1_10' title="bbox 579 306 1073 341; baseline 0.002 -18"><span class='ocrx_word' id='word_1_37' title='bbox 579 319 692 341; x_wconf 69' lang='eng'><em>92/66/88</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 840 306 968 325; x_wconf 81' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 977 306 1073 325; x_wconf 80' lang='eng' dir='ltr'><em>infantum</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 496 342 1131 376; baseline -0.002 -15"><span class='ocrx_word' id='word_1_40' title='bbox 496 354 656 376; x_wconf 72' lang='eng'><em>100/100/100</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 882 342 1010 360; x_wconf 86' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1020 342 1131 360; x_wconf 80' lang='eng' dir='ltr'><em>tarentolae</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 924 376 1187 395; baseline 0 -1"><span class='ocrx_word' id='word_1_43' title='bbox 924 376 1052 395; x_wconf 84' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1062 376 1187 395; x_wconf 85' lang='eng' dir='ltr'><em>braziliensis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 806 407 1099 430; baseline 0 -4"><span class='ocrx_word' id='word_1_45' title='bbox 806 407 945 430; x_wconf 77' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 953 407 1099 426; x_wconf 81' lang='eng' dir='ltr'><em>costaricensis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 359 441 981 466; baseline 0.002 -8"><span class='ocrx_word' id='word_1_47' title='bbox 359 444 447 466; x_wconf 55' lang='eng' dir='ltr'><em>Egg/V51</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 692 441 852 459; x_wconf 82' lang='eng' dir='ltr'><em>‘Blastocrithidia</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 861 441 981 459; x_wconf 84' lang='eng' dir='ltr'><em>miridarum’</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 568 472 782 496; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 568 472 717 496; x_wconf 76' lang='eng' dir='ltr'><em>‘Leptomonas’</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 726 477 757 496; x_wconf 81' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 768 472 782 491; x_wconf 92' lang='eng' dir='ltr'>P</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 567 510 743 529; baseline 0.006 -1"><span class='ocrx_word' id='word_1_53' title='bbox 567 510 657 529; x_wconf 85' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 666 510 743 529; x_wconf 84' lang='eng' dir='ltr'><em>luciliae</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 562 532 891 564; baseline 0 -4"><span class='ocrx_word' id='word_1_55' title='bbox 562 542 653 560; x_wconf 80' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 662 542 780 560; x_wconf 78' lang='eng' dir='ltr'><em>fasciculata</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 864 532 891 564; x_wconf 90' lang='eng' dir='ltr'><strong>C</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 275 569 773 599; baseline 0.01 -9"><span class='ocrx_word' id='word_1_58' title='bbox 275 569 387 591; x_wconf 85' lang='eng'><em>71/98/79</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 574 575 713 599; x_wconf 82' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 721 580 773 594; x_wconf 78' lang='eng' dir='ltr'><em>acus</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 233 594 925 700">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 233 603 925 694">
+     <span class='ocr_line' id='line_1_19' title="bbox 233 603 800 641; baseline -0.004 -10"><span class='ocrx_word' id='word_1_61' title='bbox 233 603 238 641; x_wconf 0' lang='eng'><em></em></span> <span class='ocrx_word' id='word_1_62' title='bbox 566 611 704 634; x_wconf 81' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 713 611 800 629; x_wconf 80' lang='eng' dir='ltr'><em>tarcoles</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 233 629 925 694; baseline -0.003 -26"><span class='ocrx_word' id='word_1_64' title='bbox 233 645 238 674; x_wconf 0' lang='eng'><em></em></span> <span class='ocrx_word' id='word_1_65' title='bbox 255 629 402 654; x_wconf 77' lang='eng' dir='ltr'><em>100l99/99</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 485 631 505 694; x_wconf 65' lang='eng'><strong>|</strong></span> <span class='ocrx_word' id='word_1_67' title='bbox 585 647 682 666; x_wconf 77' lang='eng' dir='ltr'><em>‘Crithidia</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 691 647 847 666; x_wconf 83' lang='eng' dir='ltr'><em>deanei’ATCC</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 857 648 925 666; x_wconf 84' lang='eng'><em>30255</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 283 681 1300 874">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 283 681 1300 874">
+     <span class='ocr_line' id='line_1_21' title="bbox 582 681 824 705; baseline 0 -5"><span class='ocrx_word' id='word_1_70' title='bbox 582 681 721 705; x_wconf 78' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 729 681 824 700; x_wconf 75' lang='eng' dir='ltr'><em>blfurcata</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 579 715 1004 738; baseline 0 -5"><span class='ocrx_word' id='word_1_72' title='bbox 579 715 652 733; x_wconf 83' lang='eng' dir='ltr'>119YS</span> <span class='ocrx_word' id='word_1_73' title='bbox 662 720 674 729; x_wconf 98' lang='eng'><strong>=</strong></span> <span class='ocrx_word' id='word_1_74' title='bbox 685 715 784 733; x_wconf 84' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 792 715 904 738; x_wconf 85' lang='eng' dir='ltr'><em>insperata</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 912 720 946 738; x_wconf 84' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 956 720 1004 733; x_wconf 88' lang='eng' dir='ltr'><em>nov.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 504 742 854 764; baseline 0 0"><span class='ocrx_word' id='word_1_78' title='bbox 504 742 549 764; x_wconf 91' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 624 745 745 764; x_wconf 83' lang='eng' dir='ltr'><em>Wallaceina</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 754 745 854 764; x_wconf 86' lang='eng' dir='ltr'><em>brevicu/a</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 588 779 839 798; baseline 0.004 -1"><span class='ocrx_word' id='word_1_81' title='bbox 588 779 709 798; x_wconf 85' lang='eng' dir='ltr'><em>Wallaceina</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 718 779 839 798; x_wconf 84' lang='eng' dir='ltr'><em>inconstans</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 512 813 753 836; baseline 0 -5"><span class='ocrx_word' id='word_1_83' title='bbox 512 813 662 836; x_wconf 79' lang='eng' dir='ltr'><em>‘Leptomonas’</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 668 817 699 836; x_wconf 84' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 709 813 753 831; x_wconf 90' lang='eng' dir='ltr'><em>Cfm</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 283 844 1300 874; baseline 0 0"><span class='ocrx_word' id='word_1_86' title='bbox 283 844 323 866; x_wconf 82' lang='eng'><em>64/</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 326 844 334 865; x_wconf 79' lang='eng'>1</span> <span class='ocrx_word' id='word_1_88' title='bbox 341 844 412 866; x_wconf 80' lang='eng'><em>00/90</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 487 846 550 865; x_wconf 75' lang='eng'><em>1285&#39;</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 560 851 573 860; x_wconf 95' lang='eng'><strong><em>=</em></strong></span> <span class='ocrx_word' id='word_1_91' title='bbox 583 846 899 874; x_wconf 51' lang='eng' dir='ltr'><em>Cairhiéieeemixtaﬁnzmax:</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 903 870 1287 874; x_wconf 91' lang='eng'><em>..............................................</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 1291 867 1300 874; x_wconf 95' lang='eng'><strong><em>..</em></strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 133 883 1063 1142">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 133 883 1063 1142">
+     <span class='ocr_line' id='line_1_27' title="bbox 525 883 890 907; baseline 0 -5"><span class='ocrx_word' id='word_1_94' title='bbox 525 883 621 902; x_wconf 75' lang='eng' dir='ltr'><em>‘Crithidia</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 631 883 736 907; x_wconf 80' lang='eng' dir='ltr'><em>oncope/ti’</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 745 883 812 902; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 822 883 890 902; x_wconf 83' lang='eng'><em>30264</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 432 918 833 945; baseline 0 -8"><span class='ocrx_word' id='word_1_98' title='bbox 432 923 477 945; x_wconf 81' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 526 919 692 942; x_wconf 76' lang='eng' dir='ltr'><em>Herpetomonas</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 700 923 731 942; x_wconf 87' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 740 918 833 937; x_wconf 88' lang='eng' dir='ltr'><em>TCC263</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 532 955 860 974; baseline 0 0"><span class='ocrx_word' id='word_1_102' title='bbox 532 955 622 974; x_wconf 86' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 631 955 708 974; x_wconf 80' lang='eng' dir='ltr'><em>deanel</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 714 955 782 974; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 791 955 860 974; x_wconf 78' lang='eng'><em>30969</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 133 986 788 1011; baseline -0.003 -3"><span class='ocrx_word' id='word_1_106' title='bbox 133 986 225 1008; x_wconf 80' lang='eng'><em>55/*/86</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 523 988 689 1011; x_wconf 81' lang='eng' dir='ltr'><em>Herpetomonas</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 697 988 788 1007; x_wconf 81' lang='eng' dir='ltr'><em>roitmani</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 654 1020 957 1043; baseline 0 -5"><span class='ocrx_word' id='word_1_109' title='bbox 654 1020 793 1043; x_wconf 82' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 801 1020 957 1038; x_wconf 82' lang='eng' dir='ltr'><em>Iactosovorans</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 289 1053 1063 1095; baseline 0 -23"><span class='ocrx_word' id='word_1_111' title='bbox 289 1068 416 1090; x_wconf 75' lang='eng'><em>100/88/98</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 641 1053 703 1072; x_wconf 85' lang='eng' dir='ltr'><em>37EC</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 712 1058 725 1067; x_wconf 99' lang='eng'>=</span> <span class='ocrx_word' id='word_1_114' title='bbox 734 1053 753 1072; x_wconf 97' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 763 1053 790 1072; x_wconf 86' lang='eng' dir='ltr'><em>cf.</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 799 1053 970 1090; x_wconf 40' lang='eng' dir='ltr'><em>Iactosovo&#39;rans</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1039 1065 1063 1095; x_wconf 89' lang='eng' dir='ltr'><strong>H</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 656 1087 917 1110; baseline 0 -5"><span class='ocrx_word' id='word_1_118' title='bbox 656 1087 822 1110; x_wconf 83' lang='eng' dir='ltr'><em>Herpetomonas</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 829 1092 917 1110; x_wconf 81' lang='eng' dir='ltr'><em>pessoal</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 555 1118 846 1142; baseline 0 -5"><span class='ocrx_word' id='word_1_120' title='bbox 555 1118 720 1142; x_wconf 85' lang='eng' dir='ltr'><em>Herpetomonas</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 729 1123 846 1137; x_wconf 78' lang='eng' dir='ltr'><em>muscarum</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 703 1152 938 1176">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 703 1152 938 1176">
+     <span class='ocr_line' id='line_1_35' title="bbox 703 1152 938 1176; baseline 0 -5"><span class='ocrx_word' id='word_1_122' title='bbox 703 1152 842 1176; x_wconf 75' lang='eng' dir='ltr'><em>Phytomonas</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 850 1157 881 1176; x_wconf 86' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 892 1152 938 1171; x_wconf 94' lang='eng' dir='ltr'><em>EM1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 374 362 444 384">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 374 362 444 384">
+     <span class='ocr_line' id='line_1_36' title="bbox 374 362 444 384; baseline 0 0"><span class='ocrx_word' id='word_1_125' title='bbox 374 362 444 384; x_wconf 81' lang='eng'><em>56/*/*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 1300 850 1302 863">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 1300 850 1302 863">
+     <span class='ocr_line' id='line_1_37' title="bbox 1300 850 1302 863; baseline 0 665"><span class='ocrx_word' id='word_1_126' title='bbox 1300 850 1302 863; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 573 870 583 874">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 573 870 583 874">
+     <span class='ocr_line' id='line_1_38' title="bbox 573 870 583 874; baseline 0 654"><span class='ocrx_word' id='word_1_127' title='bbox 573 870 583 874; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 319 1175 1110 1284">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 319 1175 1110 1284">
+     <span class='ocr_line' id='line_1_39' title="bbox 577 1175 1110 1214; baseline 0 -7"><span class='ocrx_word' id='word_1_128' title='bbox 577 1175 622 1197; x_wconf 75' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 747 1188 887 1212; x_wconf 73' lang='eng' dir='ltr'><em>Phytomonas</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 895 1193 926 1212; x_wconf 85' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 1087 1183 1110 1214; x_wconf 88' lang='eng' dir='ltr'>P</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 806 1222 1044 1246; baseline 0 -5"><span class='ocrx_word' id='word_1_132' title='bbox 806 1222 946 1246; x_wconf 77' lang='eng' dir='ltr'><em>Phytomonas</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 954 1227 1044 1246; x_wconf 77' lang='eng' dir='ltr'><em>serpens</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 319 1246 812 1284; baseline -0.002 -5"><span class='ocrx_word' id='word_1_134' title='bbox 319 1246 349 1268; x_wconf 79' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 459 1260 549 1279; x_wconf 83' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 559 1260 661 1284; x_wconf 85' lang='eng' dir='ltr'><em>oncopelti</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 667 1260 734 1279; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 745 1260 812 1279; x_wconf 86' lang='eng'><em>12982</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 359 1292 1072 1484">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 359 1292 1072 1484">
+     <span class='ocr_line' id='line_1_42' title="bbox 530 1292 763 1310; baseline 0 0"><span class='ocrx_word' id='word_1_139' title='bbox 530 1292 686 1310; x_wconf 83' lang='eng' dir='ltr'><em>Blastocrimidia</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 696 1292 763 1310; x_wconf 85' lang='eng' dir='ltr'><em>culicis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 493 1325 753 1349; baseline 0 -5"><span class='ocrx_word' id='word_1_141' title='bbox 493 1325 631 1349; x_wconf 80' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 640 1325 753 1344; x_wconf 78' lang='eng' dir='ltr'><em>collosoma</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 536 1358 745 1381; baseline 0 -5"><span class='ocrx_word' id='word_1_143' title='bbox 536 1358 621 1381; x_wconf 81' lang='eng' dir='ltr'><em>Sergeia</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 629 1358 745 1381; x_wconf 83' lang='eng' dir='ltr'><em>pod/ipaevi</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 359 1385 1072 1417; baseline 0 -5"><span class='ocrx_word' id='word_1_145' title='bbox 359 1385 404 1407; x_wconf 77' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 843 1394 994 1417; x_wconf 84' lang='eng' dir='ltr'><em>Trypanosoma</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 1003 1394 1072 1412; x_wconf 84' lang='eng' dir='ltr'><em>brucei</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 690 1432 904 1455; baseline 0 -5"><span class='ocrx_word' id='word_1_148' title='bbox 690 1432 841 1455; x_wconf 83' lang='eng' dir='ltr'><em>Trypanosoma</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 850 1432 904 1450; x_wconf 88' lang='eng' dir='ltr'><em>cruzi</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 462 1465 608 1484; baseline 0 0"><span class='ocrx_word' id='word_1_150' title='bbox 462 1465 520 1484; x_wconf 85' lang='eng' dir='ltr'><em>Bodo</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 528 1465 608 1484; x_wconf 84' lang='eng' dir='ltr'><em>saltans</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 129 1506 176 1524">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 129 1506 176 1524">
+     <span class='ocr_line' id='line_1_48' title="bbox 129 1506 176 1524; baseline 0 0"><span class='ocrx_word' id='word_1_152' title='bbox 129 1506 176 1524; x_wconf 85' lang='eng'><em>0.05</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-005.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-005.pbm.png
new file mode 100644
index 00000000..08a738f8
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-005.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-005.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-005.pbm.png.hocr
new file mode 100644
index 00000000..910067c9
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001149-0-005.pbm.png.hocr
@@ -0,0 +1,300 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001149-0-005.pbm.png"; bbox 0 0 1243 1595; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 98 495 295 538">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 102 504 293 530">
+     <span class='ocr_line' id='line_1_1' title="bbox 102 504 293 530; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 102 504 181 530; x_wconf 91' lang='eng'><em>100/1</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 209 504 293 530; x_wconf 90' lang='eng'><em>0/100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 404 1 1007 14">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 404 1 1007 14">
+     <span class='ocr_line' id='line_1_2' title="bbox 404 1 1007 14; baseline 0 1581"><span class='ocrx_word' id='word_1_3' title='bbox 404 1 1007 14; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 462 29 758 86">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 462 29 758 86">
+     <span class='ocr_line' id='line_1_3' title="bbox 462 29 758 48; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 462 29 594 48; x_wconf 87' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 604 29 758 48; x_wconf 83' lang='eng' dir='ltr'><em>amazonensis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 462 61 671 86; baseline 0.005 -6"><span class='ocrx_word' id='word_1_6' title='bbox 462 61 594 81; x_wconf 85' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 604 61 671 86; x_wconf 84' lang='eng' dir='ltr'><em>major</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 283 30 504 683">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 301 30 504 587">
+     <span class='ocr_line' id='line_1_5' title="bbox 428 30 459 160; baseline 0 -103"><span class='ocrx_word' id='word_1_8' title='bbox 428 30 459 160; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 406 160 471 192; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 406 160 471 192; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 392 192 504 263; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 392 192 504 263; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 406 263 485 333; baseline 0 -13"><span class='ocrx_word' id='word_1_11' title='bbox 406 263 485 333; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 392 333 441 405; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 392 333 441 405; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 362 405 461 487; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 362 405 461 487; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 301 487 463 514; baseline 0 1081"><span class='ocrx_word' id='word_1_14' title='bbox 301 487 463 514; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 301 514 456 587; baseline 0 -28"><span class='ocrx_word' id='word_1_15' title='bbox 301 514 456 587; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 973 411 1004 539">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 973 411 1004 539">
+     <span class='ocr_line' id='line_1_13' title="bbox 973 411 1004 539; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 973 411 1004 539; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 204 57 1060 501">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 204 84 1060 498">
+     <span class='ocr_line' id='line_1_14' title="bbox 311 84 948 123; baseline 0 -12"><span class='ocrx_word' id='word_1_17' title='bbox 311 84 428 123; x_wconf 50' lang='eng'><em>68/82/52</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 466 92 599 111; x_wconf 87' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 608 92 741 116; x_wconf 85' lang='eng' dir='ltr'><em>guyanensis</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 900 91 948 122; x_wconf 0' lang='eng'><em></em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 387 127 723 146; baseline 0.003 -1"><span class='ocrx_word' id='word_1_21' title='bbox 387 127 392 140; x_wconf 65' lang='eng' dir='ltr'><strong><em>I</em></strong></span> <span class='ocrx_word' id='word_1_22' title='bbox 466 127 599 146; x_wconf 83' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 608 127 723 146; x_wconf 79' lang='eng' dir='ltr'><em>tarentolae</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 204 150 720 183; baseline 0 0"><span class='ocrx_word' id='word_1_24' title='bbox 204 150 321 173; x_wconf 71' lang='eng'><em>66/56/62</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 471 164 603 183; x_wconf 84' lang='eng' dir='ltr'><em>Leishmania</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 612 164 720 183; x_wconf 79' lang='eng' dir='ltr'><em>donovani</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 387 198 830 227; baseline -0.002 -9"><span class='ocrx_word' id='word_1_27' title='bbox 387 214 392 227; x_wconf 55' lang='eng'><strong><em>:</em></strong></span> <span class='ocrx_word' id='word_1_28' title='bbox 514 198 684 223; x_wconf 79' lang='eng' dir='ltr'><em>Endotrypanum</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 692 198 830 223; x_wconf 84' lang='eng' dir='ltr'><em>monterogeii</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 257 231 696 271; baseline 0 -12"><span class='ocrx_word' id='word_1_30' title='bbox 257 246 373 268; x_wconf 76' lang='eng'><em>85/61/79</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 387 231 392 271; x_wconf 0' lang='eng'><em></em></span> <span class='ocrx_word' id='word_1_32' title='bbox 490 240 633 264; x_wconf 83' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 642 244 696 259; x_wconf 85' lang='eng' dir='ltr'><em>acus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 387 272 732 297; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 387 275 392 297; x_wconf 71' lang='eng' dir='ltr'><strong>g</strong></span> <span class='ocrx_word' id='word_1_35' title='bbox 490 272 633 296; x_wconf 83' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 642 272 732 291; x_wconf 79' lang='eng' dir='ltr'><em>tarooles</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 283 302 690 341; baseline 0 -17"><span class='ocrx_word' id='word_1_37' title='bbox 283 316 298 338; x_wconf 81' lang='eng'><strong>5</strong></span> <span class='ocrx_word' id='word_1_38' title='bbox 299 316 314 338; x_wconf 82' lang='eng'>4</span> <span class='ocrx_word' id='word_1_39' title='bbox 316 316 336 338; x_wconf 61' lang='eng'><em>/*</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 337 316 378 338; x_wconf 63' lang='eng'><em>[58</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 387 302 392 341; x_wconf 0' lang='eng'><em></em></span> <span class='ocrx_word' id='word_1_42' title='bbox 465 305 558 324; x_wconf 79' lang='eng' dir='ltr'><em>Cr/thidia</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 568 305 690 324; x_wconf 82' lang='eng' dir='ltr'><em>fascicu/ata</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 387 342 711 367; baseline 0 -6"><span class='ocrx_word' id='word_1_44' title='bbox 387 345 392 367; x_wconf 69' lang='eng'><strong>3</strong></span> <span class='ocrx_word' id='word_1_45' title='bbox 453 342 577 361; x_wconf 81' lang='eng' dir='ltr'><em>Wallaceina</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 586 342 711 361; x_wconf 83' lang='eng' dir='ltr'><em>inconstans</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 248 371 693 402; baseline -0.002 -5"><span class='ocrx_word' id='word_1_47' title='bbox 248 374 289 397; x_wconf 84' lang='eng'><em>83/</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 293 375 301 397; x_wconf 86' lang='eng'>1</span> <span class='ocrx_word' id='word_1_49' title='bbox 308 371 392 402; x_wconf 52' lang='eng'><strong>00/893</strong></span> <span class='ocrx_word' id='word_1_50' title='bbox 455 377 580 396; x_wconf 75' lang='eng' dir='ltr'><em>Wallace/n3</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 589 377 693 396; x_wconf 83' lang='eng' dir='ltr'><em>brevicu/a</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 220 415 993 448; baseline -0.006 -7"><span class='ocrx_word' id='word_1_52' title='bbox 220 418 370 441; x_wconf 85' lang='eng'><strong>99/100/100</strong></span> <span class='ocrx_word' id='word_1_53' title='bbox 387 415 392 445; x_wconf 0' lang='eng'><strong></strong></span> <span class='ocrx_word' id='word_1_54' title='bbox 477 419 620 443; x_wconf 87' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 628 419 748 443; x_wconf 85' lang='eng' dir='ltr'><em>pod/ipaevi</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 989 426 993 448; x_wconf 55' lang='eng'><strong>5</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 244 448 1060 498; baseline -0.001 -30"><span class='ocrx_word' id='word_1_57' title='bbox 244 453 360 476; x_wconf 77' lang='eng'><em>63/86/67</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 387 449 392 454; x_wconf 83' lang='eng'><strong>&#39;</strong></span> <span class='ocrx_word' id='word_1_59' title='bbox 479 448 529 468; x_wconf 88' lang='eng' dir='ltr'><em>59L|</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 539 454 552 463; x_wconf 99' lang='eng'><strong>=</strong></span> <span class='ocrx_word' id='word_1_61' title='bbox 561 448 581 467; x_wconf 97' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 591 448 619 468; x_wconf 87' lang='eng' dir='ltr'><em>cf.</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 627 448 757 472; x_wconf 86' lang='eng' dir='ltr'><em>podlipaevi</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 989 453 993 475; x_wconf 73' lang='eng' dir='ltr'>g</span> <span class='ocrx_word' id='word_1_65' title='bbox 1016 467 1037 498; x_wconf 86' lang='eng' dir='ltr'>L</span> <span class='ocrx_word' id='word_1_66' title='bbox 1039 467 1060 498; x_wconf 79' lang='eng'>2</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 445 478 993 788">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 445 478 993 788">
+     <span class='ocr_line' id='line_1_25' title="bbox 477 478 929 502; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 477 478 540 497; x_wconf 87' lang='eng' dir='ltr'><em>34EC</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 550 483 563 492; x_wconf 98' lang='eng'>=</span> <span class='ocrx_word' id='word_1_69' title='bbox 572 478 825 502; x_wconf 85' lang='eng' dir='ltr'><em>Leptomonasjaderae</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 834 483 869 502; x_wconf 84' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 879 483 929 497; x_wconf 91' lang='eng' dir='ltr'><em>nov.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 466 505 993 536; baseline 0 -5"><span class='ocrx_word' id='word_1_72' title='bbox 466 512 532 531; x_wconf 88' lang='eng' dir='ltr'><em>73BR</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 540 517 554 526; x_wconf 99' lang='eng'><strong><em>=</em></strong></span> <span class='ocrx_word' id='word_1_74' title='bbox 563 512 717 536; x_wconf 84' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 726 517 879 536; x_wconf 85' lang='eng' dir='ltr'><em>neopamerae</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 887 517 923 536; x_wconf 90' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 933 505 993 531; x_wconf 66' lang='eng' dir='ltr'><em>nov.5</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 462 540 993 575; baseline 0 -5"><span class='ocrx_word' id='word_1_78' title='bbox 462 551 605 575; x_wconf 77' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 613 551 712 570; x_wconf 78' lang='eng' dir='ltr'><em>bifurcata</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 989 540 993 553; x_wconf 50' lang='eng'><strong>2</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 449 584 800 603; baseline 0 0"><span class='ocrx_word' id='word_1_81' title='bbox 449 584 549 603; x_wconf 83' lang='eng' dir='ltr'><em>‘Crithidia</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 559 584 720 603; x_wconf 79' lang='eng' dir='ltr'><em>deanei‘ATCC</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 730 584 800 603; x_wconf 78' lang='eng'><em>30255</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 447 623 747 643; baseline -0.003 0"><span class='ocrx_word' id='word_1_84' title='bbox 447 623 614 643; x_wconf 80' lang='eng' dir='ltr'><em>‘Blastocrithidia</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 624 624 747 643; x_wconf 83' lang='eng' dir='ltr'><em>miridarum’</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 475 656 777 680; baseline 0 -5"><span class='ocrx_word' id='word_1_86' title='bbox 475 656 618 680; x_wconf 74' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 627 656 777 675; x_wconf 80' lang='eng' dir='ltr'><em>costaricensis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 459 691 717 715; baseline 0 -5"><span class='ocrx_word' id='word_1_88' title='bbox 459 691 645 715; x_wconf 79' lang='eng' dir='ltr'><em>Trypanosomatid</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 656 691 717 710; x_wconf 89' lang='eng' dir='ltr'>G755</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 445 727 696 751; baseline 0 -5"><span class='ocrx_word' id='word_1_90' title='bbox 445 727 598 751; x_wconf 75' lang='eng' dir='ltr'><em>‘Leptomonas&#39;</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 608 732 640 751; x_wconf 84' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 651 727 696 746; x_wconf 89' lang='eng' dir='ltr'><em>Cfm</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 486 763 744 788; baseline 0 -6"><span class='ocrx_word' id='word_1_93' title='bbox 486 763 629 787; x_wconf 85' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 638 763 744 788; x_wconf 87' lang='eng' dir='ltr'><em>seymouri</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 456 803 921 893">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 456 803 921 893">
+     <span class='ocr_line' id='line_1_34' title="bbox 456 803 878 828; baseline 0 -6"><span class='ocrx_word' id='word_1_95' title='bbox 456 803 521 823; x_wconf 88' lang='eng' dir='ltr'><em>128$l</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 531 809 544 818; x_wconf 99' lang='eng'><strong>=</strong></span> <span class='ocrx_word' id='word_1_97' title='bbox 555 803 658 823; x_wconf 85' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 665 804 774 827; x_wconf 91' lang='eng' dir='ltr'><em>permixta</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 783 808 818 828; x_wconf 88' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 828 808 878 823; x_wconf 94' lang='eng' dir='ltr'><em>nov.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 460 836 921 861; baseline 0 -5"><span class='ocrx_word' id='word_1_101' title='bbox 460 837 536 856; x_wconf 90' lang='eng' dir='ltr'><em>127AL</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 545 842 559 851; x_wconf 98' lang='eng'><strong>=</strong></span> <span class='ocrx_word' id='word_1_103' title='bbox 569 836 673 856; x_wconf 86' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 681 837 817 856; x_wconf 86' lang='eng' dir='ltr'><em>abscondita</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 826 841 861 861; x_wconf 92' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 871 841 921 856; x_wconf 88' lang='eng' dir='ltr'><em>nov.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 465 869 904 893; baseline 0 -5"><span class='ocrx_word' id='word_1_107' title='bbox 465 869 540 888; x_wconf 84' lang='eng' dir='ltr'><strong>119YS</strong></span> <span class='ocrx_word' id='word_1_108' title='bbox 550 874 563 883; x_wconf 99' lang='eng'>=</span> <span class='ocrx_word' id='word_1_109' title='bbox 573 869 677 888; x_wconf 86' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 685 869 800 893; x_wconf 84' lang='eng' dir='ltr'><em>insperata</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 809 874 844 893; x_wconf 87' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 854 874 904 888; x_wconf 91' lang='eng' dir='ltr'><em>nov.</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 536 906 929 969">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 536 906 929 969">
+     <span class='ocr_line' id='line_1_37' title="bbox 536 906 822 931; baseline 0.003 -6"><span class='ocrx_word' id='word_1_113' title='bbox 536 907 680 931; x_wconf 83' lang='eng' dir='ltr'><em>Phytomonas</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 689 911 781 931; x_wconf 83' lang='eng' dir='ltr'><em>serpens</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 791 906 822 926; x_wconf 83' lang='eng' dir='ltr'><em>1G</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 540 938 929 969; baseline 0 -9"><span class='ocrx_word' id='word_1_116' title='bbox 540 941 685 966; x_wconf 78' lang='eng' dir='ltr'><em>Phytomonas</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 693 946 725 966; x_wconf 89' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 736 941 783 960; x_wconf 84' lang='eng' dir='ltr'><em>EM1</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 905 938 929 969; x_wconf 91' lang='eng' dir='ltr'>P</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 260 559 565 994">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 260 559 565 994">
+     <span class='ocr_line' id='line_1_39' title="bbox 404 559 456 575; baseline 0 1020"><span class='ocrx_word' id='word_1_120' title='bbox 404 559 456 575; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 404 575 449 653; baseline 0 -41"><span class='ocrx_word' id='word_1_121' title='bbox 404 575 449 653; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 301 653 469 692; baseline 0 0"><span class='ocrx_word' id='word_1_122' title='bbox 301 653 469 692; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 286 692 450 728; baseline 0 -13"><span class='ocrx_word' id='word_1_123' title='bbox 286 692 450 728; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 260 728 476 840; baseline 0 -77"><span class='ocrx_word' id='word_1_124' title='bbox 260 728 476 840; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 301 840 465 905; baseline 0 0"><span class='ocrx_word' id='word_1_125' title='bbox 301 840 465 905; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 301 905 533 943; baseline 0 652"><span class='ocrx_word' id='word_1_126' title='bbox 301 905 533 943; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 301 943 540 978; baseline 0 0"><span class='ocrx_word' id='word_1_127' title='bbox 301 943 540 978; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 448 978 565 994; baseline 0 601"><span class='ocrx_word' id='word_1_128' title='bbox 448 978 565 994; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 150 563 404 661">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 150 580 404 661">
+     <span class='ocr_line' id='line_1_48' title="bbox 314 580 404 629; baseline -0.011 -9"><span class='ocrx_word' id='word_1_129' title='bbox 314 580 404 629; x_wconf 43' lang='eng'><em>54/75}</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 150 633 392 661; baseline 0 0"><span class='ocrx_word' id='word_1_130' title='bbox 150 638 266 661; x_wconf 86' lang='eng'><em>63/81/65</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 387 633 392 655; x_wconf 72' lang='eng' dir='ltr'>S</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 192 695 286 717">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 192 695 286 717">
+     <span class='ocr_line' id='line_1_50' title="bbox 192 695 286 717; baseline 0 0"><span class='ocrx_word' id='word_1_132' title='bbox 192 695 286 717; x_wconf 86' lang='eng'><em>51/*/55</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 262 1019 933 1206">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 262 1019 875 1197">
+     <span class='ocr_line' id='line_1_51' title="bbox 551 1019 799 1070; baseline 0 0"><span class='ocrx_word' id='word_1_133' title='bbox 551 1054 609 1070; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> <span class='ocrx_word' id='word_1_134' title='bbox 775 1019 799 1070; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 551 1070 793 1092; baseline 0 503"><span class='ocrx_word' id='word_1_135' title='bbox 551 1070 793 1092; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 262 1092 795 1141; baseline 0 -18"><span class='ocrx_word' id='word_1_136' title='bbox 262 1092 795 1141; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 262 1141 645 1160; baseline 0 435"><span class='ocrx_word' id='word_1_137' title='bbox 262 1141 645 1160; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 551 1160 875 1197; baseline 0 -11"><span class='ocrx_word' id='word_1_138' title='bbox 551 1160 645 1186; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> <span class='ocrx_word' id='word_1_139' title='bbox 810 1160 875 1197; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 144 1071 266 1073">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 144 1071 266 1073">
+     <span class='ocr_line' id='line_1_56' title="bbox 144 1071 266 1073; baseline 0 522"><span class='ocrx_word' id='word_1_140' title='bbox 144 1071 266 1073; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 113 978 1149 1112">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 113 978 1149 1112">
+     <span class='ocr_line' id='line_1_57' title="bbox 279 978 848 1003; baseline -0.009 -1"><span class='ocrx_word' id='word_1_141' title='bbox 279 980 444 1003; x_wconf 89' lang='eng'><strong>100/100/100</strong></span> <span class='ocrx_word' id='word_1_142' title='bbox 573 978 717 1003; x_wconf 84' lang='eng' dir='ltr'><em>Phytomonas</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 726 983 757 1003; x_wconf 87' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 769 978 848 997; x_wconf 86' lang='eng' dir='ltr'>HART1</span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 113 1017 1123 1075; baseline -0.003 -35"><span class='ocrx_word' id='word_1_145' title='bbox 113 1030 230 1053; x_wconf 75' lang='eng'><em>88/77/76</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 609 1036 775 1059; x_wconf 70' lang='eng'><strong>100/100/100</strong></span> <span class='ocrx_word' id='word_1_147' title='bbox 806 1018 977 1075; x_wconf 60' lang='eng' dir='ltr'><em>Zerpetomonas</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 986 1022 1017 1058; x_wconf 46' lang='eng' dir='ltr'><em>sp:</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 1027 1017 1123 1058; x_wconf 40' lang='eng' dir='ltr'><em>TOG-263</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 827 1057 1081 1080; baseline 0 -5"><span class='ocrx_word' id='word_1_150' title='bbox 827 1057 979 1080; x_wconf 83' lang='eng' dir='ltr'><em>erpetomonas</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 988 1057 1081 1075; x_wconf 76' lang='eng' dir='ltr'><em>rortmam</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 378 1089 1149 1112; baseline -0.004 -1"><span class='ocrx_word' id='word_1_152' title='bbox 378 1089 527 1112; x_wconf 85' lang='eng'><strong>100/99/100</strong></span> <span class='ocrx_word' id='word_1_153' title='bbox 809 1089 903 1108; x_wconf 77' lang='eng' dir='ltr'><em>Crilhidia</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 912 1089 991 1108; x_wconf 83' lang='eng' dir='ltr'><em>deanei</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 998 1089 1068 1108; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 1078 1089 1149 1108; x_wconf 86' lang='eng'><em>30969</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 645 1152 810 1175">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 645 1152 810 1175">
+     <span class='ocr_line' id='line_1_61' title="bbox 645 1152 810 1175; baseline 0 0"><span class='ocrx_word' id='word_1_157' title='bbox 645 1152 810 1175; x_wconf 91' lang='eng'><strong>100/100/100</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 446 1235 448 1272">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 446 1235 448 1272">
+     <span class='ocr_line' id='line_1_62' title="bbox 446 1235 448 1272; baseline 0 323"><span class='ocrx_word' id='word_1_158' title='bbox 446 1235 448 1272; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 4 1268 146 1270">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 4 1268 146 1270">
+     <span class='ocr_line' id='line_1_63' title="bbox 4 1268 146 1270; baseline 0 325"><span class='ocrx_word' id='word_1_159' title='bbox 4 1268 146 1270; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 4 1268 6 1521">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 4 1268 6 1521">
+     <span class='ocr_line' id='line_1_64' title="bbox 4 1268 6 1521; baseline 0 74"><span class='ocrx_word' id='word_1_160' title='bbox 4 1268 6 1521; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 415 1305 417 1344">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 415 1305 417 1344">
+     <span class='ocr_line' id='line_1_65' title="bbox 415 1305 417 1344; baseline 0 251"><span class='ocrx_word' id='word_1_161' title='bbox 415 1305 417 1344; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 264 1198 916 1390">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 277 1198 916 1390">
+     <span class='ocr_line' id='line_1_66' title="bbox 294 1198 459 1221; baseline 0 0"><span class='ocrx_word' id='word_1_162' title='bbox 294 1198 302 1220; x_wconf 91' lang='eng'>1</span> <span class='ocrx_word' id='word_1_163' title='bbox 309 1198 361 1221; x_wconf 81' lang='eng'><strong>00/1</strong></span> <span class='ocrx_word' id='word_1_164' title='bbox 368 1198 421 1221; x_wconf 90' lang='eng'><strong>00/1</strong></span> <span class='ocrx_word' id='word_1_165' title='bbox 428 1198 459 1221; x_wconf 92' lang='eng'><em>00</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 564 1209 916 1281; baseline 0 -36"><span class='ocrx_word' id='word_1_166' title='bbox 564 1226 735 1250; x_wconf 80' lang='eng' dir='ltr'><em>Herpetomonas</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 744 1231 865 1245; x_wconf 88' lang='eng' dir='ltr'><em>muscarum</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 893 1209 916 1281; x_wconf 81' lang='eng' dir='ltr'>:l</span> 
+     </span>
+     <span class='ocr_line' id='line_1_68' title="bbox 614 1262 872 1286; baseline 0 -5"><span class='ocrx_word' id='word_1_169' title='bbox 614 1262 785 1286; x_wconf 84' lang='eng' dir='ltr'><em>Herpetamonas</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 794 1262 872 1286; x_wconf 75' lang='eng' dir='ltr'><em>ztiplika</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_69' title="bbox 277 1278 849 1315; baseline 0 0"><span class='ocrx_word' id='word_1_171' title='bbox 277 1278 393 1301; x_wconf 76' lang='eng'><em>97/86/80</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 570 1296 732 1315; x_wconf 72' lang='eng' dir='ltr'><em>Blastecrithidia</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 741 1296 849 1315; x_wconf 79' lang='eng' dir='ltr'><em>triatomae</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_70' title="bbox 641 1333 882 1358; baseline 0 -5"><span class='ocrx_word' id='word_1_174' title='bbox 641 1333 882 1358; x_wconf 79' lang='eng' dir='ltr'><em>Leptomonasjaculum</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 450 1366 666 1390; baseline 0 -5"><span class='ocrx_word' id='word_1_175' title='bbox 450 1366 537 1390; x_wconf 82' lang='eng' dir='ltr'><em>Serge/a</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 545 1366 666 1390; x_wconf 82' lang='eng' dir='ltr'><em>pad/ipaevi</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 264 733 266 1414">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 264 733 266 1414">
+     <span class='ocr_line' id='line_1_72' title="bbox 264 733 266 1414; baseline 0 181"><span class='ocrx_word' id='word_1_177' title='bbox 264 733 266 1414; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 737 1399 1005 1423">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 737 1399 1005 1423">
+     <span class='ocr_line' id='line_1_73' title="bbox 737 1399 1005 1423; baseline 0 -5"><span class='ocrx_word' id='word_1_178' title='bbox 737 1399 880 1423; x_wconf 81' lang='eng' dir='ltr'><em>Leptomonas</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 889 1399 1005 1418; x_wconf 83' lang='eng' dir='ltr'><em>col/osoma</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 139 1412 835 1497">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 139 1438 835 1497">
+     <span class='ocr_line' id='line_1_74' title="bbox 146 1438 835 1484; baseline -0.01 -20"><span class='ocrx_word' id='word_1_180' title='bbox 146 1446 540 1484; x_wconf 64' lang='eng'><strong>—{——</strong></span> <span class='ocrx_word' id='word_1_181' title='bbox 564 1438 720 1462; x_wconf 85' lang='eng' dir='ltr'><em>Trypanosoma</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 729 1438 835 1462; x_wconf 85' lang='eng' dir='ltr'><em>sce/opori</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_75' title="bbox 139 1471 635 1497; baseline -0.01 -3"><span class='ocrx_word' id='word_1_183' title='bbox 139 1474 273 1497; x_wconf 87' lang='eng'><strong>99/100/97</strong></span> <span class='ocrx_word' id='word_1_184' title='bbox 400 1471 557 1495; x_wconf 78' lang='eng' dir='ltr'><em>lepanosoma</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 566 1471 635 1490; x_wconf 88' lang='eng' dir='ltr'><em>avium</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 144 1071 146 1466">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 144 1071 146 1466">
+     <span class='ocr_line' id='line_1_76' title="bbox 144 1071 146 1466; baseline 0 129"><span class='ocrx_word' id='word_1_186' title='bbox 144 1071 146 1466; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 4 1519 561 1521">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 4 1519 561 1521">
+     <span class='ocr_line' id='line_1_77' title="bbox 4 1519 561 1521; baseline 0 74"><span class='ocrx_word' id='word_1_187' title='bbox 4 1519 561 1521; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 1 1558 59 1592">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 1 1573 46 1592">
+     <span class='ocr_line' id='line_1_78' title="bbox 1 1573 46 1592; baseline 0 0"><span class='ocrx_word' id='word_1_188' title='bbox 1 1573 46 1592; x_wconf 67' lang='eng'><strong>0,01</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 588 1510 739 1529">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 588 1510 739 1529">
+     <span class='ocr_line' id='line_1_79' title="bbox 588 1510 739 1529; baseline 0 0"><span class='ocrx_word' id='word_1_189' title='bbox 588 1510 648 1529; x_wconf 85' lang='eng' dir='ltr'><em>Bode</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 657 1510 739 1529; x_wconf 82' lang='eng' dir='ltr'><em>sa/tans</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 810 1124 1189 1148">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 810 1124 1189 1148">
+     <span class='ocr_line' id='line_1_80' title="bbox 810 1124 1189 1148; baseline 0 -5"><span class='ocrx_word' id='word_1_191' title='bbox 810 1124 911 1143; x_wconf 82' lang='eng' dir='ltr'><em>‘Crithidia</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 921 1124 1108 1148; x_wconf 76' lang='eng' dir='ltr'><em>oncope/ti’ATCC</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 1118 1124 1189 1143; x_wconf 85' lang='eng'><em>30264</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 875 1161 1239 1210">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 875 1161 1239 1210">
+     <span class='ocr_line' id='line_1_81' title="bbox 875 1161 1239 1185; baseline 0 -5"><span class='ocrx_word' id='word_1_194' title='bbox 875 1161 968 1180; x_wconf 80' lang='eng' dir='ltr'><em>Crithidia</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 978 1161 1083 1185; x_wconf 82' lang='eng' dir='ltr'><em>oncope/ti</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 1090 1161 1159 1180; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 1171 1161 1239 1180; x_wconf 85' lang='eng'><em>12982</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_82' title="bbox 941 1191 1183 1210; baseline 0 0"><span class='ocrx_word' id='word_1_198' title='bbox 941 1191 1103 1210; x_wconf 71' lang='eng' dir='ltr'><em>BIastocrithid/a</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 1113 1191 1183 1210; x_wconf 80' lang='eng' dir='ltr'><em>oulicis</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-000.pbm.png
new file mode 100644
index 00000000..b79a8189
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-000.pbm.png.hocr
new file mode 100644
index 00000000..73ebc98a
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-000.pbm.png.hocr
@@ -0,0 +1,138 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001172-0-000.pbm.png"; bbox 0 0 994 873; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 74 33 918 864">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 74 33 918 864">
+     <span class='ocr_line' id='line_1_1' title="bbox 74 33 918 58; baseline 0.002 -6"><span class='ocrx_word' id='word_1_1' title='bbox 74 38 83 52; x_wconf 88' lang='eng'>2</span> <span class='ocrx_word' id='word_1_2' title='bbox 89 38 105 52; x_wconf 81' lang='eng'><strong>%</strong></span> <span class='ocrx_word' id='word_1_3' title='bbox 378 35 397 54; x_wconf 96' lang='eng' dir='ltr'><strong><em>L.</em></strong></span> <span class='ocrx_word' id='word_1_4' title='bbox 405 33 596 55; x_wconf 83' lang='eng' dir='ltr'>fabifermentans</span> <span class='ocrx_word' id='word_1_5' title='bbox 605 34 660 54; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_6' title='bbox 668 33 756 55; x_wconf 83' lang='eng' dir='ltr'>24284T</span> <span class='ocrx_word' id='word_1_7' title='bbox 764 34 918 58; x_wconf 87' lang='eng' dir='ltr'>(AM905388)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 376 78 767 105; baseline 0 -6"><span class='ocrx_word' id='word_1_8' title='bbox 376 79 392 99; x_wconf 92' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_9' title='bbox 399 78 522 105; x_wconf 80' lang='eng' dir='ltr'>plantarum</span> <span class='ocrx_word' id='word_1_10' title='bbox 529 79 578 99; x_wconf 87' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_11' title='bbox 589 78 767 102; x_wconf 67' lang='eng' dir='ltr'>1149T(D79210)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 364 106 748 149; baseline 0 -5"><span class='ocrx_word' id='word_1_12' title='bbox 364 106 503 149; x_wconf 44' lang='eng' dir='ltr'>g(L.pem‘osus</span> <span class='ocrx_word' id='word_1_13' title='bbox 510 124 558 144; x_wconf 92' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_14' title='bbox 569 123 748 147; x_wconf 60' lang='eng' dir='ltr'>1558T(D79211)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 359 167 849 194; baseline 0.002 -6"><span class='ocrx_word' id='word_1_15' title='bbox 359 169 374 189; x_wconf 93' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_16' title='bbox 381 168 559 194; x_wconf 82' lang='eng' dir='ltr'>paraplantarum</span> <span class='ocrx_word' id='word_1_17' title='bbox 568 169 621 189; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_18' title='bbox 632 167 711 189; x_wconf 83' lang='eng' dir='ltr'>10667T</span> <span class='ocrx_word' id='word_1_19' title='bbox 719 168 849 192; x_wconf 88' lang='eng' dir='ltr'>(AJ306297)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 341 212 736 239; baseline 0.003 -6"><span class='ocrx_word' id='word_1_20' title='bbox 341 214 357 234; x_wconf 90' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_21' title='bbox 365 213 448 239; x_wconf 85' lang='eng' dir='ltr'>algidus</span> <span class='ocrx_word' id='word_1_22' title='bbox 455 213 504 234; x_wconf 89' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_23' title='bbox 515 212 593 234; x_wconf 71' lang='eng' dir='ltr'>10491T</span> <span class='ocrx_word' id='word_1_24' title='bbox 602 213 736 237; x_wconf 88' lang='eng' dir='ltr'>(ABO33209)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 410 257 813 281; baseline 0 -3"><span class='ocrx_word' id='word_1_25' title='bbox 410 258 426 278; x_wconf 92' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_26' title='bbox 434 258 556 278; x_wconf 85' lang='eng' dir='ltr'>saerimneri</span> <span class='ocrx_word' id='word_1_27' title='bbox 563 257 670 278; x_wconf 73' lang='eng' dir='ltr'>GDA154T</span> <span class='ocrx_word' id='word_1_28' title='bbox 678 258 813 281; x_wconf 86' lang='eng' dir='ltr'>(AY255802)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 410 302 790 329; baseline 0.003 -6"><span class='ocrx_word' id='word_1_29' title='bbox 410 304 426 323; x_wconf 92' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_30' title='bbox 434 303 550 329; x_wconf 85' lang='eng' dir='ltr'>acidipiscis</span> <span class='ocrx_word' id='word_1_31' title='bbox 559 302 647 324; x_wconf 81' lang='eng' dir='ltr'>F560-1T</span> <span class='ocrx_word' id='word_1_32' title='bbox 655 303 790 327; x_wconf 80' lang='eng' dir='ltr'>(ABOZ3836)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 376 347 759 371; baseline 0 -3"><span class='ocrx_word' id='word_1_33' title='bbox 376 348 392 368; x_wconf 92' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_34' title='bbox 400 348 489 368; x_wconf 88' lang='eng' dir='ltr'>aviarius</span> <span class='ocrx_word' id='word_1_35' title='bbox 499 348 552 368; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_36' title='bbox 560 347 641 368; x_wconf 87' lang='eng' dir='ltr'>20655T</span> <span class='ocrx_word' id='word_1_37' title='bbox 649 348 759 371; x_wconf 88' lang='eng' dir='ltr'>(M58808)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 358 392 792 416; baseline 0 -3"><span class='ocrx_word' id='word_1_38' title='bbox 358 393 374 413; x_wconf 92' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 382 392 490 413; x_wconf 85' lang='eng' dir='ltr'>salivarius</span> <span class='ocrx_word' id='word_1_40' title='bbox 498 393 561 413; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_41' title='bbox 571 394 577 413; x_wconf 96' lang='eng'>1</span> <span class='ocrx_word' id='word_1_42' title='bbox 586 394 636 413; x_wconf 95' lang='eng'>1741</span> <span class='ocrx_word' id='word_1_43' title='bbox 642 392 650 403; x_wconf 68' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_44' title='bbox 658 393 792 416; x_wconf 86' lang='eng' dir='ltr'>(AF089108)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 285 436 667 461; baseline 0 -3"><span class='ocrx_word' id='word_1_45' title='bbox 285 445 309 447; x_wconf 88' lang='eng'>—</span> <span class='ocrx_word' id='word_1_46' title='bbox 324 438 340 458; x_wconf 95' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_47' title='bbox 348 437 399 458; x_wconf 87' lang='eng' dir='ltr'><em>mali</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 407 438 459 458; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_49' title='bbox 468 436 549 458; x_wconf 72' lang='eng' dir='ltr'>20444T</span> <span class='ocrx_word' id='word_1_50' title='bbox 558 437 667 461; x_wconf 90' lang='eng' dir='ltr'>(M58824)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 285 481 799 506; baseline 0.002 -4"><span class='ocrx_word' id='word_1_51' title='bbox 285 491 308 493; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_52' title='bbox 323 483 342 503; x_wconf 87' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_53' title='bbox 350 488 477 503; x_wconf 83' lang='eng' dir='ltr'>cacaonum</span> <span class='ocrx_word' id='word_1_54' title='bbox 485 483 541 502; x_wconf 89' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_55' title='bbox 550 481 637 503; x_wconf 76' lang='eng' dir='ltr'>24285T</span> <span class='ocrx_word' id='word_1_56' title='bbox 645 482 799 506; x_wconf 86' lang='eng' dir='ltr'>(AM905389)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 393 526 672 557; baseline 0.004 -10"><span class='ocrx_word' id='word_1_57' title='bbox 393 528 408 547; x_wconf 96' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_58' title='bbox 416 526 492 553; x_wconf 84' lang='eng' dir='ltr'><em>nagelii</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 500 526 672 557; x_wconf 59' lang='eng' dir='ltr'>LuEwT(Y17500)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 324 571 768 595; baseline 0 -3"><span class='ocrx_word' id='word_1_60' title='bbox 324 572 340 592; x_wconf 96' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_61' title='bbox 347 572 487 592; x_wconf 81' lang='eng' dir='ltr'>satsumensis</span> <span class='ocrx_word' id='word_1_62' title='bbox 496 572 551 592; x_wconf 92' lang='eng' dir='ltr'>NRIC</span> <span class='ocrx_word' id='word_1_63' title='bbox 559 571 625 592; x_wconf 85' lang='eng' dir='ltr'>0604T</span> <span class='ocrx_word' id='word_1_64' title='bbox 633 572 768 595; x_wconf 89' lang='eng' dir='ltr'>(AB154519)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 358 616 746 641; baseline 0 -4"><span class='ocrx_word' id='word_1_65' title='bbox 358 618 374 637; x_wconf 98' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_66' title='bbox 382 617 476 637; x_wconf 90' lang='eng' dir='ltr'>murinus</span> <span class='ocrx_word' id='word_1_67' title='bbox 485 617 538 637; x_wconf 93' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_68' title='bbox 547 616 628 637; x_wconf 88' lang='eng' dir='ltr'>20452T</span> <span class='ocrx_word' id='word_1_69' title='bbox 636 617 746 641; x_wconf 87' lang='eng' dir='ltr'>(M58826)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 359 661 750 685; baseline 0 -3"><span class='ocrx_word' id='word_1_70' title='bbox 359 662 374 682; x_wconf 95' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_71' title='bbox 382 661 480 682; x_wconf 83' lang='eng' dir='ltr'>animalis</span> <span class='ocrx_word' id='word_1_72' title='bbox 489 662 542 682; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_73' title='bbox 551 661 631 682; x_wconf 81' lang='eng' dir='ltr'>20602T</span> <span class='ocrx_word' id='word_1_74' title='bbox 640 662 750 685; x_wconf 87' lang='eng' dir='ltr'>(M58807)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 376 705 708 732; baseline 0 -5"><span class='ocrx_word' id='word_1_75' title='bbox 376 707 392 727; x_wconf 95' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_76' title='bbox 400 707 449 732; x_wconf 87' lang='eng' dir='ltr'><em>equi</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 456 707 492 727; x_wconf 95' lang='eng' dir='ltr'>YIT</span> <span class='ocrx_word' id='word_1_78' title='bbox 499 705 565 727; x_wconf 90' lang='eng' dir='ltr'>0455T</span> <span class='ocrx_word' id='word_1_79' title='bbox 573 706 708 730; x_wconf 85' lang='eng' dir='ltr'>(ABO48833)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 273 750 711 777; baseline 0.002 -6"><span class='ocrx_word' id='word_1_80' title='bbox 273 758 349 760; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_81' title='bbox 359 752 374 772; x_wconf 93' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_82' title='bbox 382 751 441 777; x_wconf 82' lang='eng' dir='ltr'><em>agilis</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 450 751 504 772; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_84' title='bbox 513 750 593 772; x_wconf 88' lang='eng' dir='ltr'>20509T</span> <span class='ocrx_word' id='word_1_85' title='bbox 601 751 711 775; x_wconf 87' lang='eng' dir='ltr'>(M58803)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 376 795 755 820; baseline 0 -4"><span class='ocrx_word' id='word_1_86' title='bbox 376 797 392 816; x_wconf 92' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_87' title='bbox 400 796 485 816; x_wconf 88' lang='eng' dir='ltr'><em>ruminis</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 494 796 547 816; x_wconf 85' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_89' title='bbox 556 795 637 816; x_wconf 73' lang='eng' dir='ltr'>20403T</span> <span class='ocrx_word' id='word_1_90' title='bbox 645 796 755 820; x_wconf 88' lang='eng' dir='ltr'>(M58828)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 185 840 603 864; baseline 0 -3"><span class='ocrx_word' id='word_1_91' title='bbox 185 841 201 861; x_wconf 93' lang='eng' dir='ltr'>L.</span> <span class='ocrx_word' id='word_1_92' title='bbox 209 840 335 861; x_wconf 81' lang='eng' dir='ltr'>delbrueckii</span> <span class='ocrx_word' id='word_1_93' title='bbox 343 841 396 861; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_94' title='bbox 404 840 485 861; x_wconf 87' lang='eng' dir='ltr'>20074T</span> <span class='ocrx_word' id='word_1_95' title='bbox 493 841 603 864; x_wconf 86' lang='eng' dir='ltr'>(M58814)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 39 409 854">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 39 409 854">
+     <span class='ocr_line' id='line_1_20' title="bbox 180 39 375 85; baseline 0 -15"><span class='ocrx_word' id='word_1_96' title='bbox 180 39 375 85; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 180 85 360 118; baseline 0 755"><span class='ocrx_word' id='word_1_97' title='bbox 180 85 360 118; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 176 118 358 207; baseline 0 -8"><span class='ocrx_word' id='word_1_98' title='bbox 176 118 358 207; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 0 207 409 335; baseline 0 0"><span class='ocrx_word' id='word_1_99' title='bbox 0 207 409 335; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 0 335 376 383; baseline 0.008 -3"><span class='ocrx_word' id='word_1_100' title='bbox 0 335 376 383; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 0 383 255 428; baseline 0 445"><span class='ocrx_word' id='word_1_101' title='bbox 0 383 255 428; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 0 428 282 473; baseline 0 400"><span class='ocrx_word' id='word_1_102' title='bbox 0 428 282 473; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 0 473 285 518; baseline 0 355"><span class='ocrx_word' id='word_1_103' title='bbox 0 473 285 518; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 0 518 387 559; baseline 0 314"><span class='ocrx_word' id='word_1_104' title='bbox 0 518 387 559; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 0 559 324 607; baseline 0 266"><span class='ocrx_word' id='word_1_105' title='bbox 0 559 324 607; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 0 607 347 697; baseline 0 0"><span class='ocrx_word' id='word_1_106' title='bbox 0 607 347 697; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 0 697 347 737; baseline 0 136"><span class='ocrx_word' id='word_1_107' title='bbox 0 697 347 737; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 0 737 273 790; baseline 0 83"><span class='ocrx_word' id='word_1_108' title='bbox 0 737 273 790; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 0 790 366 854; baseline 0 0"><span class='ocrx_word' id='word_1_109' title='bbox 0 790 366 854; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 49 65 130 68">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 49 65 130 68">
+     <span class='ocr_line' id='line_1_34' title="bbox 49 65 130 68; baseline 0 805"><span class='ocrx_word' id='word_1_110' title='bbox 49 65 130 68; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 142 199 173 214">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 142 199 173 214">
+     <span class='ocr_line' id='line_1_35' title="bbox 142 199 173 214; baseline -0.032 0"><span class='ocrx_word' id='word_1_111' title='bbox 142 199 173 214; x_wconf 81' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 249 357 251 403">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 249 357 251 403">
+     <span class='ocr_line' id='line_1_36' title="bbox 249 357 251 403; baseline 0 470"><span class='ocrx_word' id='word_1_112' title='bbox 249 357 251 403; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 251 401 349 403">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 251 401 349 403">
+     <span class='ocr_line' id='line_1_37' title="bbox 251 401 349 403; baseline 0 470"><span class='ocrx_word' id='word_1_113' title='bbox 251 401 349 403; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 283 445 285 493">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 283 445 285 493">
+     <span class='ocr_line' id='line_1_38' title="bbox 283 445 285 493; baseline 0 380"><span class='ocrx_word' id='word_1_114' title='bbox 283 445 285 493; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 271 714 273 760">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 271 714 273 760">
+     <span class='ocr_line' id='line_1_39' title="bbox 271 714 273 760; baseline 0 113"><span class='ocrx_word' id='word_1_115' title='bbox 271 714 273 760; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 967 0 994 226">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 967 0 994 226">
+     <span class='ocr_line' id='line_1_40' title="bbox 967 0 994 226; textangle 90"><span class='ocrx_word' id='word_1_116' title='bbox 967 154 987 226; x_wconf 71' lang='eng' dir='ltr'>dn016</span> <span class='ocrx_word' id='word_1_117' title='bbox 967 23 994 146; x_wconf 66' lang='eng' dir='ltr'>Lummun/d</span> <span class='ocrx_word' id='word_1_118' title='bbox 973 0 993 16; x_wconf 72' lang='eng'>&#39;7</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 967 446 994 657">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 967 446 994 657">
+     <span class='ocr_line' id='line_1_41' title="bbox 967 446 994 657; textangle 90"><span class='ocrx_word' id='word_1_119' title='bbox 967 585 987 657; x_wconf 78' lang='eng' dir='ltr'>dnmﬁ</span> <span class='ocrx_word' id='word_1_120' title='bbox 973 470 994 577; x_wconf 68' lang='eng' dir='ltr'>snymyns</span> <span class='ocrx_word' id='word_1_121' title='bbox 973 446 993 462; x_wconf 79' lang='eng'>&#39;7</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-001.pbm.png
new file mode 100644
index 00000000..45cf927d
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-001.pbm.png.hocr
new file mode 100644
index 00000000..647736e3
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001172-0-001.pbm.png.hocr
@@ -0,0 +1,167 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001172-0-001.pbm.png"; bbox 0 0 888 1005; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 100 40 140 53">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 100 40 140 53">
+     <span class='ocr_line' id='line_1_1' title="bbox 100 40 140 53; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 100 40 140 53; x_wconf 83' lang='eng'><em>10%</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 269 45 362 47">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 269 45 362 47">
+     <span class='ocr_line' id='line_1_2' title="bbox 269 45 362 47; baseline 0 958"><span class='ocrx_word' id='word_1_2' title='bbox 269 45 362 47; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 368 37 888 61">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 368 37 888 61">
+     <span class='ocr_line' id='line_1_3' title="bbox 368 37 888 61; baseline 0 -3"><span class='ocrx_word' id='word_1_3' title='bbox 368 39 386 58; x_wconf 90' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 394 38 578 58; x_wconf 81' lang='eng' dir='ltr'><em>fabifermentans</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 586 39 639 58; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 647 37 732 58; x_wconf 79' lang='eng' dir='ltr'><em>24284T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 740 38 888 61; x_wconf 86' lang='eng' dir='ltr'><em>(AM922294)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 2 80 862 232">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 2 80 862 232">
+     <span class='ocr_line' id='line_1_4' title="bbox 395 80 812 106; baseline -0.002 -5"><span class='ocrx_word' id='word_1_8' title='bbox 395 82 410 101; x_wconf 92' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 417 81 535 106; x_wconf 77' lang='eng' dir='ltr'><em>plantarum</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 545 81 594 101; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 603 80 667 101; x_wconf 73' lang='eng' dir='ltr'><em>6907T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 675 81 812 104; x_wconf 86' lang='eng' dir='ltr'><em>(AM087714)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 329 88 862 177; baseline 0 -34"><span class='ocrx_word' id='word_1_13' title='bbox 329 88 370 177; x_wconf 70' lang='eng' dir='ltr'>E</span> <span class='ocrx_word' id='word_1_14' title='bbox 378 124 394 143; x_wconf 94' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 400 123 571 149; x_wconf 79' lang='eng' dir='ltr'><em>paraplantarum</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 580 124 630 143; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 640 123 717 143; x_wconf 88' lang='eng' dir='ltr'><em>16673T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 725 124 862 146; x_wconf 88' lang='eng' dir='ltr'><em>(AM087727)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 378 165 790 191; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 378 167 394 186; x_wconf 94' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 400 169 500 191; x_wconf 81' lang='eng' dir='ltr'><em>pentosus</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 509 167 559 186; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 569 165 645 186; x_wconf 75' lang='eng' dir='ltr'><em>10755T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 653 166 790 189; x_wconf 86' lang='eng' dir='ltr'><em>(AM087713)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 2 208 493 232; baseline 0.002 -4"><span class='ocrx_word' id='word_1_24' title='bbox 2 217 65 219; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_25' title='bbox 74 210 89 229; x_wconf 92' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 97 209 218 229; x_wconf 84' lang='eng' dir='ltr'><em>delbrueckii</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 225 210 275 229; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 283 208 348 229; x_wconf 74' lang='eng' dir='ltr'><em>6412T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 355 209 493 232; x_wconf 85' lang='eng' dir='ltr'><em>(AM087689)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 72 61 167 64">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 72 61 167 64">
+     <span class='ocr_line' id='line_1_8' title="bbox 72 61 167 64; baseline 0 941"><span class='ocrx_word' id='word_1_30' title='bbox 72 61 167 64; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 0 94 269 96">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 0 94 269 96">
+     <span class='ocr_line' id='line_1_9' title="bbox 0 94 269 96; baseline 0 909"><span class='ocrx_word' id='word_1_31' title='bbox 0 94 269 96; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 267 45 269 141">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 267 45 269 141">
+     <span class='ocr_line' id='line_1_10' title="bbox 267 45 269 141; baseline 0 864"><span class='ocrx_word' id='word_1_32' title='bbox 267 45 269 141; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 9 334 30 357">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 9 334 30 357">
+     <span class='ocr_line' id='line_1_11' title="bbox 9 334 30 357; baseline 0.143 -3"><span class='ocrx_word' id='word_1_33' title='bbox 9 334 30 357; x_wconf 86' lang='eng' dir='ltr'>b)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 0 380 817 1005">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 277 380 707 403">
+     <span class='ocr_line' id='line_1_12' title="bbox 277 380 707 403; baseline 0 -3"><span class='ocrx_word' id='word_1_34' title='bbox 277 381 293 400; x_wconf 93' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 300 381 418 400; x_wconf 82' lang='eng' dir='ltr'><em>saerimneri</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 425 381 475 400; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 484 380 561 400; x_wconf 75' lang='eng' dir='ltr'><em>22087T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 569 381 707 403; x_wconf 89' lang='eng' dir='ltr'><em>(AM087717)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 377 422 773 446">
+     <span class='ocr_line' id='line_1_13' title="bbox 377 422 773 446; baseline 0 -3"><span class='ocrx_word' id='word_1_39' title='bbox 377 424 393 443; x_wconf 71' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 401 424 483 443; x_wconf 76' lang='eng' dir='ltr'><em>ruminis</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 491 424 541 443; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 551 422 628 443; x_wconf 82' lang='eng' dir='ltr'><em>10756T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 635 424 773 446; x_wconf 90' lang='eng' dir='ltr'><em>(AM087756)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 377 465 737 491">
+     <span class='ocr_line' id='line_1_14' title="bbox 377 465 737 491; baseline 0 -5"><span class='ocrx_word' id='word_1_44' title='bbox 377 467 393 486; x_wconf 89' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 400 467 448 491; x_wconf 88' lang='eng' dir='ltr'><em>equi</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 456 467 506 486; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 514 465 592 486; x_wconf 81' lang='eng' dir='ltr'><em>21748T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 600 466 737 489; x_wconf 89' lang='eng' dir='ltr'><em>(AM087740)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 327 508 727 532">
+     <span class='ocr_line' id='line_1_15' title="bbox 327 508 727 532; baseline 0 -3"><span class='ocrx_word' id='word_1_49' title='bbox 327 510 343 529; x_wconf 87' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 350 510 437 529; x_wconf 83' lang='eng' dir='ltr'><em>aviarius</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 446 510 496 529; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 506 508 582 529; x_wconf 87' lang='eng' dir='ltr'><em>10753T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 590 509 727 532; x_wconf 86' lang='eng' dir='ltr'><em>(AMO87737)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 327 551 683 577">
+     <span class='ocr_line' id='line_1_16' title="bbox 327 551 683 577; baseline 0 -5"><span class='ocrx_word' id='word_1_54' title='bbox 327 553 343 572; x_wconf 90' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 350 552 407 577; x_wconf 83' lang='eng' dir='ltr'><em>agilis</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 416 553 466 572; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 474 551 538 572; x_wconf 80' lang='eng' dir='ltr'><em>9186T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 546 552 683 575; x_wconf 85' lang='eng' dir='ltr'><em>(AM087734)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 327 594 720 618">
+     <span class='ocr_line' id='line_1_17' title="bbox 327 594 720 618; baseline 0 -3"><span class='ocrx_word' id='word_1_59' title='bbox 327 596 343 615; x_wconf 92' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 350 595 445 615; x_wconf 84' lang='eng' dir='ltr'><em>anima/is</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 453 596 503 615; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 512 594 575 615; x_wconf 73' lang='eng' dir='ltr'><em>9843T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 583 595 720 618; x_wconf 89' lang='eng' dir='ltr'><em>(AM087679)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 328 637 731 661">
+     <span class='ocr_line' id='line_1_18' title="bbox 328 637 731 661; baseline 0 -3"><span class='ocrx_word' id='word_1_64' title='bbox 328 639 343 658; x_wconf 90' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 351 639 441 658; x_wconf 81' lang='eng' dir='ltr'><em>murinus</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 450 639 499 658; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 510 637 586 658; x_wconf 81' lang='eng' dir='ltr'><em>14189T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 594 638 731 661; x_wconf 91' lang='eng' dir='ltr'><em>(AMO87760)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 260 680 802 833">
+     <span class='ocr_line' id='line_1_19' title="bbox 377 680 802 706; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 377 682 393 701; x_wconf 92' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 400 681 512 706; x_wconf 80' lang='eng' dir='ltr'><em>acidipiscis</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 521 682 571 701; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 581 680 657 701; x_wconf 88' lang='eng' dir='ltr'><em>19820T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 665 681 802 704; x_wconf 85' lang='eng' dir='ltr'><em>(AM087762)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 394 723 787 749; baseline 0 -5"><span class='ocrx_word' id='word_1_74' title='bbox 394 725 409 744; x_wconf 96' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 417 724 497 749; x_wconf 71' lang='eng' dir='ltr'><em>a/gidus</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 505 725 555 744; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 566 723 642 744; x_wconf 83' lang='eng' dir='ltr'><em>19872T</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 650 724 787 747; x_wconf 84' lang='eng' dir='ltr'><em>(AM263504)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 394 766 796 790; baseline 0 -4"><span class='ocrx_word' id='word_1_79' title='bbox 394 768 409 787; x_wconf 96' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 417 767 520 787; x_wconf 82' lang='eng' dir='ltr'><em>salivarius</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 529 767 579 787; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 587 766 651 787; x_wconf 88' lang='eng' dir='ltr'><em>9477T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 659 767 796 790; x_wconf 89' lang='eng' dir='ltr'><em>(AM087721)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 260 809 715 833; baseline 0.002 -4"><span class='ocrx_word' id='word_1_84' title='bbox 260 819 359 821; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_85' title='bbox 368 811 383 830; x_wconf 96' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 391 810 440 830; x_wconf 86' lang='eng' dir='ltr'><em>mali</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 448 810 497 830; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 506 809 570 830; x_wconf 56' lang='eng' dir='ltr'>6899T</span> <span class='ocrx_word' id='word_1_89' title='bbox 577 810 715 833; x_wconf 87' lang='eng' dir='ltr'><em>(AM087746)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 363 852 750 878">
+     <span class='ocr_line' id='line_1_23' title="bbox 363 852 750 878; baseline 0 -6"><span class='ocrx_word' id='word_1_90' title='bbox 363 853 378 872; x_wconf 93' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 386 852 461 878; x_wconf 85' lang='eng' dir='ltr'><em>nage/ii</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 469 853 519 872; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 527 852 605 872; x_wconf 84' lang='eng' dir='ltr'><em>21593T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 613 853 750 876; x_wconf 90' lang='eng' dir='ltr'><em>(AMO87708)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 0 895 817 1005">
+     <span class='ocr_line' id='line_1_24' title="bbox 347 895 807 919; baseline 0 -3"><span class='ocrx_word' id='word_1_95' title='bbox 347 896 366 916; x_wconf 89' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 373 902 496 916; x_wconf 84' lang='eng' dir='ltr'><em>cacaonum</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 505 896 558 916; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 566 895 650 916; x_wconf 86' lang='eng' dir='ltr'><em>24285T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 658 896 807 919; x_wconf 87' lang='eng' dir='ltr'><strong>(AM922295)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 370 938 817 962; baseline -0.002 -3"><span class='ocrx_word' id='word_1_100' title='bbox 370 940 386 959; x_wconf 91' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 393 939 527 959; x_wconf 78' lang='eng' dir='ltr'><em>sarsumensis</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 536 939 586 959; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 594 938 672 959; x_wconf 74' lang='eng' dir='ltr'><em>22973T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 681 939 817 962; x_wconf 85' lang='eng' dir='ltr'><em>(AM087769)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 0 981 529 1005; baseline -0.002 -3"><span class='ocrx_word' id='word_1_105' title='bbox 0 991 105 994; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_106' title='bbox 111 982 126 1002; x_wconf 95' lang='eng' dir='ltr'><em>L.</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 134 981 255 1002; x_wconf 85' lang='eng' dir='ltr'><em>de/brueckii</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 262 982 312 1002; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 320 981 384 1002; x_wconf 75' lang='eng' dir='ltr'><em>6412T</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 392 982 529 1005; x_wconf 87' lang='eng' dir='ltr'><em>(AM087689)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 0 384 389 953">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 0 384 389 953">
+     <span class='ocr_line' id='line_1_27' title="bbox 0 384 277 414; baseline 0 591"><span class='ocrx_word' id='word_1_111' title='bbox 0 384 277 414; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 0 414 368 544; baseline 0 -86"><span class='ocrx_word' id='word_1_112' title='bbox 0 414 368 544; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 167 544 324 630; baseline 0 0"><span class='ocrx_word' id='word_1_113' title='bbox 167 544 324 630; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 167 630 328 673; baseline 0 332"><span class='ocrx_word' id='word_1_114' title='bbox 167 630 328 673; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 186 673 389 797; baseline 0 0"><span class='ocrx_word' id='word_1_115' title='bbox 186 673 389 797; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 196 797 368 891; baseline 0.035 -52"><span class='ocrx_word' id='word_1_116' title='bbox 196 797 368 891; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 231 891 366 953; baseline 0 0"><span class='ocrx_word' id='word_1_117' title='bbox 231 891 366 953; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 258 861 356 864">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 258 861 356 864">
+     <span class='ocr_line' id='line_1_34' title="bbox 258 861 356 864; baseline 0 141"><span class='ocrx_word' id='word_1_118' title='bbox 258 861 356 864; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 258 775 260 904">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 258 775 260 904">
+     <span class='ocr_line' id='line_1_35' title="bbox 258 775 260 904; baseline 0 101"><span class='ocrx_word' id='word_1_119' title='bbox 258 775 260 904; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 0 3 6 991">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 0 3 6 991">
+     <span class='ocr_line' id='line_1_36' title="bbox 0 3 6 991; baseline 0 14"><span class='ocrx_word' id='word_1_120' title='bbox 0 3 6 991; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001180-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001180-0-000.pbm.png
new file mode 100644
index 00000000..72bba0c1
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001180-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001180-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001180-0-000.pbm.png.hocr
new file mode 100644
index 00000000..4b0fe5c4
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001180-0-000.pbm.png.hocr
@@ -0,0 +1,320 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001180-0-000.pbm.png"; bbox 0 0 1656 2059; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 54 20 572 21">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 54 20 572 21">
+     <span class='ocr_line' id='line_1_1' title="bbox 54 20 572 21; baseline 0 2038"><span class='ocrx_word' id='word_1_1' title='bbox 54 20 572 21; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 80 56 81">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 80 56 81">
+     <span class='ocr_line' id='line_1_2' title="bbox 0 80 56 81; baseline 0 1978"><span class='ocrx_word' id='word_1_2' title='bbox 0 80 56 81; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 0 80 2 1348">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 0 80 2 1348">
+     <span class='ocr_line' id='line_1_3' title="bbox 0 80 2 1348; baseline 0 711"><span class='ocrx_word' id='word_1_3' title='bbox 0 80 2 1348; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 4 92 50 112">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 4 92 50 112">
+     <span class='ocr_line' id='line_1_4' title="bbox 4 92 50 112; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 4 92 50 112; x_wconf 86' lang='eng'>82.5</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 21 664 53 684">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 21 664 53 684">
+     <span class='ocr_line' id='line_1_5' title="bbox 21 664 53 684; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 21 664 53 684; x_wconf 87' lang='eng'><em>73.</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 54 20 56 138">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 54 20 56 138">
+     <span class='ocr_line' id='line_1_6' title="bbox 54 20 56 138; baseline 0 1921"><span class='ocrx_word' id='word_1_6' title='bbox 54 20 56 138; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 581 0 1389 38">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 581 0 1389 38">
+     <span class='ocr_line' id='line_1_7' title="bbox 581 0 1389 38; baseline 0 -7"><span class='ocrx_word' id='word_1_7' title='bbox 581 6 851 31; x_wconf 82' lang='eng' dir='ltr'><em>Pseudoalteromonas</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 861 6 1029 38; x_wconf 77' lang='eng' dir='ltr'><em>haloplanklis</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 1047 8 1136 31; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_10' title='bbox 1150 0 1248 31; x_wconf 84' lang='eng' dir='ltr'><em>14393T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1259 7 1389 38; x_wconf 85' lang='eng' dir='ltr'>(X67024)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 54 136 663 138">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 54 136 663 138">
+     <span class='ocr_line' id='line_1_8' title="bbox 54 136 663 138; baseline 0 1921"><span class='ocrx_word' id='word_1_12' title='bbox 54 136 663 138; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 60 664 65 683">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 60 664 65 683">
+     <span class='ocr_line' id='line_1_9' title="bbox 60 664 65 683; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 60 664 65 683; x_wconf 96' lang='eng' dir='ltr'>l</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 28 696 73 697">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 28 696 73 697">
+     <span class='ocr_line' id='line_1_10' title="bbox 28 696 73 697; baseline 0 -14"><span class='ocrx_word' id='word_1_14' title='bbox 28 696 73 697; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 0 1346 30 1348">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 0 1346 30 1348">
+     <span class='ocr_line' id='line_1_11' title="bbox 0 1346 30 1348; baseline 0 711"><span class='ocrx_word' id='word_1_15' title='bbox 0 1346 30 1348; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 28 696 30 1999">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 28 696 30 1999">
+     <span class='ocr_line' id='line_1_12' title="bbox 28 696 30 1999; baseline 0 60"><span class='ocrx_word' id='word_1_16' title='bbox 28 696 30 1999; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 71 311 73 1082">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 71 311 73 1082">
+     <span class='ocr_line' id='line_1_13' title="bbox 71 311 73 1082; baseline 0 977"><span class='ocrx_word' id='word_1_17' title='bbox 71 311 73 1082; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 261 324 299 344">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 261 324 299 344">
+     <span class='ocr_line' id='line_1_14' title="bbox 261 324 299 344; baseline 0 0"><span class='ocrx_word' id='word_1_18' title='bbox 261 324 299 344; x_wconf 91' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 311 253 313 372">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 311 253 313 372">
+     <span class='ocr_line' id='line_1_15' title="bbox 311 253 313 372; baseline 0 1687"><span class='ocrx_word' id='word_1_19' title='bbox 311 253 313 372; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 325 616 435 618">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 325 616 435 618">
+     <span class='ocr_line' id='line_1_16' title="bbox 325 616 435 618; baseline 0 1441"><span class='ocrx_word' id='word_1_20' title='bbox 325 616 435 618; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 380 624 428 644">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 380 624 428 644">
+     <span class='ocr_line' id='line_1_17' title="bbox 380 624 428 644; baseline 0 0"><span class='ocrx_word' id='word_1_21' title='bbox 380 624 428 644; x_wconf 85' lang='eng'>95.4</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 434 487 435 749">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 434 487 435 749">
+     <span class='ocr_line' id='line_1_18' title="bbox 434 487 435 749; baseline 0 1310"><span class='ocrx_word' id='word_1_22' title='bbox 434 487 435 749; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 439 602 441 894">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 439 602 441 894">
+     <span class='ocr_line' id='line_1_19' title="bbox 439 602 441 894; baseline 0 1165"><span class='ocrx_word' id='word_1_23' title='bbox 439 602 441 894; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 439 892 500 894">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 439 892 500 894">
+     <span class='ocr_line' id='line_1_20' title="bbox 439 892 500 894; baseline 0 1165"><span class='ocrx_word' id='word_1_24' title='bbox 439 892 500 894; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 447 898 495 918">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 447 898 495 918">
+     <span class='ocr_line' id='line_1_21' title="bbox 447 898 495 918; baseline 0 0"><span class='ocrx_word' id='word_1_25' title='bbox 447 898 495 918; x_wconf 87' lang='eng'>86.4</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 499 776 501 1011">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 499 776 501 1011">
+     <span class='ocr_line' id='line_1_22' title="bbox 499 776 501 1011; baseline 0 1048"><span class='ocrx_word' id='word_1_26' title='bbox 499 776 501 1011; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 71 1081 327 1082">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 71 1081 327 1082">
+     <span class='ocr_line' id='line_1_23' title="bbox 71 1081 327 1082; baseline 0 977"><span class='ocrx_word' id='word_1_27' title='bbox 71 1081 327 1082; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 270 1088 308 1108">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 270 1088 308 1108">
+     <span class='ocr_line' id='line_1_24' title="bbox 270 1088 308 1108; baseline 0 0"><span class='ocrx_word' id='word_1_28' title='bbox 270 1088 308 1108; x_wconf 93' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 416 1418 418 1534">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 416 1418 418 1534">
+     <span class='ocr_line' id='line_1_25' title="bbox 416 1418 418 1534; baseline 0 525"><span class='ocrx_word' id='word_1_29' title='bbox 416 1418 418 1534; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 325 616 327 1550">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 325 616 327 1550">
+     <span class='ocr_line' id='line_1_26' title="bbox 325 616 327 1550; baseline 0 509"><span class='ocrx_word' id='word_1_30' title='bbox 325 616 327 1550; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 444 1753 483 1773">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 444 1753 483 1773">
+     <span class='ocr_line' id='line_1_27' title="bbox 444 1753 483 1773; baseline 0 0"><span class='ocrx_word' id='word_1_31' title='bbox 444 1753 483 1773; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 496 1649 498 1825">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 496 1649 498 1825">
+     <span class='ocr_line' id='line_1_28' title="bbox 496 1649 498 1825; baseline 0 234"><span class='ocrx_word' id='word_1_32' title='bbox 496 1649 498 1825; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 323 1179 584 1743">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 323 1179 584 1743">
+     <span class='ocr_line' id='line_1_29' title="bbox 323 1179 584 1614; baseline 0 0"><span class='ocrx_word' id='word_1_33' title='bbox 323 1179 584 1614; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 323 1614 500 1743; baseline 0 0"><span class='ocrx_word' id='word_1_34' title='bbox 323 1614 500 1743; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 682 113 1375 151">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 682 113 1375 151">
+     <span class='ocr_line' id='line_1_31' title="bbox 682 113 1375 151; baseline 0 -7"><span class='ocrx_word' id='word_1_35' title='bbox 682 119 881 151; x_wconf 80' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 891 121 1031 144; x_wconf 78' lang='eng' dir='ltr'><em>antarctica</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1050 121 1121 144; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1135 113 1233 144; x_wconf 87' lang='eng' dir='ltr'><em>10704T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1244 120 1375 150; x_wconf 85' lang='eng' dir='ltr'>(Y14697)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 594 238 1354 276">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 594 238 1354 276">
+     <span class='ocr_line' id='line_1_32' title="bbox 594 238 1354 276; baseline 0 -7"><span class='ocrx_word' id='word_1_40' title='bbox 594 244 726 269; x_wconf 83' lang='eng' dir='ltr'><em>Colwellia</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 731 244 959 276; x_wconf 80' lang='eng' dir='ltr'><em>psychrerythraea</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 977 245 1066 269; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1076 238 1178 269; x_wconf 81' lang='eng' dir='ltr'><em>27364T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1187 245 1354 275; x_wconf 85' lang='eng' dir='ltr'>(AF001375)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 608 351 1311 388">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 608 351 1311 388">
+     <span class='ocr_line' id='line_1_33' title="bbox 608 351 1311 388; baseline -0.001 -6"><span class='ocrx_word' id='word_1_45' title='bbox 608 357 818 382; x_wconf 80' lang='eng' dir='ltr'><em>Thalassamonas</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 827 357 938 382; x_wconf 81' lang='eng' dir='ltr'><em>viridans</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 957 358 1029 382; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 1044 351 1141 382; x_wconf 88' lang='eng' dir='ltr'><em>13754T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1150 358 1311 388; x_wconf 87' lang='eng' dir='ltr'>(AJ294748)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 599 474 1620 512">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 599 474 1620 512">
+     <span class='ocr_line' id='line_1_34' title="bbox 599 474 1620 512; baseline 0 -7"><span class='ocrx_word' id='word_1_50' title='bbox 599 481 835 505; x_wconf 82' lang='eng' dir='ltr'><em>Pseudidiomarina</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 844 481 981 505; x_wconf 83' lang='eng' dir='ltr'><em>salinarum</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 994 481 1156 511; x_wconf 82' lang='eng' dir='ltr'><em>[Idiomarina</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1165 481 1313 511; x_wconf 82' lang='eng' dir='ltr'><em>salinarum]</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 1334 474 1446 505; x_wconf 87' lang='eng' dir='ltr'><em>ISL-52T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 1457 481 1620 512; x_wconf 87' lang='eng' dir='ltr'>(EF486355)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 632 585 1656 623">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 632 585 1656 623">
+     <span class='ocr_line' id='line_1_35' title="bbox 632 585 1656 623; baseline 0 -7"><span class='ocrx_word' id='word_1_56' title='bbox 632 592 868 616; x_wconf 81' lang='eng' dir='ltr'><em>Pseudidiomarina</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 878 592 1013 616; x_wconf 81' lang='eng' dir='ltr'><em>homiensis</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1025 592 1188 623; x_wconf 78' lang='eng' dir='ltr'><em>[Idiomarina</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 1197 592 1342 623; x_wconf 85' lang='eng' dir='ltr'><em>homiensis]</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 1355 585 1473 616; x_wconf 82' lang='eng' dir='ltr'><em>PO-M2T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1484 592 1656 623; x_wconf 88' lang='eng' dir='ltr'>(DQ342238)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 780 707 1445 743">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 780 707 1445 743">
+     <span class='ocr_line' id='line_1_36' title="bbox 780 707 1445 743; baseline -0.002 -5"><span class='ocrx_word' id='word_1_62' title='bbox 780 713 1015 738; x_wconf 81' lang='eng' dir='ltr'><em>Pseudidiomarina</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 1024 714 1171 738; x_wconf 81' lang='eng' dir='ltr'><em>sediminum</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1190 707 1273 738; x_wconf 73' lang='eng' dir='ltr'><em>(3121T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 1282 714 1445 743; x_wconf 84' lang='eng' dir='ltr'>(EF212001)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 511 789 557 809">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 511 789 557 809">
+     <span class='ocr_line' id='line_1_37' title="bbox 511 789 557 809; baseline 0 0"><span class='ocrx_word' id='word_1_66' title='bbox 511 789 557 809; x_wconf 86' lang='eng'>89.5</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 698 820 1405 971">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 698 820 1405 971">
+     <span class='ocr_line' id='line_1_38' title="bbox 714 820 1405 856; baseline -0.001 -5"><span class='ocrx_word' id='word_1_67' title='bbox 714 826 950 851; x_wconf 80' lang='eng' dir='ltr'><em>Pseudidiamarina</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 960 828 1120 851; x_wconf 79' lang='eng' dir='ltr'><em>taiwanensis</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1138 828 1188 850; x_wconf 89' lang='eng' dir='ltr'><em>PIT</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1193 827 1202 850; x_wconf 94' lang='eng'><strong>1</strong></span> <span class='ocrx_word' id='word_1_71' title='bbox 1207 820 1223 839; x_wconf 79' lang='eng' dir='ltr'><strong>T</strong></span> <span class='ocrx_word' id='word_1_72' title='bbox 1233 827 1306 856; x_wconf 91' lang='eng' dir='ltr'>(DQl</span> <span class='ocrx_word' id='word_1_73' title='bbox 1314 827 1405 856; x_wconf 85' lang='eng'>18948)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 698 935 1404 971; baseline 0 -5"><span class='ocrx_word' id='word_1_74' title='bbox 698 942 939 966; x_wconf 84' lang='eng' dir='ltr'><strong><em>Pseudidiomarina</em></strong></span> <span class='ocrx_word' id='word_1_75' title='bbox 948 942 1110 966; x_wconf 82' lang='eng' dir='ltr'><em>tainanensis</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1128 935 1222 966; x_wconf 87' lang='eng' dir='ltr'><em>PINlT</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1233 942 1404 971; x_wconf 87' lang='eng' dir='ltr'>(EU423907)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 555 1018 1359 1085">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 555 1018 1359 1085">
+     <span class='ocr_line' id='line_1_40' title="bbox 555 1018 594 1038; baseline 0 0"><span class='ocrx_word' id='word_1_78' title='bbox 555 1018 594 1038; x_wconf 91' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 705 1049 1359 1085; baseline 0 -5"><span class='ocrx_word' id='word_1_79' title='bbox 705 1056 946 1080; x_wconf 82' lang='eng' dir='ltr'><em>Pseudidiomarina</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 956 1056 1057 1080; x_wconf 85' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 1076 1049 1178 1080; x_wconf 88' lang='eng' dir='ltr'><em>PIMlT</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 1189 1056 1359 1085; x_wconf 86' lang='eng' dir='ltr'>(EU423908)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 570 1171 1307 1436">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 570 1171 1307 1436">
+     <span class='ocr_line' id='line_1_42' title="bbox 570 1171 1307 1209; baseline 0 -7"><span class='ocrx_word' id='word_1_83' title='bbox 570 1178 919 1209; x_wconf 74' lang='eng' dir='ltr'><em>Idiomarinaﬁmtislapidosi</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 938 1179 1012 1202; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_85' title='bbox 1022 1171 1123 1202; x_wconf 86' lang='eng' dir='ltr'><em>22169T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1134 1178 1307 1209; x_wconf 88' lang='eng' dir='ltr'>(AY526861)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 591 1284 1149 1322; baseline 0 -7"><span class='ocrx_word' id='word_1_87' title='bbox 591 1291 745 1315; x_wconf 80' lang='eng' dir='ltr'><em>ldiomarina</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 755 1291 848 1315; x_wconf 82' lang='eng' dir='ltr'><em>baltica</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 867 1284 978 1315; x_wconf 83' lang='eng' dir='ltr'><em>OSl45T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 988 1291 1149 1322; x_wconf 88' lang='eng' dir='ltr'>(AJ440214)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 587 1399 1208 1436; baseline -0.002 -6"><span class='ocrx_word' id='word_1_91' title='bbox 587 1405 741 1430; x_wconf 80' lang='eng' dir='ltr'><em>Idiomarina</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 749 1405 851 1430; x_wconf 83' lang='eng' dir='ltr'><em>zobellii</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 869 1406 953 1429; x_wconf 94' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_94' title='bbox 963 1399 1030 1430; x_wconf 86' lang='eng' dir='ltr'><em>231T</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 1041 1405 1208 1436; x_wconf 87' lang='eng' dir='ltr'>(AF052741)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 596 1512 1257 1549">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 596 1512 1257 1549">
+     <span class='ocr_line' id='line_1_45' title="bbox 596 1512 1257 1549; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 596 1518 750 1543; x_wconf 80' lang='eng' dir='ltr'><em>Idiomarina</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 759 1520 912 1543; x_wconf 79' lang='eng' dir='ltr'><em>seasinensis</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 931 1512 1074 1543; x_wconf 82' lang='eng' dir='ltr'><em>CL-SP19T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1084 1519 1257 1549; x_wconf 86' lang='eng' dir='ltr'>(AY635468)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 498 1632 1203 1669">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 498 1632 1203 1669">
+     <span class='ocr_line' id='line_1_46' title="bbox 498 1632 1203 1669; baseline -0.001 -6"><span class='ocrx_word' id='word_1_100' title='bbox 498 1649 546 1651; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_101' title='bbox 558 1638 712 1663; x_wconf 80' lang='eng' dir='ltr'><em>Idiomarina</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 722 1638 846 1669; x_wconf 80' lang='eng' dir='ltr'><em>abyssalis</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 865 1639 948 1662; x_wconf 89' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_104' title='bbox 959 1632 1026 1663; x_wconf 87' lang='eng' dir='ltr'><em>227T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1037 1638 1203 1669; x_wconf 89' lang='eng' dir='ltr'>(AF052740)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 536 1749 1303 1786">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 536 1749 1303 1786">
+     <span class='ocr_line' id='line_1_47' title="bbox 536 1749 1303 1786; baseline 0 -7"><span class='ocrx_word' id='word_1_106' title='bbox 536 1765 592 1767; x_wconf 90' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_107' title='bbox 603 1755 757 1779; x_wconf 79' lang='eng' dir='ltr'><em>Idiomarina</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 766 1755 915 1779; x_wconf 78' lang='eng' dir='ltr'><em>ramblicola</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 934 1756 1007 1779; x_wconf 89' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_110' title='bbox 1018 1749 1120 1779; x_wconf 90' lang='eng' dir='ltr'><em>22170T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 1130 1755 1303 1786; x_wconf 85' lang='eng' dir='ltr'>(AY526862)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 534 1765 536 1884">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 534 1765 536 1884">
+     <span class='ocr_line' id='line_1_48' title="bbox 534 1765 536 1884; baseline 0 175"><span class='ocrx_word' id='word_1_112' title='bbox 534 1765 536 1884; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 472 1823 533 1860">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 472 1840 520 1860">
+     <span class='ocr_line' id='line_1_49' title="bbox 472 1840 520 1860; baseline 0 0"><span class='ocrx_word' id='word_1_113' title='bbox 472 1840 520 1860; x_wconf 88' lang='eng'>99.4</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 536 1861 1177 1898">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 536 1861 1177 1898">
+     <span class='ocr_line' id='line_1_50' title="bbox 536 1861 1177 1898; baseline 0 -6"><span class='ocrx_word' id='word_1_114' title='bbox 536 1883 569 1884; x_wconf 37' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 579 1867 733 1892; x_wconf 81' lang='eng' dir='ltr'><em>Idiomarina</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 743 1867 872 1892; x_wconf 81' lang='eng' dir='ltr'><em>loihiensz&#39;s</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 891 1861 1000 1892; x_wconf 79' lang='eng' dir='ltr'><em>LZ-TRT</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 1010 1868 1063 1898; x_wconf 88' lang='eng' dir='ltr'><em>(AF</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 1065 1868 1177 1898; x_wconf 87' lang='eng'>288370)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 28 1997 646 1999">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 28 1997 646 1999">
+     <span class='ocr_line' id='line_1_51' title="bbox 28 1997 646 1999; baseline 0 60"><span class='ocrx_word' id='word_1_120' title='bbox 28 1997 646 1999; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 28 2057 131 2059">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 28 2057 131 2059">
+     <span class='ocr_line' id='line_1_52' title="bbox 28 2057 131 2059; baseline 0 0"><span class='ocrx_word' id='word_1_121' title='bbox 28 2057 131 2059; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 54 2026 100 2046">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 54 2026 100 2046">
+     <span class='ocr_line' id='line_1_53' title="bbox 54 2026 100 2046; baseline -0.022 0"><span class='ocrx_word' id='word_1_122' title='bbox 54 2026 100 2046; x_wconf 90' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 660 1976 1409 2014">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 660 1976 1409 2014">
+     <span class='ocr_line' id='line_1_54' title="bbox 660 1976 1409 2014; baseline -0.001 -6"><span class='ocrx_word' id='word_1_123' title='bbox 660 1984 845 2008; x_wconf 83' lang='eng' dir='ltr'><em>Oceanimonas</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 855 1983 1008 2014; x_wconf 72' lang='eng' dir='ltr'><em>doudoroﬂii</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 1026 1984 1116 2008; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_126' title='bbox 1126 1976 1228 2008; x_wconf 81' lang='eng' dir='ltr'><em>27123T</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 1239 1983 1409 2014; x_wconf 89' lang='eng' dir='ltr'>(AB019390)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-000.pbm.png
new file mode 100644
index 00000000..4f6eb45e
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-000.pbm.png.hocr
new file mode 100644
index 00000000..c68ae690
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-000.pbm.png.hocr
@@ -0,0 +1,196 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001230-0-000.pbm.png"; bbox 0 0 1894 1744; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 412 780 438 801">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 412 780 438 801">
+     <span class='ocr_line' id='line_1_1' title="bbox 412 780 438 801; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 412 780 438 801; x_wconf 88' lang='eng'>91</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 556 198 601 219">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 556 198 601 219">
+     <span class='ocr_line' id='line_1_2' title="bbox 556 198 601 219; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 556 198 601 219; x_wconf 92' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 543 791 569 812">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 543 791 569 812">
+     <span class='ocr_line' id='line_1_3' title="bbox 543 791 569 812; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 543 791 569 812; x_wconf 87' lang='eng'>81</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 980 8 1538 38">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 980 8 1538 38">
+     <span class='ocr_line' id='line_1_4' title="bbox 980 8 1538 38; baseline 0 -6"><span class='ocrx_word' id='word_1_4' title='bbox 980 11 1004 32; x_wconf 70' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_5' title='bbox 1017 11 1199 32; x_wconf 81' lang='eng' dir='ltr'>radioresistens</span> <span class='ocrx_word' id='word_1_6' title='bbox 1217 11 1281 32; x_wconf 91' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_7' title='bbox 1293 8 1368 32; x_wconf 81' lang='eng' dir='ltr'>3588T</span> <span class='ocrx_word' id='word_1_8' title='bbox 1382 11 1538 38; x_wconf 90' lang='eng' dir='ltr'>(EU477112)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 766 43 1143 70">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 766 43 1143 70">
+     <span class='ocr_line' id='line_1_5' title="bbox 766 43 1143 70; baseline 0 -6"><span class='ocrx_word' id='word_1_9' title='bbox 766 43 791 64; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_10' title='bbox 802 43 878 70; x_wconf 84' lang='eng' dir='ltr'><em>baylyi</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 892 43 964 64; x_wconf 90' lang='eng' dir='ltr'>ADP1</span> <span class='ocrx_word' id='word_1_12' title='bbox 987 43 1143 70; x_wconf 90' lang='eng' dir='ltr'>(EU477155)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 703 524 748 545">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 703 524 748 545">
+     <span class='ocr_line' id='line_1_6' title="bbox 703 524 748 545; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 703 524 748 545; x_wconf 93' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 754 714 798 735">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 754 714 798 735">
+     <span class='ocr_line' id='line_1_7' title="bbox 754 714 798 735; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 754 714 798 735; x_wconf 92' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 796 890 841 912">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 796 890 841 912">
+     <span class='ocr_line' id='line_1_8' title="bbox 796 890 841 912; baseline 0 0"><span class='ocrx_word' id='word_1_15' title='bbox 796 890 841 912; x_wconf 92' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 775 1344 820 1365">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 775 1344 820 1365">
+     <span class='ocr_line' id='line_1_9' title="bbox 775 1344 820 1365; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 775 1344 820 1365; x_wconf 91' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 657 1652 705 1674">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 657 1652 705 1674">
+     <span class='ocr_line' id='line_1_10' title="bbox 657 1652 705 1674; baseline 0.021 -1"><span class='ocrx_word' id='word_1_17' title='bbox 657 1652 705 1674; x_wconf 88' lang='eng'>2%</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 832 74 1888 1740">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 832 74 1888 1740">
+     <span class='ocr_line' id='line_1_11' title="bbox 850 74 1305 104; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 850 77 875 98; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_19' title='bbox 888 77 981 104; x_wconf 86' lang='eng' dir='ltr'>ursingii</span> <span class='ocrx_word' id='word_1_20' title='bbox 998 77 1064 98; x_wconf 89' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_21' title='bbox 1078 74 1135 98; x_wconf 89' lang='eng' dir='ltr'>137T</span> <span class='ocrx_word' id='word_1_22' title='bbox 1149 77 1305 104; x_wconf 91' lang='eng' dir='ltr'>(EU477105)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 1019 105 1489 135; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 1019 108 1044 129; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_24' title='bbox 1057 108 1151 129; x_wconf 85' lang='eng' dir='ltr'>towneri</span> <span class='ocrx_word' id='word_1_25' title='bbox 1168 108 1232 129; x_wconf 87' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_26' title='bbox 1243 105 1319 129; x_wconf 91' lang='eng' dir='ltr'>7201T</span> <span class='ocrx_word' id='word_1_27' title='bbox 1332 108 1489 135; x_wconf 86' lang='eng' dir='ltr'>(EU477154)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 880 138 1342 167; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 880 140 904 161; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 917 140 1004 161; x_wconf 81' lang='eng' dir='ltr'>tandoii</span> <span class='ocrx_word' id='word_1_30' title='bbox 1020 140 1084 161; x_wconf 91' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_31' title='bbox 1095 138 1171 161; x_wconf 79' lang='eng' dir='ltr'>7199T</span> <span class='ocrx_word' id='word_1_32' title='bbox 1185 140 1342 167; x_wconf 89' lang='eng' dir='ltr'>(EU477152)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 1058 169 1525 199; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 1058 172 1083 193; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1095 172 1188 199; x_wconf 88' lang='eng' dir='ltr'>gerneri</span> <span class='ocrx_word' id='word_1_35' title='bbox 1204 172 1267 193; x_wconf 88' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_36' title='bbox 1278 169 1354 193; x_wconf 90' lang='eng' dir='ltr'>7197T</span> <span class='ocrx_word' id='word_1_37' title='bbox 1368 172 1525 199; x_wconf 92' lang='eng' dir='ltr'>(EU477151)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 1004 203 1760 230; baseline 0 -6"><span class='ocrx_word' id='word_1_38' title='bbox 1004 203 1120 224; x_wconf 84' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_39' title='bbox 1130 209 1165 230; x_wconf 71' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_40' title='bbox 1179 203 1208 224; x_wconf 93' lang='eng'>10</span> <span class='ocrx_word' id='word_1_41' title='bbox 1227 203 1287 224; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_42' title='bbox 1300 203 1361 224; x_wconf 87' lang='eng'>1003</span> <span class='ocrx_word' id='word_1_43' title='bbox 1373 203 1397 230; x_wconf 89' lang='eng'>(=</span> <span class='ocrx_word' id='word_1_44' title='bbox 1406 203 1484 224; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_45' title='bbox 1497 203 1584 230; x_wconf 87' lang='eng'>17924)</span> <span class='ocrx_word' id='word_1_46' title='bbox 1604 203 1760 230; x_wconf 91' lang='eng' dir='ltr'>(EU477116)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 948 235 1688 262; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 948 235 1064 256; x_wconf 85' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_48' title='bbox 1074 241 1110 262; x_wconf 86' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_49' title='bbox 1124 235 1148 256; x_wconf 97' lang='eng'>11</span> <span class='ocrx_word' id='word_1_50' title='bbox 1172 235 1231 256; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_51' title='bbox 1243 235 1290 256; x_wconf 86' lang='eng'>988</span> <span class='ocrx_word' id='word_1_52' title='bbox 1301 236 1325 262; x_wconf 93' lang='eng'>(=</span> <span class='ocrx_word' id='word_1_53' title='bbox 1334 235 1413 256; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_54' title='bbox 1426 235 1513 262; x_wconf 87' lang='eng'>11171)</span> <span class='ocrx_word' id='word_1_55' title='bbox 1533 235 1688 262; x_wconf 91' lang='eng' dir='ltr'>(EU477117)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 909 268 1477 295; baseline 0 -6"><span class='ocrx_word' id='word_1_56' title='bbox 909 268 1025 289; x_wconf 83' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_57' title='bbox 1035 274 1071 295; x_wconf 81' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_58' title='bbox 1085 268 1151 289; x_wconf 90' lang='eng' dir='ltr'>15TU</span> <span class='ocrx_word' id='word_1_59' title='bbox 1172 268 1226 289; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_60' title='bbox 1240 268 1301 289; x_wconf 88' lang='eng'>1090</span> <span class='ocrx_word' id='word_1_61' title='bbox 1321 268 1477 295; x_wconf 84' lang='eng' dir='ltr'>(EU477119)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 1039 297 1488 327; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 1039 300 1064 321; x_wconf 89' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_63' title='bbox 1076 300 1150 322; x_wconf 82' lang='eng' dir='ltr'>lwoffii</span> <span class='ocrx_word' id='word_1_64' title='bbox 1166 300 1230 321; x_wconf 91' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_65' title='bbox 1241 297 1317 321; x_wconf 91' lang='eng' dir='ltr'>5581T</span> <span class='ocrx_word' id='word_1_66' title='bbox 1331 300 1488 327; x_wconf 87' lang='eng' dir='ltr'>(EU477111)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 1004 332 1481 361; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 1004 335 1029 356; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_68' title='bbox 1042 335 1143 356; x_wconf 86' lang='eng' dir='ltr'>bouvetii</span> <span class='ocrx_word' id='word_1_69' title='bbox 1159 335 1224 356; x_wconf 90' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_70' title='bbox 1235 332 1311 356; x_wconf 81' lang='eng' dir='ltr'>7196T</span> <span class='ocrx_word' id='word_1_71' title='bbox 1325 335 1481 361; x_wconf 89' lang='eng' dir='ltr'>(EU477150)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 950 361 1453 391; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 950 364 975 385; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_73' title='bbox 988 364 1113 385; x_wconf 82' lang='eng' dir='ltr'>schind/eri</span> <span class='ocrx_word' id='word_1_74' title='bbox 1130 364 1195 385; x_wconf 91' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_75' title='bbox 1209 361 1283 385; x_wconf 90' lang='eng' dir='ltr'>1034T</span> <span class='ocrx_word' id='word_1_76' title='bbox 1296 364 1453 391; x_wconf 89' lang='eng' dir='ltr'>(EU477128)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 980 395 1407 425; baseline 0 -7"><span class='ocrx_word' id='word_1_77' title='bbox 980 397 1004 418; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_78' title='bbox 1012 397 1070 425; x_wconf 88' lang='eng' dir='ltr'>junii</span> <span class='ocrx_word' id='word_1_79' title='bbox 1086 397 1150 418; x_wconf 91' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_80' title='bbox 1161 395 1237 418; x_wconf 80' lang='eng' dir='ltr'>2376T</span> <span class='ocrx_word' id='word_1_81' title='bbox 1251 397 1407 424; x_wconf 91' lang='eng' dir='ltr'>(EU477110)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 1044 431 1784 458; baseline 0 -6"><span class='ocrx_word' id='word_1_82' title='bbox 1044 431 1160 452; x_wconf 89' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_83' title='bbox 1171 437 1207 458; x_wconf 69' lang='eng' dir='ltr'>sp,</span> <span class='ocrx_word' id='word_1_84' title='bbox 1218 431 1232 452; x_wconf 90' lang='eng'>6</span> <span class='ocrx_word' id='word_1_85' title='bbox 1252 431 1311 452; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_86' title='bbox 1324 431 1385 452; x_wconf 90' lang='eng'>1026</span> <span class='ocrx_word' id='word_1_87' title='bbox 1397 431 1421 458; x_wconf 95' lang='eng'>(=</span> <span class='ocrx_word' id='word_1_88' title='bbox 1431 431 1509 452; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_89' title='bbox 1522 431 1609 458; x_wconf 84' lang='eng'>17979)</span> <span class='ocrx_word' id='word_1_90' title='bbox 1628 431 1784 458; x_wconf 89' lang='eng' dir='ltr'>(EU477115)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 941 459 1488 489; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 941 462 965 483; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_92' title='bbox 978 462 1148 489; x_wconf 80' lang='eng' dir='ltr'>haemolyticus</span> <span class='ocrx_word' id='word_1_93' title='bbox 1166 462 1231 483; x_wconf 90' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_94' title='bbox 1242 459 1318 483; x_wconf 83' lang='eng' dir='ltr'>2358T</span> <span class='ocrx_word' id='word_1_95' title='bbox 1331 462 1488 489; x_wconf 86' lang='eng' dir='ltr'>(EU477109)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 936 491 1738 521; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 936 491 981 512; x_wconf 89' lang='eng'>100</span> <span class='ocrx_word' id='word_1_97' title='bbox 1156 494 1181 515; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_98' title='bbox 1194 494 1369 515; x_wconf 84' lang='eng' dir='ltr'>ca/coaceticus</span> <span class='ocrx_word' id='word_1_99' title='bbox 1386 494 1464 515; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_100' title='bbox 1475 491 1567 515; x_wconf 83' lang='eng' dir='ltr'>23055T</span> <span class='ocrx_word' id='word_1_101' title='bbox 1581 494 1738 521; x_wconf 88' lang='eng' dir='ltr'>(EU477149)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 1108 526 1839 553; baseline 0 -6"><span class='ocrx_word' id='word_1_102' title='bbox 1108 526 1225 547; x_wconf 84' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_103' title='bbox 1235 532 1270 553; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_104' title='bbox 1283 526 1400 547; x_wconf 79' lang='eng' dir='ltr'>‘Between</span> <span class='ocrx_word' id='word_1_105' title='bbox 1413 526 1421 547; x_wconf 96' lang='eng'>1</span> <span class='ocrx_word' id='word_1_106' title='bbox 1436 526 1482 547; x_wconf 87' lang='eng' dir='ltr'>and</span> <span class='ocrx_word' id='word_1_107' title='bbox 1494 526 1514 547; x_wconf 89' lang='eng'>3’</span> <span class='ocrx_word' id='word_1_108' title='bbox 1534 526 1588 547; x_wconf 94' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_109' title='bbox 1602 526 1664 547; x_wconf 86' lang='eng'>1469</span> <span class='ocrx_word' id='word_1_110' title='bbox 1683 526 1839 553; x_wconf 92' lang='eng' dir='ltr'>(EU477122)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 1143 557 1883 584; baseline 0 -6"><span class='ocrx_word' id='word_1_111' title='bbox 1143 557 1259 578; x_wconf 89' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_112' title='bbox 1269 563 1305 584; x_wconf 73' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_113' title='bbox 1317 557 1331 578; x_wconf 86' lang='eng'>3</span> <span class='ocrx_word' id='word_1_114' title='bbox 1350 557 1410 578; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_115' title='bbox 1423 557 1485 578; x_wconf 86' lang='eng'>1035</span> <span class='ocrx_word' id='word_1_116' title='bbox 1496 557 1520 584; x_wconf 91' lang='eng'>(=</span> <span class='ocrx_word' id='word_1_117' title='bbox 1529 557 1608 578; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_118' title='bbox 1620 557 1708 584; x_wconf 89' lang='eng'>19004)</span> <span class='ocrx_word' id='word_1_119' title='bbox 1727 557 1883 584; x_wconf 89' lang='eng' dir='ltr'>(EU477114)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 832 587 1656 617; baseline 0 -6"><span class='ocrx_word' id='word_1_120' title='bbox 832 594 862 615; x_wconf 84' lang='eng'>97</span> <span class='ocrx_word' id='word_1_121' title='bbox 1115 590 1140 611; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_122' title='bbox 1152 590 1289 612; x_wconf 87' lang='eng' dir='ltr'>baumannii</span> <span class='ocrx_word' id='word_1_123' title='bbox 1304 590 1382 611; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_124' title='bbox 1395 587 1486 611; x_wconf 81' lang='eng' dir='ltr'>19606T</span> <span class='ocrx_word' id='word_1_125' title='bbox 1500 590 1656 617; x_wconf 88' lang='eng' dir='ltr'>(EU477108)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 1124 622 1822 649; baseline 0 -6"><span class='ocrx_word' id='word_1_126' title='bbox 1124 622 1241 643; x_wconf 85' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_127' title='bbox 1251 628 1286 649; x_wconf 88' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_128' title='bbox 1299 622 1378 643; x_wconf 79' lang='eng' dir='ltr'>‘Close</span> <span class='ocrx_word' id='word_1_129' title='bbox 1387 623 1411 643; x_wconf 90' lang='eng' dir='ltr'>to</span> <span class='ocrx_word' id='word_1_130' title='bbox 1423 622 1497 643; x_wconf 78' lang='eng' dir='ltr'>13TU’</span> <span class='ocrx_word' id='word_1_131' title='bbox 1518 622 1572 643; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_132' title='bbox 1586 622 1646 643; x_wconf 90' lang='eng'>1472</span> <span class='ocrx_word' id='word_1_133' title='bbox 1666 622 1822 649; x_wconf 88' lang='eng' dir='ltr'>(EU477126)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 870 654 1888 681; baseline 0 -6"><span class='ocrx_word' id='word_1_134' title='bbox 870 654 901 675; x_wconf 87' lang='eng'>80</span> <span class='ocrx_word' id='word_1_135' title='bbox 1116 654 1233 675; x_wconf 85' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_136' title='bbox 1243 660 1278 681; x_wconf 84' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_137' title='bbox 1292 654 1358 675; x_wconf 89' lang='eng' dir='ltr'>13TU</span> <span class='ocrx_word' id='word_1_138' title='bbox 1371 654 1431 675; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_139' title='bbox 1443 654 1489 675; x_wconf 87' lang='eng'>993</span> <span class='ocrx_word' id='word_1_140' title='bbox 1501 654 1525 681; x_wconf 93' lang='eng'>(=</span> <span class='ocrx_word' id='word_1_141' title='bbox 1534 654 1612 675; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_142' title='bbox 1625 654 1712 681; x_wconf 86' lang='eng'>17903)</span> <span class='ocrx_word' id='word_1_143' title='bbox 1733 654 1888 681; x_wconf 90' lang='eng' dir='ltr'>(EU477118)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 843 683 1374 713; baseline 0 -6"><span class='ocrx_word' id='word_1_144' title='bbox 843 686 868 707; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_145' title='bbox 881 686 1034 713; x_wconf 85' lang='eng' dir='ltr'>tjernbergiae</span> <span class='ocrx_word' id='word_1_146' title='bbox 1053 686 1117 707; x_wconf 90' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_147' title='bbox 1128 683 1204 707; x_wconf 90' lang='eng' dir='ltr'>7200T</span> <span class='ocrx_word' id='word_1_148' title='bbox 1218 686 1374 713; x_wconf 90' lang='eng' dir='ltr'>(EU477153)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 891 718 1457 745; baseline 0 -6"><span class='ocrx_word' id='word_1_149' title='bbox 891 718 1007 739; x_wconf 90' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_150' title='bbox 1017 724 1053 745; x_wconf 86' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_151' title='bbox 1067 718 1095 739; x_wconf 87' lang='eng'>16</span> <span class='ocrx_word' id='word_1_152' title='bbox 1113 718 1192 739; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_153' title='bbox 1204 718 1282 739; x_wconf 87' lang='eng'>17988</span> <span class='ocrx_word' id='word_1_154' title='bbox 1301 718 1457 745; x_wconf 88' lang='eng' dir='ltr'>(EU477135)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 891 750 1454 777; baseline 0 -6"><span class='ocrx_word' id='word_1_155' title='bbox 891 750 1007 771; x_wconf 90' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_156' title='bbox 1017 756 1053 777; x_wconf 85' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_157' title='bbox 1067 750 1129 771; x_wconf 80' lang='eng' dir='ltr'>1SBJ</span> <span class='ocrx_word' id='word_1_158' title='bbox 1149 750 1203 771; x_wconf 95' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_159' title='bbox 1217 750 1279 771; x_wconf 85' lang='eng'>1729</span> <span class='ocrx_word' id='word_1_160' title='bbox 1298 750 1454 777; x_wconf 86' lang='eng' dir='ltr'>(EU477133)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 955 782 1506 809; baseline 0 -6"><span class='ocrx_word' id='word_1_161' title='bbox 955 782 984 803; x_wconf 69' lang='eng' dir='ltr'>‘A,</span> <span class='ocrx_word' id='word_1_162' title='bbox 998 782 1143 803; x_wconf 82' lang='eng' dir='ltr'>venetianus‘</span> <span class='ocrx_word' id='word_1_163' title='bbox 1161 782 1239 803; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_164' title='bbox 1251 782 1330 803; x_wconf 89' lang='eng'>31012</span> <span class='ocrx_word' id='word_1_165' title='bbox 1350 782 1506 809; x_wconf 88' lang='eng' dir='ltr'>(EU477136)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 870 814 1398 841; baseline 0 -6"><span class='ocrx_word' id='word_1_166' title='bbox 870 814 986 835; x_wconf 90' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_167' title='bbox 996 820 1032 841; x_wconf 86' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_168' title='bbox 1046 814 1074 835; x_wconf 95' lang='eng'>17</span> <span class='ocrx_word' id='word_1_169' title='bbox 1094 814 1148 835; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_170' title='bbox 1162 814 1223 835; x_wconf 87' lang='eng'>1736</span> <span class='ocrx_word' id='word_1_171' title='bbox 1243 814 1398 841; x_wconf 86' lang='eng' dir='ltr'>(EU477134)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 978 845 1466 872; baseline 0 -6"><span class='ocrx_word' id='word_1_172' title='bbox 978 845 1143 872; x_wconf 83' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_173' title='bbox 1159 845 1215 866; x_wconf 95' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_174' title='bbox 1229 845 1291 866; x_wconf 92' lang='eng'>1737</span> <span class='ocrx_word' id='word_1_175' title='bbox 1310 845 1466 872; x_wconf 91' lang='eng' dir='ltr'>(EU477121)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 978 877 1466 905; baseline 0 -7"><span class='ocrx_word' id='word_1_176' title='bbox 978 877 1143 905; x_wconf 85' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_177' title='bbox 1159 877 1215 898; x_wconf 95' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_178' title='bbox 1227 877 1291 898; x_wconf 87' lang='eng'>5809</span> <span class='ocrx_word' id='word_1_179' title='bbox 1310 877 1466 905; x_wconf 90' lang='eng' dir='ltr'>(EU477131)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 978 907 1483 937; baseline 0 -6"><span class='ocrx_word' id='word_1_180' title='bbox 978 910 1143 937; x_wconf 89' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_181' title='bbox 1160 910 1225 931; x_wconf 97' lang='eng' dir='ltr'><strong>NIPH</strong></span> <span class='ocrx_word' id='word_1_182' title='bbox 1236 907 1313 931; x_wconf 88' lang='eng' dir='ltr'>2150T</span> <span class='ocrx_word' id='word_1_183' title='bbox 1326 910 1483 937; x_wconf 88' lang='eng' dir='ltr'>(EU477148)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 978 942 1466 969; baseline 0 -6"><span class='ocrx_word' id='word_1_184' title='bbox 978 942 1143 969; x_wconf 89' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_185' title='bbox 1159 942 1215 963; x_wconf 97' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_186' title='bbox 1229 942 1291 963; x_wconf 92' lang='eng'>1740</span> <span class='ocrx_word' id='word_1_187' title='bbox 1310 942 1466 969; x_wconf 90' lang='eng' dir='ltr'>(EU477127)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 978 976 1466 1003; baseline 0 -6"><span class='ocrx_word' id='word_1_188' title='bbox 978 976 1143 1003; x_wconf 88' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_189' title='bbox 1159 976 1215 997; x_wconf 97' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_190' title='bbox 1227 976 1287 997; x_wconf 88' lang='eng'>6541</span> <span class='ocrx_word' id='word_1_191' title='bbox 1310 976 1466 1003; x_wconf 90' lang='eng' dir='ltr'>(EU477144)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 978 1008 1459 1035; baseline 0 -6"><span class='ocrx_word' id='word_1_192' title='bbox 978 1008 1143 1035; x_wconf 88' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_193' title='bbox 1160 1008 1225 1029; x_wconf 93' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_194' title='bbox 1236 1008 1283 1029; x_wconf 88' lang='eng'>230</span> <span class='ocrx_word' id='word_1_195' title='bbox 1303 1008 1459 1035; x_wconf 90' lang='eng' dir='ltr'>(EU477106)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 978 1039 1466 1066; baseline 0 -6"><span class='ocrx_word' id='word_1_196' title='bbox 978 1039 1143 1066; x_wconf 87' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_197' title='bbox 1159 1039 1215 1060; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_198' title='bbox 1229 1039 1287 1060; x_wconf 93' lang='eng'>1741</span> <span class='ocrx_word' id='word_1_199' title='bbox 1310 1039 1466 1066; x_wconf 89' lang='eng' dir='ltr'>(EU477158)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 978 1072 1470 1099; baseline 0 -6"><span class='ocrx_word' id='word_1_200' title='bbox 978 1072 1143 1099; x_wconf 87' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_201' title='bbox 1160 1072 1219 1093; x_wconf 94' lang='eng' dir='ltr'>RUH</span> <span class='ocrx_word' id='word_1_202' title='bbox 1231 1072 1294 1093; x_wconf 90' lang='eng'>3064</span> <span class='ocrx_word' id='word_1_203' title='bbox 1313 1072 1470 1099; x_wconf 90' lang='eng' dir='ltr'>(EU477145)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 962 1103 1476 1130; baseline 0 -6"><span class='ocrx_word' id='word_1_204' title='bbox 962 1103 1143 1130; x_wconf 87' lang='eng' dir='ltr'>.gyllenbergii</span> <span class='ocrx_word' id='word_1_205' title='bbox 1160 1103 1225 1124; x_wconf 92' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_206' title='bbox 1236 1103 1300 1124; x_wconf 91' lang='eng'>2353</span> <span class='ocrx_word' id='word_1_207' title='bbox 1319 1103 1476 1130; x_wconf 89' lang='eng' dir='ltr'>(EU477156)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 887 1129 1337 1159; baseline 0 -6"><span class='ocrx_word' id='word_1_208' title='bbox 887 1132 912 1153; x_wconf 96' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_209' title='bbox 923 1137 1012 1159; x_wconf 85' lang='eng' dir='ltr'><em>parvus</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 1031 1132 1096 1153; x_wconf 87' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_211' title='bbox 1108 1129 1168 1153; x_wconf 82' lang='eng' dir='ltr'>384T</span> <span class='ocrx_word' id='word_1_212' title='bbox 1181 1132 1337 1159; x_wconf 93' lang='eng' dir='ltr'>(EU477107)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 988 1162 1551 1189; baseline 0 -6"><span class='ocrx_word' id='word_1_213' title='bbox 988 1162 1105 1183; x_wconf 84' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_214' title='bbox 1115 1168 1150 1189; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_215' title='bbox 1164 1162 1226 1183; x_wconf 89' lang='eng' dir='ltr'>14BJ</span> <span class='ocrx_word' id='word_1_216' title='bbox 1247 1162 1301 1183; x_wconf 95' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_217' title='bbox 1314 1162 1376 1183; x_wconf 87' lang='eng'>1726</span> <span class='ocrx_word' id='word_1_218' title='bbox 1395 1162 1551 1189; x_wconf 91' lang='eng' dir='ltr'>(EU477147)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 920 1197 1601 1225; baseline 0 -6"><span class='ocrx_word' id='word_1_219' title='bbox 920 1197 1037 1219; x_wconf 86' lang='eng' dir='ltr'>Genomic</span> <span class='ocrx_word' id='word_1_220' title='bbox 1047 1204 1083 1225; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_221' title='bbox 1097 1197 1238 1219; x_wconf 88' lang='eng' dir='ltr'>13BJ/14TU</span> <span class='ocrx_word' id='word_1_222' title='bbox 1257 1197 1335 1219; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_223' title='bbox 1348 1197 1426 1219; x_wconf 85' lang='eng'>17905</span> <span class='ocrx_word' id='word_1_224' title='bbox 1446 1197 1601 1225; x_wconf 85' lang='eng' dir='ltr'>(EU477132)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 1115 1227 1587 1257; baseline 0 -6"><span class='ocrx_word' id='word_1_225' title='bbox 1115 1230 1140 1251; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_226' title='bbox 1148 1230 1269 1257; x_wconf 80' lang='eng' dir='ltr'>johnsoni/</span> <span class='ocrx_word' id='word_1_227' title='bbox 1286 1230 1346 1251; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_228' title='bbox 1357 1227 1417 1251; x_wconf 80' lang='eng' dir='ltr'>999T</span> <span class='ocrx_word' id='word_1_229' title='bbox 1430 1230 1587 1257; x_wconf 91' lang='eng' dir='ltr'>(EU477113)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 989 1263 1470 1290; baseline 0 -6"><span class='ocrx_word' id='word_1_230' title='bbox 989 1263 1143 1290; x_wconf 88' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_231' title='bbox 1160 1263 1219 1284; x_wconf 92' lang='eng' dir='ltr'>RUH</span> <span class='ocrx_word' id='word_1_232' title='bbox 1230 1263 1294 1284; x_wconf 91' lang='eng'>2762</span> <span class='ocrx_word' id='word_1_233' title='bbox 1313 1263 1470 1290; x_wconf 86' lang='eng' dir='ltr'>(EU477139)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 989 1292 1467 1322; baseline 0 -6"><span class='ocrx_word' id='word_1_234' title='bbox 989 1295 1143 1322; x_wconf 87' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_235' title='bbox 1160 1295 1225 1316; x_wconf 95' lang='eng' dir='ltr'><strong>NIPH</strong></span> <span class='ocrx_word' id='word_1_236' title='bbox 1237 1292 1296 1316; x_wconf 88' lang='eng' dir='ltr'>838T</span> <span class='ocrx_word' id='word_1_237' title='bbox 1310 1295 1467 1322; x_wconf 90' lang='eng' dir='ltr'>(EU477124)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 973 1327 1466 1354; baseline 0 -6"><span class='ocrx_word' id='word_1_238' title='bbox 973 1344 978 1348; x_wconf 99' lang='eng'>.</span> <span class='ocrx_word' id='word_1_239' title='bbox 989 1327 1143 1354; x_wconf 91' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_240' title='bbox 1159 1327 1215 1348; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_241' title='bbox 1227 1327 1291 1348; x_wconf 84' lang='eng'>9424</span> <span class='ocrx_word' id='word_1_242' title='bbox 1310 1327 1466 1354; x_wconf 90' lang='eng' dir='ltr'>(EU477157)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 989 1359 1466 1386; baseline 0 -6"><span class='ocrx_word' id='word_1_243' title='bbox 989 1359 1143 1386; x_wconf 87' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_244' title='bbox 1159 1359 1215 1380; x_wconf 96' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_245' title='bbox 1227 1359 1291 1380; x_wconf 89' lang='eng'>5692</span> <span class='ocrx_word' id='word_1_246' title='bbox 1310 1359 1466 1386; x_wconf 90' lang='eng' dir='ltr'>(EU477146)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 989 1392 1466 1419; baseline 0 -6"><span class='ocrx_word' id='word_1_247' title='bbox 989 1392 1143 1419; x_wconf 87' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_248' title='bbox 1159 1392 1215 1413; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_249' title='bbox 1226 1392 1287 1413; x_wconf 93' lang='eng'>4561</span> <span class='ocrx_word' id='word_1_250' title='bbox 1310 1392 1466 1419; x_wconf 91' lang='eng' dir='ltr'>(EU477120)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 973 1423 1470 1450; baseline 0 -6"><span class='ocrx_word' id='word_1_251' title='bbox 973 1440 978 1444; x_wconf 96' lang='eng'>.</span> <span class='ocrx_word' id='word_1_252' title='bbox 989 1423 1143 1450; x_wconf 86' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_253' title='bbox 1160 1423 1219 1444; x_wconf 93' lang='eng' dir='ltr'>RUH</span> <span class='ocrx_word' id='word_1_254' title='bbox 1230 1423 1294 1444; x_wconf 87' lang='eng'>2879</span> <span class='ocrx_word' id='word_1_255' title='bbox 1313 1423 1470 1450; x_wconf 82' lang='eng' dir='ltr'>(EU477140)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 973 1456 1466 1483; baseline 0 -6"><span class='ocrx_word' id='word_1_256' title='bbox 973 1473 978 1477; x_wconf 99' lang='eng'>.</span> <span class='ocrx_word' id='word_1_257' title='bbox 989 1456 1143 1483; x_wconf 90' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_258' title='bbox 1159 1456 1215 1477; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_259' title='bbox 1226 1456 1291 1477; x_wconf 86' lang='eng'>4738</span> <span class='ocrx_word' id='word_1_260' title='bbox 1310 1456 1466 1483; x_wconf 87' lang='eng' dir='ltr'>(EU477123)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 973 1487 1466 1514; baseline 0 -6"><span class='ocrx_word' id='word_1_261' title='bbox 973 1504 978 1508; x_wconf 99' lang='eng'>.</span> <span class='ocrx_word' id='word_1_262' title='bbox 989 1487 1143 1514; x_wconf 86' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_263' title='bbox 1159 1487 1215 1508; x_wconf 96' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_264' title='bbox 1226 1487 1287 1508; x_wconf 90' lang='eng'>4771</span> <span class='ocrx_word' id='word_1_265' title='bbox 1310 1487 1466 1514; x_wconf 90' lang='eng' dir='ltr'>(EU477125)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 973 1522 1466 1549; baseline 0 -6"><span class='ocrx_word' id='word_1_266' title='bbox 973 1539 978 1543; x_wconf 99' lang='eng'>.</span> <span class='ocrx_word' id='word_1_267' title='bbox 989 1522 1143 1549; x_wconf 88' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_268' title='bbox 1159 1522 1215 1543; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_269' title='bbox 1227 1522 1291 1543; x_wconf 89' lang='eng'>3340</span> <span class='ocrx_word' id='word_1_270' title='bbox 1310 1522 1466 1549; x_wconf 86' lang='eng' dir='ltr'>(EU477129)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 973 1552 1466 1579; baseline 0 -6"><span class='ocrx_word' id='word_1_271' title='bbox 973 1569 978 1573; x_wconf 99' lang='eng'>.</span> <span class='ocrx_word' id='word_1_272' title='bbox 989 1552 1143 1579; x_wconf 88' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_273' title='bbox 1159 1552 1215 1573; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_274' title='bbox 1227 1552 1291 1573; x_wconf 87' lang='eng'>6214</span> <span class='ocrx_word' id='word_1_275' title='bbox 1310 1552 1466 1579; x_wconf 89' lang='eng' dir='ltr'>(EU477130)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 989 1585 1470 1612; baseline 0 -6"><span class='ocrx_word' id='word_1_276' title='bbox 989 1585 1143 1612; x_wconf 82' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_277' title='bbox 1160 1585 1219 1606; x_wconf 93' lang='eng' dir='ltr'>RUH</span> <span class='ocrx_word' id='word_1_278' title='bbox 1230 1585 1291 1606; x_wconf 89' lang='eng'>2371</span> <span class='ocrx_word' id='word_1_279' title='bbox 1313 1585 1470 1612; x_wconf 84' lang='eng' dir='ltr'>(EU477137)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 989 1617 1470 1644; baseline 0 -6"><span class='ocrx_word' id='word_1_280' title='bbox 989 1617 1143 1644; x_wconf 87' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_281' title='bbox 1160 1617 1219 1638; x_wconf 95' lang='eng' dir='ltr'>RUH</span> <span class='ocrx_word' id='word_1_282' title='bbox 1230 1617 1294 1638; x_wconf 89' lang='eng'>2560</span> <span class='ocrx_word' id='word_1_283' title='bbox 1313 1617 1470 1644; x_wconf 89' lang='eng' dir='ltr'>(EU477138)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 989 1648 1466 1675; baseline 0 -6"><span class='ocrx_word' id='word_1_284' title='bbox 989 1648 1143 1675; x_wconf 81' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_285' title='bbox 1159 1648 1215 1669; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_286' title='bbox 1227 1648 1291 1669; x_wconf 90' lang='eng'>3146</span> <span class='ocrx_word' id='word_1_287' title='bbox 1310 1648 1466 1675; x_wconf 91' lang='eng' dir='ltr'>(EU477141)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 989 1681 1466 1708; baseline 0 -6"><span class='ocrx_word' id='word_1_288' title='bbox 989 1681 1143 1708; x_wconf 82' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_289' title='bbox 1159 1681 1215 1702; x_wconf 96' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_290' title='bbox 1227 1681 1291 1702; x_wconf 93' lang='eng'>7834</span> <span class='ocrx_word' id='word_1_291' title='bbox 1310 1681 1466 1708; x_wconf 93' lang='eng' dir='ltr'>(EU477142)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 973 1712 1466 1740; baseline 0 -7"><span class='ocrx_word' id='word_1_292' title='bbox 973 1729 978 1733; x_wconf 96' lang='eng'>.</span> <span class='ocrx_word' id='word_1_293' title='bbox 989 1712 1143 1740; x_wconf 82' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_294' title='bbox 1159 1712 1215 1733; x_wconf 95' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_295' title='bbox 1227 1712 1291 1733; x_wconf 88' lang='eng'>8896</span> <span class='ocrx_word' id='word_1_296' title='bbox 1310 1712 1466 1739; x_wconf 93' lang='eng' dir='ltr'>(EU477142)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 939 845 966 1124">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 939 845 966 1124">
+     <span class='ocr_line' id='line_1_63' title="bbox 939 845 966 1124; textangle 90"><span class='ocrx_word' id='word_1_297' title='bbox 939 845 966 1124; x_wconf 66' lang='eng'><em>&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 951 1263 978 1733">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 951 1263 978 1733">
+     <span class='ocr_line' id='line_1_64' title="bbox 951 1263 978 1733; textangle 90"><span class='ocrx_word' id='word_1_298' title='bbox 951 1263 978 1733; x_wconf 66' lang='eng'>&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;&gt;</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-001.pbm.png
new file mode 100644
index 00000000..8b44d3d9
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-001.pbm.png.hocr
new file mode 100644
index 00000000..3509f569
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001230-0-001.pbm.png.hocr
@@ -0,0 +1,322 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001230-0-001.pbm.png"; bbox 0 0 1834 1247; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 115 15 188 25">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 115 15 188 25">
+     <span class='ocr_line' id='line_1_1' title="bbox 115 15 188 25; baseline 0 1222"><span class='ocrx_word' id='word_1_1' title='bbox 115 15 188 25; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 610 7 1035 34">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 610 7 1035 34">
+     <span class='ocr_line' id='line_1_2' title="bbox 610 7 1035 34; baseline 0 -6"><span class='ocrx_word' id='word_1_2' title='bbox 610 7 635 28; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_3' title='bbox 648 7 740 28; x_wconf 84' lang='eng' dir='ltr'>towneri</span> <span class='ocrx_word' id='word_1_4' title='bbox 755 8 792 28; x_wconf 91' lang='eng' dir='ltr'>AB</span> <span class='ocrx_word' id='word_1_5' title='bbox 805 8 877 28; x_wconf 76' lang='eng' dir='ltr'>1110T</span> <span class='ocrx_word' id='word_1_6' title='bbox 887 8 1035 34; x_wconf 83' lang='eng' dir='ltr'>(AF509823)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 63 40 1541 133">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 63 40 1541 133">
+     <span class='ocr_line' id='line_1_3' title="bbox 466 40 1541 67; baseline 0.003 -6"><span class='ocrx_word' id='word_1_7' title='bbox 466 40 760 67; x_wconf 80' lang='eng' dir='ltr'>Acinetobactergenomic</span> <span class='ocrx_word' id='word_1_8' title='bbox 769 46 804 67; x_wconf 88' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_9' title='bbox 818 41 884 61; x_wconf 91' lang='eng' dir='ltr'>15TU</span> <span class='ocrx_word' id='word_1_10' title='bbox 904 41 964 61; x_wconf 86' lang='eng' dir='ltr'>151a</span> <span class='ocrx_word' id='word_1_11' title='bbox 984 41 1097 67; x_wconf 84' lang='eng'>(293448)</span> <span class='ocrx_word' id='word_1_12' title='bbox 1504 43 1541 65; x_wconf 89' lang='eng'>1%</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 239 73 914 118; baseline 0 -24"><span class='ocrx_word' id='word_1_13' title='bbox 239 76 457 118; x_wconf 42' lang='eng' dir='ltr'><strong>if</strong></span> <span class='ocrx_word' id='word_1_14' title='bbox 466 73 490 94; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_15' title='bbox 503 73 681 94; x_wconf 80' lang='eng' dir='ltr'>radioresistens</span> <span class='ocrx_word' id='word_1_16' title='bbox 701 73 788 94; x_wconf 81' lang='eng' dir='ltr'>17694T</span> <span class='ocrx_word' id='word_1_17' title='bbox 801 73 914 100; x_wconf 87' lang='eng'>(293445)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 63 104 866 133; baseline 0.004 -9"><span class='ocrx_word' id='word_1_18' title='bbox 63 104 108 124; x_wconf 92' lang='eng'>100</span> <span class='ocrx_word' id='word_1_19' title='bbox 414 106 440 127; x_wconf 74' lang='eng' dir='ltr'><em>‘A.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 453 106 600 127; x_wconf 82' lang='eng' dir='ltr'>venetianus’</span> <span class='ocrx_word' id='word_1_21' title='bbox 616 106 696 127; x_wconf 92' lang='eng' dir='ltr'>RAG-1</span> <span class='ocrx_word' id='word_1_22' title='bbox 720 106 866 133; x_wconf 86' lang='eng' dir='ltr'>(AJ295007)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 284 149 376 151">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 284 149 376 151">
+     <span class='ocr_line' id='line_1_6' title="bbox 284 149 376 151; baseline 0 1096"><span class='ocrx_word' id='word_1_23' title='bbox 284 149 376 151; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 237 101 239 179">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 237 101 239 179">
+     <span class='ocr_line' id='line_1_7' title="bbox 237 101 239 179; baseline 0 1068"><span class='ocrx_word' id='word_1_24' title='bbox 237 101 239 179; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 284 144 1296 726">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 284 144 1021 237">
+     <span class='ocr_line' id='line_1_8' title="bbox 385 144 784 171; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 385 144 410 165; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 418 144 474 171; x_wconf 81' lang='eng' dir='ltr'>jun/i</span> <span class='ocrx_word' id='word_1_27' title='bbox 490 144 549 165; x_wconf 89' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_28' title='bbox 560 144 618 165; x_wconf 87' lang='eng' dir='ltr'>998T</span> <span class='ocrx_word' id='word_1_29' title='bbox 630 144 784 171; x_wconf 91' lang='eng' dir='ltr'>(AM410704)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 284 178 1021 204; baseline 0 -5"><span class='ocrx_word' id='word_1_30' title='bbox 284 182 636 184; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_31' title='bbox 645 178 669 199; x_wconf 89' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_32' title='bbox 682 178 770 204; x_wconf 84' lang='eng' dir='ltr'>gerneri</span> <span class='ocrx_word' id='word_1_33' title='bbox 788 178 864 199; x_wconf 85' lang='eng' dir='ltr'>9A01T</span> <span class='ocrx_word' id='word_1_34' title='bbox 873 178 1021 204; x_wconf 84' lang='eng' dir='ltr'>(AF509829)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 284 206 901 237; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 284 206 398 231; x_wconf 53' lang='eng' dir='ltr'>ﬂ—</span> <span class='ocrx_word' id='word_1_36' title='bbox 407 211 432 231; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_37' title='bbox 444 211 577 232; x_wconf 76' lang='eng' dir='ltr'>baumannii</span> <span class='ocrx_word' id='word_1_38' title='bbox 593 211 669 231; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_39' title='bbox 681 211 770 231; x_wconf 78' lang='eng' dir='ltr'>19606T</span> <span class='ocrx_word' id='word_1_40' title='bbox 788 211 901 237; x_wconf 88' lang='eng'>(293435)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 303 244 1210 346">
+     <span class='ocr_line' id='line_1_11' title="bbox 352 244 1108 270; baseline -0.001 -5"><span class='ocrx_word' id='word_1_41' title='bbox 352 247 367 249; x_wconf 70' lang='eng'><strong><em>‘</em></strong></span> <span class='ocrx_word' id='word_1_42' title='bbox 376 244 669 270; x_wconf 82' lang='eng' dir='ltr'>Acinetobactergenomic</span> <span class='ocrx_word' id='word_1_43' title='bbox 678 250 713 270; x_wconf 68' lang='eng' dir='ltr'>5p.</span> <span class='ocrx_word' id='word_1_44' title='bbox 727 244 793 264; x_wconf 95' lang='eng' dir='ltr'>13TU</span> <span class='ocrx_word' id='word_1_45' title='bbox 811 244 887 264; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_46' title='bbox 900 244 975 264; x_wconf 89' lang='eng'>17903</span> <span class='ocrx_word' id='word_1_47' title='bbox 994 244 1108 270; x_wconf 84' lang='eng'>(293446)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 303 276 995 303; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 303 278 550 280; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_49' title='bbox 559 276 584 297; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_50' title='bbox 597 276 687 303; x_wconf 88' lang='eng' dir='ltr'>ursingii</span> <span class='ocrx_word' id='word_1_51' title='bbox 704 276 769 297; x_wconf 95' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_52' title='bbox 781 276 838 297; x_wconf 88' lang='eng' dir='ltr'>137T</span> <span class='ocrx_word' id='word_1_53' title='bbox 850 276 995 303; x_wconf 85' lang='eng' dir='ltr'>(AJ275038)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 303 305 1210 346; baseline 0 -15"><span class='ocrx_word' id='word_1_54' title='bbox 303 305 694 346; x_wconf 42' lang='eng' dir='ltr'>JEAcmetobacter</span> <span class='ocrx_word' id='word_1_55' title='bbox 701 310 809 336; x_wconf 83' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_56' title='bbox 818 316 853 336; x_wconf 80' lang='eng' dir='ltr'>5p.</span> <span class='ocrx_word' id='word_1_57' title='bbox 866 310 895 331; x_wconf 93' lang='eng'>10</span> <span class='ocrx_word' id='word_1_58' title='bbox 913 310 988 331; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_59' title='bbox 1001 310 1077 331; x_wconf 91' lang='eng'>17924</span> <span class='ocrx_word' id='word_1_60' title='bbox 1096 310 1210 336; x_wconf 87' lang='eng'>(293443)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 498 340 1296 400">
+     <span class='ocr_line' id='line_1_14' title="bbox 498 340 1148 367; baseline 0 -6"><span class='ocrx_word' id='word_1_61' title='bbox 498 340 677 361; x_wconf 85' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_62' title='bbox 684 340 792 367; x_wconf 79' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_63' title='bbox 801 346 836 367; x_wconf 80' lang='eng' dir='ltr'>5p.</span> <span class='ocrx_word' id='word_1_64' title='bbox 850 340 873 361; x_wconf 95' lang='eng'>11</span> <span class='ocrx_word' id='word_1_65' title='bbox 897 340 957 361; x_wconf 85' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_66' title='bbox 968 340 1014 361; x_wconf 86' lang='eng'>590</span> <span class='ocrx_word' id='word_1_67' title='bbox 1033 340 1148 366; x_wconf 87' lang='eng' dir='ltr'>(X81659)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 845 373 1296 400; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 845 373 870 394; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_69' title='bbox 882 373 1031 400; x_wconf 83' lang='eng' dir='ltr'>tjernbergiae</span> <span class='ocrx_word' id='word_1_70' title='bbox 1050 373 1128 394; x_wconf 84' lang='eng' dir='ltr'>7N16T</span> <span class='ocrx_word' id='word_1_71' title='bbox 1147 373 1296 399; x_wconf 89' lang='eng' dir='ltr'>(AF509825)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 364 406 1069 478">
+     <span class='ocr_line' id='line_1_16' title="bbox 415 406 1069 432; baseline 0 -5"><span class='ocrx_word' id='word_1_72' title='bbox 415 406 711 427; x_wconf 93' lang='eng' dir='ltr'><em>—A.</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 724 406 808 427; x_wconf 79' lang='eng' dir='ltr'>tandoii</span> <span class='ocrx_word' id='word_1_74' title='bbox 824 406 902 427; x_wconf 80' lang='eng' dir='ltr'>4N13T</span> <span class='ocrx_word' id='word_1_75' title='bbox 921 406 1069 432; x_wconf 87' lang='eng' dir='ltr'>(AF509830)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 364 439 1045 478; baseline 0 -18"><span class='ocrx_word' id='word_1_76' title='bbox 364 439 676 478; x_wconf 57' lang='eng' dir='ltr'>_‘_—A.</span> <span class='ocrx_word' id='word_1_77' title='bbox 689 439 788 460; x_wconf 87' lang='eng' dir='ltr'>bouvetii</span> <span class='ocrx_word' id='word_1_78' title='bbox 804 439 882 460; x_wconf 80' lang='eng' dir='ltr'>4B02T</span> <span class='ocrx_word' id='word_1_79' title='bbox 897 439 1045 465; x_wconf 87' lang='eng' dir='ltr'>(AF509827)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 471 469 1101 498">
+     <span class='ocr_line' id='line_1_18' title="bbox 471 469 1101 498; baseline 0.003 -5"><span class='ocrx_word' id='word_1_80' title='bbox 471 472 495 493; x_wconf 67' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_81' title='bbox 504 472 622 498; x_wconf 87' lang='eng' dir='ltr'>johnsonii</span> <span class='ocrx_word' id='word_1_82' title='bbox 632 472 708 492; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_83' title='bbox 720 472 814 496; x_wconf 51' lang='eng'>179091</span> <span class='ocrx_word' id='word_1_84' title='bbox 828 472 885 493; x_wconf 86' lang='eng' dir='ltr'>RUH</span> <span class='ocrx_word' id='word_1_85' title='bbox 896 472 975 492; x_wconf 86' lang='eng' dir='ltr'>2231T:</span> <span class='ocrx_word' id='word_1_86' title='bbox 987 469 1101 495; x_wconf 83' lang='eng'>(293440)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 416 501 1198 562">
+     <span class='ocr_line' id='line_1_19' title="bbox 512 501 1198 531; baseline 0.001 -5"><span class='ocrx_word' id='word_1_87' title='bbox 512 505 537 525; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_88' title='bbox 549 505 716 531; x_wconf 83' lang='eng' dir='ltr'>haemolyticus</span> <span class='ocrx_word' id='word_1_89' title='bbox 727 505 804 525; x_wconf 86' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_90' title='bbox 816 505 910 529; x_wconf 82' lang='eng' dir='ltr'>17906T,</span> <span class='ocrx_word' id='word_1_91' title='bbox 923 505 980 525; x_wconf 89' lang='eng' dir='ltr'>RUH</span> <span class='ocrx_word' id='word_1_92' title='bbox 991 505 1071 525; x_wconf 50' lang='eng'>22157:</span> <span class='ocrx_word' id='word_1_93' title='bbox 1083 501 1198 527; x_wconf 86' lang='eng'>(293437)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 416 534 1124 562; baseline 0.001 -8"><span class='ocrx_word' id='word_1_94' title='bbox 416 534 460 554; x_wconf 92' lang='eng'>100</span> <span class='ocrx_word' id='word_1_95' title='bbox 479 535 505 555; x_wconf 96' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_96' title='bbox 517 535 668 562; x_wconf 89' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_97' title='bbox 685 535 749 556; x_wconf 90' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_98' title='bbox 761 535 818 555; x_wconf 84' lang='eng' dir='ltr'>838T</span> <span class='ocrx_word' id='word_1_99' title='bbox 830 535 979 561; x_wconf 86' lang='eng' dir='ltr'>(AJ626712)</span> <span class='ocrx_word' id='word_1_100' title='bbox 989 535 1039 555; x_wconf 78' lang='eng' dir='ltr'>this</span> <span class='ocrx_word' id='word_1_101' title='bbox 1049 535 1124 561; x_wconf 90' lang='eng' dir='ltr'>study</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 479 569 1126 595">
+     <span class='ocr_line' id='line_1_21' title="bbox 479 569 1126 595; baseline 0 -6"><span class='ocrx_word' id='word_1_102' title='bbox 479 569 505 589; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_103' title='bbox 517 569 668 595; x_wconf 82' lang='eng' dir='ltr'>beijerinckii</span> <span class='ocrx_word' id='word_1_104' title='bbox 685 569 739 589; x_wconf 97' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_105' title='bbox 751 569 813 589; x_wconf 89' lang='eng'>6214</span> <span class='ocrx_word' id='word_1_106' title='bbox 831 569 980 595; x_wconf 74' lang='eng' dir='ltr'>(M303013)</span> <span class='ocrx_word' id='word_1_107' title='bbox 991 569 1040 589; x_wconf 84' lang='eng' dir='ltr'>this</span> <span class='ocrx_word' id='word_1_108' title='bbox 1051 569 1126 595; x_wconf 88' lang='eng' dir='ltr'><strong>study</strong></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 426 601 1178 661">
+     <span class='ocr_line' id='line_1_22' title="bbox 426 601 1178 628; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 426 605 474 607; x_wconf 86' lang='eng'>—</span> <span class='ocrx_word' id='word_1_110' title='bbox 483 601 662 622; x_wconf 82' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_111' title='bbox 669 601 776 628; x_wconf 84' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_112' title='bbox 786 607 821 628; x_wconf 80' lang='eng' dir='ltr'>5p.</span> <span class='ocrx_word' id='word_1_113' title='bbox 835 601 863 622; x_wconf 83' lang='eng'>16</span> <span class='ocrx_word' id='word_1_114' title='bbox 880 601 957 622; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_115' title='bbox 969 601 1045 622; x_wconf 90' lang='eng'>17988</span> <span class='ocrx_word' id='word_1_116' title='bbox 1065 601 1178 628; x_wconf 89' lang='eng'>(293451)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 428 635 1077 661; baseline -0.002 -5"><span class='ocrx_word' id='word_1_117' title='bbox 428 639 474 641; x_wconf 86' lang='eng'>—</span> <span class='ocrx_word' id='word_1_118' title='bbox 483 635 662 656; x_wconf 83' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_119' title='bbox 669 635 776 661; x_wconf 84' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_120' title='bbox 786 641 821 661; x_wconf 86' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_121' title='bbox 835 635 895 655; x_wconf 83' lang='eng' dir='ltr'>1SBJ</span> <span class='ocrx_word' id='word_1_122' title='bbox 915 635 944 655; x_wconf 97' lang='eng'>79</span> <span class='ocrx_word' id='word_1_123' title='bbox 964 635 1077 661; x_wconf 83' lang='eng'>(293452)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 596 667 1088 726">
+     <span class='ocr_line' id='line_1_24' title="bbox 606 667 1088 693; baseline 0 -5"><span class='ocrx_word' id='word_1_124' title='bbox 606 667 630 688; x_wconf 89' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_125' title='bbox 643 667 764 688; x_wconf 84' lang='eng' dir='ltr'>schind/eri</span> <span class='ocrx_word' id='word_1_126' title='bbox 782 667 846 688; x_wconf 93' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_127' title='bbox 859 667 930 688; x_wconf 84' lang='eng' dir='ltr'>1034T</span> <span class='ocrx_word' id='word_1_128' title='bbox 943 667 1088 693; x_wconf 85' lang='eng' dir='ltr'>(AJ278311)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 596 700 1030 726; baseline 0 -5"><span class='ocrx_word' id='word_1_129' title='bbox 596 700 620 721; x_wconf 88' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_130' title='bbox 632 705 718 726; x_wconf 88' lang='eng' dir='ltr'>pan/us</span> <span class='ocrx_word' id='word_1_131' title='bbox 737 700 801 721; x_wconf 88' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_132' title='bbox 813 700 870 721; x_wconf 89' lang='eng' dir='ltr'>384T</span> <span class='ocrx_word' id='word_1_133' title='bbox 886 700 1030 726; x_wconf 86' lang='eng' dir='ltr'>(AJ293691)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 484 733 1155 790">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 484 733 1155 790">
+     <span class='ocr_line' id='line_1_26' title="bbox 579 733 1155 759; baseline 0 -5"><span class='ocrx_word' id='word_1_134' title='bbox 579 733 873 759; x_wconf 84' lang='eng' dir='ltr'>Acinetobactergenomic</span> <span class='ocrx_word' id='word_1_135' title='bbox 882 739 916 759; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_136' title='bbox 930 733 958 754; x_wconf 94' lang='eng'>17</span> <span class='ocrx_word' id='word_1_137' title='bbox 977 733 1022 754; x_wconf 87' lang='eng'>942</span> <span class='ocrx_word' id='word_1_138' title='bbox 1042 733 1155 759; x_wconf 88' lang='eng'>(293454)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 484 764 1142 790; baseline 0 -6"><span class='ocrx_word' id='word_1_139' title='bbox 484 764 509 784; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_140' title='bbox 521 764 683 790; x_wconf 88' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_141' title='bbox 700 764 755 784; x_wconf 97' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_142' title='bbox 767 764 827 784; x_wconf 85' lang='eng'>1737</span> <span class='ocrx_word' id='word_1_143' title='bbox 847 764 995 790; x_wconf 89' lang='eng' dir='ltr'>(AJ293692)</span> <span class='ocrx_word' id='word_1_144' title='bbox 1006 764 1056 784; x_wconf 84' lang='eng' dir='ltr'>this</span> <span class='ocrx_word' id='word_1_145' title='bbox 1066 764 1142 790; x_wconf 87' lang='eng' dir='ltr'>study</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 424 783 1386 922">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 424 783 1142 823">
+     <span class='ocr_line' id='line_1_28' title="bbox 424 783 1142 823; baseline 0 -6"><span class='ocrx_word' id='word_1_146' title='bbox 424 783 467 804; x_wconf 69' lang='eng'>100</span> <span class='ocrx_word' id='word_1_147' title='bbox 484 797 509 817; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_148' title='bbox 521 797 683 823; x_wconf 87' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_149' title='bbox 700 797 755 817; x_wconf 96' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_150' title='bbox 767 797 828 817; x_wconf 88' lang='eng'>1740</span> <span class='ocrx_word' id='word_1_151' title='bbox 847 797 995 823; x_wconf 88' lang='eng' dir='ltr'>(AJ293693)</span> <span class='ocrx_word' id='word_1_152' title='bbox 1006 797 1056 817; x_wconf 85' lang='eng' dir='ltr'>this</span> <span class='ocrx_word' id='word_1_153' title='bbox 1066 797 1142 823; x_wconf 83' lang='eng' dir='ltr'>study</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 484 829 1162 856">
+     <span class='ocr_line' id='line_1_29' title="bbox 484 829 1162 856; baseline 0 -6"><span class='ocrx_word' id='word_1_154' title='bbox 484 830 509 850; x_wconf 96' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_155' title='bbox 521 830 683 856; x_wconf 87' lang='eng' dir='ltr'>gyllenbergii</span> <span class='ocrx_word' id='word_1_156' title='bbox 701 830 764 850; x_wconf 94' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_157' title='bbox 776 829 850 850; x_wconf 91' lang='eng' dir='ltr'>2150T</span> <span class='ocrx_word' id='word_1_158' title='bbox 868 830 1017 856; x_wconf 88' lang='eng' dir='ltr'>(AJ293694)</span> <span class='ocrx_word' id='word_1_159' title='bbox 1027 830 1076 850; x_wconf 90' lang='eng' dir='ltr'>this</span> <span class='ocrx_word' id='word_1_160' title='bbox 1087 830 1162 856; x_wconf 87' lang='eng' dir='ltr'>study</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 579 862 1386 922">
+     <span class='ocr_line' id='line_1_30' title="bbox 584 862 1194 888; baseline -0.002 -5"><span class='ocrx_word' id='word_1_161' title='bbox 584 862 763 883; x_wconf 83' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_162' title='bbox 770 862 878 888; x_wconf 85' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_163' title='bbox 887 868 922 888; x_wconf 65' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_164' title='bbox 935 862 996 882; x_wconf 91' lang='eng' dir='ltr'>14BJ</span> <span class='ocrx_word' id='word_1_165' title='bbox 1015 862 1061 882; x_wconf 90' lang='eng'>382</span> <span class='ocrx_word' id='word_1_166' title='bbox 1081 862 1194 888; x_wconf 89' lang='eng'>(293453)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 579 895 1386 922; baseline -0.001 -5"><span class='ocrx_word' id='word_1_167' title='bbox 579 895 873 922; x_wconf 80' lang='eng' dir='ltr'>Acinetobactergenomic</span> <span class='ocrx_word' id='word_1_168' title='bbox 882 902 916 922; x_wconf 83' lang='eng' dir='ltr'>Sp.</span> <span class='ocrx_word' id='word_1_169' title='bbox 930 895 1069 917; x_wconf 77' lang='eng' dir='ltr'>1BBJ/14TU</span> <span class='ocrx_word' id='word_1_170' title='bbox 1088 895 1165 916; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_171' title='bbox 1177 895 1253 916; x_wconf 87' lang='eng'>17905</span> <span class='ocrx_word' id='word_1_172' title='bbox 1272 895 1386 922; x_wconf 84' lang='eng'>(293447)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 261 928 927 966">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 261 928 927 966">
+     <span class='ocr_line' id='line_1_32' title="bbox 261 928 927 966; baseline 0 -17"><span class='ocrx_word' id='word_1_173' title='bbox 261 930 501 966; x_wconf 57' lang='eng' dir='ltr'>_I:</span> <span class='ocrx_word' id='word_1_174' title='bbox 510 928 535 949; x_wconf 90' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_175' title='bbox 547 928 619 949; x_wconf 77' lang='eng' dir='ltr'>lwoffii</span> <span class='ocrx_word' id='word_1_176' title='bbox 635 928 711 949; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_177' title='bbox 723 928 799 949; x_wconf 83' lang='eng'>17925</span> <span class='ocrx_word' id='word_1_178' title='bbox 814 928 927 954; x_wconf 86' lang='eng' dir='ltr'>(Z93441)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 48 959 1822 1184">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 459 959 1197 985">
+     <span class='ocr_line' id='line_1_33' title="bbox 459 959 1197 985; baseline -0.001 -5"><span class='ocrx_word' id='word_1_179' title='bbox 459 959 638 980; x_wconf 83' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_180' title='bbox 645 959 753 985; x_wconf 86' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_181' title='bbox 762 959 858 985; x_wconf 85' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_182' title='bbox 869 959 882 979; x_wconf 88' lang='eng'>6</span> <span class='ocrx_word' id='word_1_183' title='bbox 900 959 976 979; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_184' title='bbox 988 959 1064 979; x_wconf 88' lang='eng'>17979</span> <span class='ocrx_word' id='word_1_185' title='bbox 1083 959 1197 985; x_wconf 83' lang='eng'>(293439)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 561 991 1008 1019">
+     <span class='ocr_line' id='line_1_34' title="bbox 561 991 1008 1019; baseline 0 -7"><span class='ocrx_word' id='word_1_186' title='bbox 561 992 586 1012; x_wconf 96' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_187' title='bbox 599 992 672 1019; x_wconf 84' lang='eng' dir='ltr'><em>baylyi</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 688 992 749 1012; x_wconf 88' lang='eng' dir='ltr'>CCM</span> <span class='ocrx_word' id='word_1_189' title='bbox 761 991 834 1012; x_wconf 81' lang='eng' dir='ltr'>7195T</span> <span class='ocrx_word' id='word_1_190' title='bbox 853 992 1008 1018; x_wconf 86' lang='eng' dir='ltr'>(AM410709)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 456 1025 1223 1051">
+     <span class='ocr_line' id='line_1_35' title="bbox 456 1025 1223 1051; baseline -0.001 -5"><span class='ocrx_word' id='word_1_191' title='bbox 456 1025 635 1046; x_wconf 79' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_192' title='bbox 642 1025 750 1051; x_wconf 89' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_193' title='bbox 759 1031 794 1051; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_194' title='bbox 808 1025 878 1045; x_wconf 80' lang='eng' dir='ltr'>‘close</span> <span class='ocrx_word' id='word_1_195' title='bbox 888 1026 910 1045; x_wconf 87' lang='eng' dir='ltr'>to</span> <span class='ocrx_word' id='word_1_196' title='bbox 922 1025 994 1045; x_wconf 89' lang='eng' dir='ltr'>13TU’</span> <span class='ocrx_word' id='word_1_197' title='bbox 1015 1025 1091 1045; x_wconf 88' lang='eng'>10090</span> <span class='ocrx_word' id='word_1_198' title='bbox 1110 1025 1223 1051; x_wconf 89' lang='eng'>(293449)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 419 1057 1223 1083">
+     <span class='ocr_line' id='line_1_36' title="bbox 419 1057 1223 1083; baseline 0 -5"><span class='ocrx_word' id='word_1_199' title='bbox 419 1057 599 1078; x_wconf 85' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_200' title='bbox 606 1057 714 1083; x_wconf 89' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_201' title='bbox 723 1063 757 1083; x_wconf 88' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_202' title='bbox 771 1057 882 1078; x_wconf 79' lang='eng' dir='ltr'>‘between</span> <span class='ocrx_word' id='word_1_203' title='bbox 894 1057 902 1078; x_wconf 95' lang='eng'>1</span> <span class='ocrx_word' id='word_1_204' title='bbox 917 1057 962 1078; x_wconf 89' lang='eng' dir='ltr'>and</span> <span class='ocrx_word' id='word_1_205' title='bbox 974 1057 993 1078; x_wconf 81' lang='eng'>3&#39;</span> <span class='ocrx_word' id='word_1_206' title='bbox 1014 1057 1091 1078; x_wconf 89' lang='eng'>10095</span> <span class='ocrx_word' id='word_1_207' title='bbox 1110 1057 1223 1083; x_wconf 87' lang='eng'>(293450)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 447 1091 964 1117">
+     <span class='ocr_line' id='line_1_37' title="bbox 447 1091 964 1117; baseline -0.002 -5"><span class='ocrx_word' id='word_1_208' title='bbox 447 1091 471 1111; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_209' title='bbox 484 1091 655 1112; x_wconf 84' lang='eng' dir='ltr'>calcoaceticus</span> <span class='ocrx_word' id='word_1_210' title='bbox 674 1091 733 1111; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_211' title='bbox 745 1091 834 1111; x_wconf 79' lang='eng' dir='ltr'>30006T</span> <span class='ocrx_word' id='word_1_212' title='bbox 850 1091 964 1117; x_wconf 87' lang='eng' dir='ltr'>(X81661)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 420 1124 1099 1150">
+     <span class='ocr_line' id='line_1_38' title="bbox 420 1124 1099 1150; baseline -0.001 -5"><span class='ocrx_word' id='word_1_213' title='bbox 420 1124 598 1145; x_wconf 84' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_214' title='bbox 606 1124 713 1150; x_wconf 90' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_215' title='bbox 723 1129 757 1150; x_wconf 88' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_216' title='bbox 770 1124 783 1144; x_wconf 91' lang='eng'>3</span> <span class='ocrx_word' id='word_1_217' title='bbox 801 1124 877 1144; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_218' title='bbox 890 1124 965 1144; x_wconf 90' lang='eng'>17922</span> <span class='ocrx_word' id='word_1_219' title='bbox 985 1124 1099 1150; x_wconf 86' lang='eng'>(293436)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 48 1154 1822 1184">
+     <span class='ocr_line' id='line_1_39' title="bbox 48 1154 1822 1184; baseline -0.002 -8"><span class='ocrx_word' id='word_1_220' title='bbox 48 1158 91 1178; x_wconf 85' lang='eng'>100</span> <span class='ocrx_word' id='word_1_221' title='bbox 100 1158 577 1160; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_222' title='bbox 586 1154 749 1180; x_wconf 80' lang='eng' dir='ltr'>Alkanindiges</span> <span class='ocrx_word' id='word_1_223' title='bbox 759 1154 903 1175; x_wconf 85' lang='eng' dir='ltr'>iI/inoisensis</span> <span class='ocrx_word' id='word_1_224' title='bbox 922 1154 999 1174; x_wconf 93' lang='eng' dir='ltr'>MVAB</span> <span class='ocrx_word' id='word_1_225' title='bbox 1011 1154 1087 1174; x_wconf 88' lang='eng' dir='ltr'>Hex1T</span> <span class='ocrx_word' id='word_1_226' title='bbox 1105 1154 1253 1180; x_wconf 88' lang='eng' dir='ltr'>(AF513979)</span> <span class='ocrx_word' id='word_1_227' title='bbox 1511 1157 1822 1184; x_wconf 72' lang='eng' dir='ltr'>Psychrobacterimmobm‘s</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 557 1192 1814 1247">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 557 1192 1814 1247">
+     <span class='ocr_line' id='line_1_40' title="bbox 608 1192 1814 1224; baseline 0 -11"><span class='ocrx_word' id='word_1_228' title='bbox 608 1193 612 1224; x_wconf 73' lang='eng' dir='ltr'>I</span> <span class='ocrx_word' id='word_1_229' title='bbox 1510 1192 1587 1213; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_230' title='bbox 1598 1192 1688 1213; x_wconf 74' lang='eng' dir='ltr'>43116T</span> <span class='ocrx_word' id='word_1_231' title='bbox 1698 1192 1814 1219; x_wconf 85' lang='eng' dir='ltr'>(U39399)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 557 1217 1730 1247; baseline 0.003 -9"><span class='ocrx_word' id='word_1_232' title='bbox 557 1217 601 1238; x_wconf 91' lang='eng'>100</span> <span class='ocrx_word' id='word_1_233' title='bbox 1135 1220 1258 1241; x_wconf 88' lang='eng' dir='ltr'>Moraxe/Ia</span> <span class='ocrx_word' id='word_1_234' title='bbox 1267 1220 1375 1241; x_wconf 85' lang='eng' dir='ltr'>Iacunata</span> <span class='ocrx_word' id='word_1_235' title='bbox 1392 1220 1469 1241; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_236' title='bbox 1481 1220 1569 1241; x_wconf 80' lang='eng' dir='ltr'>17967T</span> <span class='ocrx_word' id='word_1_237' title='bbox 1582 1220 1730 1247; x_wconf 86' lang='eng' dir='ltr'>(AF005160)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 282 149 284 231">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 282 149 284 231">
+     <span class='ocr_line' id='line_1_42' title="bbox 282 149 284 231; baseline 0 1016"><span class='ocrx_word' id='word_1_238' title='bbox 282 149 284 231; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 301 278 303 331">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 301 278 303 331">
+     <span class='ocr_line' id='line_1_43' title="bbox 301 278 303 331; baseline 0 916"><span class='ocrx_word' id='word_1_239' title='bbox 301 278 303 331; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 235 303 574 903">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 235 303 574 903">
+     <span class='ocr_line' id='line_1_44' title="bbox 235 303 354 380; baseline 0 -14"><span class='ocrx_word' id='word_1_240' title='bbox 235 303 354 380; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 235 380 354 546; baseline 0 -34"><span class='ocrx_word' id='word_1_241' title='bbox 235 380 354 546; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 261 546 342 641; baseline 0 -33"><span class='ocrx_word' id='word_1_242' title='bbox 261 546 342 641; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 332 641 573 751; baseline 0 0"><span class='ocrx_word' id='word_1_243' title='bbox 332 641 573 751; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 332 751 484 803; baseline 0 0"><span class='ocrx_word' id='word_1_244' title='bbox 332 751 484 803; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 346 803 424 843; baseline 0 404"><span class='ocrx_word' id='word_1_245' title='bbox 346 803 424 843; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 372 843 574 903; baseline 0 0"><span class='ocrx_word' id='word_1_246' title='bbox 372 843 574 903; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 348 393 415 395">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 348 393 415 395">
+     <span class='ocr_line' id='line_1_51' title="bbox 348 393 415 395; baseline 0 852"><span class='ocrx_word' id='word_1_247' title='bbox 348 393 415 395; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 413 377 415 412">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 413 377 415 412">
+     <span class='ocr_line' id='line_1_52' title="bbox 413 377 415 412; baseline 0 835"><span class='ocrx_word' id='word_1_248' title='bbox 413 377 415 412; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 348 232 352 506">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 348 232 352 506">
+     <span class='ocr_line' id='line_1_53' title="bbox 348 232 352 506; baseline 0 741"><span class='ocrx_word' id='word_1_249' title='bbox 348 232 352 506; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 362 458 364 549">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 362 458 364 549">
+     <span class='ocr_line' id='line_1_54' title="bbox 362 458 364 549; baseline 0 698"><span class='ocrx_word' id='word_1_250' title='bbox 362 458 364 549; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 223 138 225 719">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 223 138 225 719">
+     <span class='ocr_line' id='line_1_55' title="bbox 223 138 225 719; baseline 0 528"><span class='ocrx_word' id='word_1_251' title='bbox 223 138 225 719; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 423 623 428 719">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 423 623 428 719">
+     <span class='ocr_line' id='line_1_56' title="bbox 423 623 428 719; baseline 0 528"><span class='ocrx_word' id='word_1_252' title='bbox 423 623 428 719; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 237 446 239 988">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 237 446 239 988">
+     <span class='ocr_line' id='line_1_57' title="bbox 237 446 239 988; baseline 0 259"><span class='ocrx_word' id='word_1_253' title='bbox 237 446 239 988; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 237 986 261 988">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 237 986 261 988">
+     <span class='ocr_line' id='line_1_58' title="bbox 237 986 261 988; baseline 0 259"><span class='ocrx_word' id='word_1_254' title='bbox 237 986 261 988; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 256 992 557 1131">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 256 992 557 1131">
+     <span class='ocr_line' id='line_1_59' title="bbox 256 992 557 1012; baseline 0 235"><span class='ocrx_word' id='word_1_255' title='bbox 256 992 557 1012; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 256 1012 456 1044; baseline 0 203"><span class='ocrx_word' id='word_1_256' title='bbox 256 1012 456 1044; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 256 1044 443 1111; baseline 0 -47"><span class='ocrx_word' id='word_1_257' title='bbox 256 1044 443 1111; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 355 1111 420 1131; baseline 0 116"><span class='ocrx_word' id='word_1_258' title='bbox 355 1111 420 1131; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 259 948 261 1028">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 259 948 261 1028">
+     <span class='ocr_line' id='line_1_63' title="bbox 259 948 261 1028; baseline 0 219"><span class='ocrx_word' id='word_1_259' title='bbox 259 948 261 1028; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 6 128 8 1185">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 6 128 8 1185">
+     <span class='ocr_line' id='line_1_64' title="bbox 6 128 8 1185; baseline 0 62"><span class='ocrx_word' id='word_1_260' title='bbox 6 128 8 1185; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 8 1183 97 1185">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 8 1183 97 1185">
+     <span class='ocr_line' id='line_1_65' title="bbox 8 1183 97 1185; baseline 0 62"><span class='ocrx_word' id='word_1_261' title='bbox 8 1183 97 1185; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 609 1191 1498 1193">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 609 1191 1498 1193">
+     <span class='ocr_line' id='line_1_66' title="bbox 609 1191 1498 1193; baseline 0 54"><span class='ocrx_word' id='word_1_262' title='bbox 609 1191 1498 1193; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 98 1158 100 1209">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 98 1158 100 1209">
+     <span class='ocr_line' id='line_1_67' title="bbox 98 1158 100 1209; baseline 0 38"><span class='ocrx_word' id='word_1_263' title='bbox 98 1158 100 1209; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 98 1207 608 1209">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 98 1207 608 1209">
+     <span class='ocr_line' id='line_1_68' title="bbox 98 1207 608 1209; baseline 0 38"><span class='ocrx_word' id='word_1_264' title='bbox 98 1207 608 1209; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 609 1224 1127 1226">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 609 1224 1127 1226">
+     <span class='ocr_line' id='line_1_69' title="bbox 609 1224 1127 1226; baseline 0 21"><span class='ocrx_word' id='word_1_265' title='bbox 609 1224 1127 1226; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001248-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001248-0-000.pbm.png
new file mode 100644
index 00000000..fb8ac5d2
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001248-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001248-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001248-0-000.pbm.png.hocr
new file mode 100644
index 00000000..dbcfb35f
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001248-0-000.pbm.png.hocr
@@ -0,0 +1,116 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001248-0-000.pbm.png"; bbox 0 0 994 658; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 316 0 941 326">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 342 0 802 31">
+     <span class='ocr_line' id='line_1_1' title="bbox 342 0 802 31; baseline 0.002 -6"><span class='ocrx_word' id='word_1_1' title='bbox 342 7 368 26; x_wconf 82' lang='eng'>90</span> <span class='ocrx_word' id='word_1_2' title='bbox 384 3 408 25; x_wconf 90' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_3' title='bbox 421 3 501 26; x_wconf 87' lang='eng' dir='ltr'><em>brevis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 512 3 576 26; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_5' title='bbox 588 0 632 26; x_wconf 81' lang='eng' dir='ltr'>30T</span> <span class='ocrx_word' id='word_1_6' title='bbox 643 3 802 31; x_wconf 86' lang='eng' dir='ltr'>(AB101593)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 336 36 889 68">
+     <span class='ocr_line' id='line_1_2' title="bbox 336 36 889 68; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 336 36 362 54; x_wconf 86' lang='eng'>45</span> <span class='ocrx_word' id='word_1_8' title='bbox 394 40 418 62; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_9' title='bbox 431 40 555 62; x_wconf 89' lang='eng' dir='ltr'>formosus</span> <span class='ocrx_word' id='word_1_10' title='bbox 566 40 630 62; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_11' title='bbox 642 37 720 62; x_wconf 88' lang='eng' dir='ltr'>9885T</span> <span class='ocrx_word' id='word_1_12' title='bbox 730 40 889 68; x_wconf 91' lang='eng' dir='ltr'>(AB112712)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 330 68 941 141">
+     <span class='ocr_line' id='line_1_3' title="bbox 330 68 941 105; baseline 0 -6"><span class='ocrx_word' id='word_1_13' title='bbox 330 68 352 87; x_wconf 63' lang='eng'>51</span> <span class='ocrx_word' id='word_1_14' title='bbox 396 77 420 99; x_wconf 90' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_15' title='bbox 433 77 608 99; x_wconf 88' lang='eng' dir='ltr'>choshinensis</span> <span class='ocrx_word' id='word_1_16' title='bbox 619 76 682 99; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_17' title='bbox 694 74 772 99; x_wconf 88' lang='eng' dir='ltr'>8552T</span> <span class='ocrx_word' id='word_1_18' title='bbox 783 77 941 105; x_wconf 89' lang='eng' dir='ltr'>(AB112713)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 417 111 895 141; baseline -0.002 -5"><span class='ocrx_word' id='word_1_19' title='bbox 417 113 440 135; x_wconf 90' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_20' title='bbox 454 113 563 136; x_wconf 86' lang='eng' dir='ltr'>reuszeri</span> <span class='ocrx_word' id='word_1_21' title='bbox 572 113 635 136; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_22' title='bbox 647 111 725 136; x_wconf 78' lang='eng' dir='ltr'>9887T</span> <span class='ocrx_word' id='word_1_23' title='bbox 736 113 895 141; x_wconf 92' lang='eng' dir='ltr'>(AB112715)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 412 148 889 178">
+     <span class='ocr_line' id='line_1_5' title="bbox 412 148 889 178; baseline 0.002 -6"><span class='ocrx_word' id='word_1_24' title='bbox 412 150 436 172; x_wconf 91' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_25' title='bbox 448 150 590 178; x_wconf 85' lang='eng' dir='ltr'>parabrevis</span> <span class='ocrx_word' id='word_1_26' title='bbox 601 150 648 173; x_wconf 92' lang='eng' dir='ltr'>IFO</span> <span class='ocrx_word' id='word_1_27' title='bbox 662 148 755 173; x_wconf 78' lang='eng' dir='ltr'>12334T</span> <span class='ocrx_word' id='word_1_28' title='bbox 766 150 889 178; x_wconf 86' lang='eng' dir='ltr'>(D78463)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 383 184 804 216">
+     <span class='ocr_line' id='line_1_6' title="bbox 383 184 804 216; baseline 0 -7"><span class='ocrx_word' id='word_1_29' title='bbox 383 187 408 209; x_wconf 89' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 421 187 472 216; x_wconf 87' lang='eng' dir='ltr'>agri</span> <span class='ocrx_word' id='word_1_31' title='bbox 481 187 545 209; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_32' title='bbox 556 184 635 209; x_wconf 82' lang='eng' dir='ltr'>6348T</span> <span class='ocrx_word' id='word_1_33' title='bbox 646 187 804 215; x_wconf 89' lang='eng' dir='ltr'>(AB112716)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 316 221 939 289">
+     <span class='ocr_line' id='line_1_7' title="bbox 418 221 939 252; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 418 224 441 246; x_wconf 94' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_35' title='bbox 455 224 606 252; x_wconf 88' lang='eng' dir='ltr'>Iimnophilus</span> <span class='ocrx_word' id='word_1_36' title='bbox 617 224 680 246; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_37' title='bbox 691 221 770 246; x_wconf 90' lang='eng' dir='ltr'>6472T</span> <span class='ocrx_word' id='word_1_38' title='bbox 781 224 939 252; x_wconf 93' lang='eng' dir='ltr'>(AB112717)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 316 258 862 289; baseline 0 -6"><span class='ocrx_word' id='word_1_39' title='bbox 316 261 340 283; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_40' title='bbox 353 262 528 289; x_wconf 78' lang='eng' dir='ltr'>centrosporus</span> <span class='ocrx_word' id='word_1_41' title='bbox 539 261 602 283; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_42' title='bbox 614 258 692 283; x_wconf 90' lang='eng' dir='ltr'>8445T</span> <span class='ocrx_word' id='word_1_43' title='bbox 703 261 862 289; x_wconf 85' lang='eng' dir='ltr'>(AB112719)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 349 295 861 326">
+     <span class='ocr_line' id='line_1_9' title="bbox 349 295 861 326; baseline 0 -5"><span class='ocrx_word' id='word_1_44' title='bbox 349 298 372 320; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_45' title='bbox 386 298 514 321; x_wconf 83' lang='eng' dir='ltr'>invocatus</span> <span class='ocrx_word' id='word_1_46' title='bbox 525 298 586 321; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_47' title='bbox 600 295 693 321; x_wconf 87' lang='eng' dir='ltr'>18962T</span> <span class='ocrx_word' id='word_1_48' title='bbox 704 298 861 326; x_wconf 85' lang='eng' dir='ltr'>(AF378232)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 84 455 631">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 0 84 455 631">
+     <span class='ocr_line' id='line_1_10' title="bbox 337 84 411 168; baseline 0 -12"><span class='ocrx_word' id='word_1_49' title='bbox 337 84 411 168; x_wconf 95' lang='eng' dir='ltr'>    </span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 259 168 383 193; baseline 0 465"><span class='ocrx_word' id='word_1_50' title='bbox 259 168 383 193; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 227 193 416 267; baseline 0 -35"><span class='ocrx_word' id='word_1_51' title='bbox 227 193 416 267; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 227 267 316 304; baseline 0 354"><span class='ocrx_word' id='word_1_52' title='bbox 227 267 316 304; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 192 304 347 357; baseline 0 0"><span class='ocrx_word' id='word_1_53' title='bbox 192 304 347 357; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 213 357 299 414; baseline 0 244"><span class='ocrx_word' id='word_1_54' title='bbox 213 357 299 414; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 0 414 347 452; baseline 0 206"><span class='ocrx_word' id='word_1_55' title='bbox 0 414 347 452; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 0 452 455 501; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 0 452 455 501; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 0 501 420 538; baseline 0 120"><span class='ocrx_word' id='word_1_57' title='bbox 0 501 420 538; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 0 538 336 562; baseline 0 96"><span class='ocrx_word' id='word_1_58' title='bbox 0 538 336 562; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 0 562 336 599; baseline 0 59"><span class='ocrx_word' id='word_1_59' title='bbox 0 562 336 599; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 0 599 386 631; baseline 0 27"><span class='ocrx_word' id='word_1_60' title='bbox 0 599 386 631; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 299 371 994 658">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 299 371 789 400">
+     <span class='ocr_line' id='line_1_22' title="bbox 299 371 789 400; baseline 0 -6"><span class='ocrx_word' id='word_1_61' title='bbox 299 371 325 389; x_wconf 84' lang='eng'><strong>99</strong></span> <span class='ocrx_word' id='word_1_62' title='bbox 346 372 373 394; x_wconf 92' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_63' title='bbox 384 372 555 400; x_wconf 85' lang='eng' dir='ltr'>panacihumi</span> <span class='ocrx_word' id='word_1_64' title='bbox 564 371 617 394; x_wconf 91' lang='eng' dir='ltr'>C17</span> <span class='ocrx_word' id='word_1_65' title='bbox 628 372 789 400; x_wconf 85' lang='eng' dir='ltr'>(EU383032)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 347 406 879 437">
+     <span class='ocr_line' id='line_1_23' title="bbox 347 406 879 437; baseline -0.002 -6"><span class='ocrx_word' id='word_1_66' title='bbox 347 408 371 430; x_wconf 93' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_67' title='bbox 385 408 546 431; x_wconf 80' lang='eng' dir='ltr'>borstelensis</span> <span class='ocrx_word' id='word_1_68' title='bbox 557 408 620 431; x_wconf 92' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_69' title='bbox 631 406 710 431; x_wconf 90' lang='eng' dir='ltr'>6347T</span> <span class='ocrx_word' id='word_1_70' title='bbox 721 408 879 437; x_wconf 91' lang='eng' dir='ltr'>(AB112721)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 383 442 853 473">
+     <span class='ocr_line' id='line_1_24' title="bbox 383 442 853 473; baseline 0.002 -6"><span class='ocrx_word' id='word_1_71' title='bbox 383 445 407 467; x_wconf 91' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_72' title='bbox 420 445 510 468; x_wconf 85' lang='eng' dir='ltr'>levickii</span> <span class='ocrx_word' id='word_1_73' title='bbox 520 445 582 468; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_74' title='bbox 593 442 688 468; x_wconf 93' lang='eng' dir='ltr'>22481T</span> <span class='ocrx_word' id='word_1_75' title='bbox 699 445 853 473; x_wconf 86' lang='eng' dir='ltr'>(AJ715378)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 420 479 994 547">
+     <span class='ocr_line' id='line_1_25' title="bbox 458 479 994 510; baseline -0.002 -5"><span class='ocrx_word' id='word_1_76' title='bbox 458 482 482 504; x_wconf 91' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_77' title='bbox 496 482 663 505; x_wconf 83' lang='eng' dir='ltr'>thermoruber</span> <span class='ocrx_word' id='word_1_78' title='bbox 671 482 734 505; x_wconf 85' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_79' title='bbox 746 479 825 505; x_wconf 89' lang='eng' dir='ltr'>7064T</span> <span class='ocrx_word' id='word_1_80' title='bbox 835 482 994 510; x_wconf 89' lang='eng' dir='ltr'>(AB112722)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 420 516 923 547; baseline 0 -6"><span class='ocrx_word' id='word_1_81' title='bbox 420 519 444 541; x_wconf 93' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_82' title='bbox 457 519 623 547; x_wconf 86' lang='eng' dir='ltr'>laterosporus</span> <span class='ocrx_word' id='word_1_83' title='bbox 634 519 698 541; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_84' title='bbox 709 516 754 541; x_wconf 91' lang='eng' dir='ltr'>25T</span> <span class='ocrx_word' id='word_1_85' title='bbox 765 519 923 547; x_wconf 89' lang='eng' dir='ltr'>(AB112720)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 336 553 968 658">
+     <span class='ocr_line' id='line_1_27' title="bbox 336 553 866 584; baseline 0 -6"><span class='ocrx_word' id='word_1_86' title='bbox 336 556 361 578; x_wconf 95' lang='eng' dir='ltr'>B.</span> <span class='ocrx_word' id='word_1_87' title='bbox 373 556 533 584; x_wconf 85' lang='eng' dir='ltr'>ginsengisoli</span> <span class='ocrx_word' id='word_1_88' title='bbox 541 555 607 578; x_wconf 86' lang='eng' dir='ltr'>Gsoil</span> <span class='ocrx_word' id='word_1_89' title='bbox 619 553 697 578; x_wconf 82' lang='eng' dir='ltr'>3088T</span> <span class='ocrx_word' id='word_1_90' title='bbox 708 556 866 584; x_wconf 81' lang='eng' dir='ltr'>(ABZ45376)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 390 590 968 621; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 390 593 603 615; x_wconf 85' lang='eng' dir='ltr'>Aneurinibacillus</span> <span class='ocrx_word' id='word_1_92' title='bbox 613 593 804 621; x_wconf 85' lang='eng' dir='ltr'>aneurinilyticus</span> <span class='ocrx_word' id='word_1_93' title='bbox 815 592 878 615; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_94' title='bbox 890 590 968 615; x_wconf 83' lang='eng' dir='ltr'>5562T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 392 630 551 658; baseline 0 -6"><span class='ocrx_word' id='word_1_95' title='bbox 392 630 551 658; x_wconf 92' lang='eng' dir='ltr'>(AB112724)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001354-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001354-0-000.pbm.png
new file mode 100644
index 00000000..a31caaaa
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001354-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001354-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001354-0-000.pbm.png.hocr
new file mode 100644
index 00000000..aa9440b3
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001354-0-000.pbm.png.hocr
@@ -0,0 +1,98 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001354-0-000.pbm.png"; bbox 0 0 1302 1125; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 5 4 1140 183">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 173 4 1140 183">
+     <span class='ocr_line' id='line_1_1' title="bbox 457 4 1061 33; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 457 6 617 27; x_wconf 66' lang='eng' dir='ltr'>Arthrobacter</span> <span class='ocrx_word' id='word_1_2' title='bbox 622 6 760 33; x_wconf 86' lang='eng' dir='ltr'>globiformis</span> <span class='ocrx_word' id='word_1_3' title='bbox 771 6 830 27; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_4' title='bbox 841 4 932 27; x_wconf 91' lang='eng' dir='ltr'>20124T</span> <span class='ocrx_word' id='word_1_5' title='bbox 942 6 1031 33; x_wconf 84' lang='eng' dir='ltr'>(M2341</span> <span class='ocrx_word' id='word_1_6' title='bbox 1040 6 1061 33; x_wconf 94' lang='eng'>1)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 365 41 922 70; baseline -0.002 -5"><span class='ocrx_word' id='word_1_7' title='bbox 365 44 508 70; x_wconf 78' lang='eng' dir='ltr'>Agromyces</span> <span class='ocrx_word' id='word_1_8' title='bbox 517 49 626 65; x_wconf 87' lang='eng' dir='ltr'>ramosus</span> <span class='ocrx_word' id='word_1_9' title='bbox 636 43 696 65; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_10' title='bbox 706 41 797 65; x_wconf 79' lang='eng' dir='ltr'>43045T</span> <span class='ocrx_word' id='word_1_11' title='bbox 807 43 922 70; x_wconf 95' lang='eng' dir='ltr'>(X77447)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 173 78 1064 108; baseline 0 -6"><span class='ocrx_word' id='word_1_12' title='bbox 173 86 197 103; x_wconf 86' lang='eng'>87</span> <span class='ocrx_word' id='word_1_13' title='bbox 423 81 658 102; x_wconf 82' lang='eng' dir='ltr'>Pseudoclavibacter</span> <span class='ocrx_word' id='word_1_14' title='bbox 665 81 768 102; x_wconf 86' lang='eng' dir='ltr'>helvo/us</span> <span class='ocrx_word' id='word_1_15' title='bbox 779 81 838 102; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_16' title='bbox 849 78 940 102; x_wconf 82' lang='eng' dir='ltr'>20419T</span> <span class='ocrx_word' id='word_1_17' title='bbox 949 81 1064 108; x_wconf 89' lang='eng' dir='ltr'>(X77440)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 571 116 1140 145; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 571 118 732 139; x_wconf 84' lang='eng' dir='ltr'>Gu/osibacter</span> <span class='ocrx_word' id='word_1_19' title='bbox 738 118 906 139; x_wconf 82' lang='eng' dir='ltr'>molinativorax</span> <span class='ocrx_word' id='word_1_20' title='bbox 915 116 985 139; x_wconf 94' lang='eng' dir='ltr'>0N4T</span> <span class='ocrx_word' id='word_1_21' title='bbox 995 118 1140 145; x_wconf 85' lang='eng' dir='ltr'>(AJ306835)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 409 153 1028 183; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 409 156 567 177; x_wconf 85' lang='eng' dir='ltr'>Leucobacter</span> <span class='ocrx_word' id='word_1_23' title='bbox 574 156 714 182; x_wconf 81' lang='eng' dir='ltr'>komagatae</span> <span class='ocrx_word' id='word_1_24' title='bbox 725 156 768 177; x_wconf 90' lang='eng' dir='ltr'>IFO</span> <span class='ocrx_word' id='word_1_25' title='bbox 781 153 869 177; x_wconf 85' lang='eng' dir='ltr'>15245T</span> <span class='ocrx_word' id='word_1_26' title='bbox 879 156 1028 183; x_wconf 88' lang='eng' dir='ltr'>(AB007419)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 3 191 1068 333">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 3 191 1068 333">
+     <span class='ocr_line' id='line_1_6' title="bbox 204 191 992 220; baseline -0.003 -4"><span class='ocrx_word' id='word_1_27' title='bbox 204 199 228 216; x_wconf 88' lang='eng'>67</span> <span class='ocrx_word' id='word_1_28' title='bbox 379 193 511 214; x_wconf 83' lang='eng' dir='ltr'><em>Frondicola</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 521 193 657 214; x_wconf 82' lang='eng' dir='ltr'>australicus</span> <span class='ocrx_word' id='word_1_30' title='bbox 667 193 727 214; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_31' title='bbox 740 191 828 214; x_wconf 88' lang='eng' dir='ltr'>17894T</span> <span class='ocrx_word' id='word_1_32' title='bbox 837 193 992 220; x_wconf 88' lang='eng' dir='ltr'>(DQ525859)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 3 228 822 257; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 3 230 27 247; x_wconf 83' lang='eng'>99</span> <span class='ocrx_word' id='word_1_34' title='bbox 354 230 559 257; x_wconf 80' lang='eng' dir='ltr'>Frigoribacterium</span> <span class='ocrx_word' id='word_1_35' title='bbox 569 230 631 251; x_wconf 87' lang='eng' dir='ltr'><em>faeni</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 639 230 680 251; x_wconf 88' lang='eng'>801</span> <span class='ocrx_word' id='word_1_37' title='bbox 686 228 697 242; x_wconf 76' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_38' title='bbox 707 230 822 257; x_wconf 88' lang='eng' dir='ltr'>(Y18807)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 443 266 1068 295; baseline 0 -6"><span class='ocrx_word' id='word_1_39' title='bbox 443 268 586 289; x_wconf 81' lang='eng' dir='ltr'>CIav/bacter</span> <span class='ocrx_word' id='word_1_40' title='bbox 593 268 773 295; x_wconf 86' lang='eng' dir='ltr'>michiganensis</span> <span class='ocrx_word' id='word_1_41' title='bbox 783 268 843 289; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_42' title='bbox 853 266 944 289; x_wconf 80' lang='eng' dir='ltr'>46364T</span> <span class='ocrx_word' id='word_1_43' title='bbox 954 268 1068 295; x_wconf 87' lang='eng' dir='ltr'>(X77435)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 195 303 940 333; baseline 0 -6"><span class='ocrx_word' id='word_1_44' title='bbox 195 305 219 322; x_wconf 80' lang='eng'>56</span> <span class='ocrx_word' id='word_1_45' title='bbox 402 306 536 327; x_wconf 85' lang='eng' dir='ltr'>Subterco/a</span> <span class='ocrx_word' id='word_1_46' title='bbox 546 306 696 333; x_wconf 85' lang='eng' dir='ltr'>frigoramans</span> <span class='ocrx_word' id='word_1_47' title='bbox 706 303 782 327; x_wconf 90' lang='eng' dir='ltr'>K265T</span> <span class='ocrx_word' id='word_1_48' title='bbox 792 306 940 333; x_wconf 87' lang='eng' dir='ltr'>(AF224723)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 39 341 1300 1057">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 39 341 1300 1057">
+     <span class='ocr_line' id='line_1_10' title="bbox 429 341 993 370; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 429 343 572 370; x_wconf 81' lang='eng' dir='ltr'>Mycetocola</span> <span class='ocrx_word' id='word_1_50' title='bbox 582 343 727 370; x_wconf 83' lang='eng' dir='ltr'>saprophi/us</span> <span class='ocrx_word' id='word_1_51' title='bbox 736 343 816 364; x_wconf 89' lang='eng' dir='ltr'>CM-01</span> <span class='ocrx_word' id='word_1_52' title='bbox 822 341 833 355; x_wconf 79' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_53' title='bbox 843 343 993 370; x_wconf 82' lang='eng' dir='ltr'>(ABO12647)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 447 378 1048 408; baseline 0.002 -7"><span class='ocrx_word' id='word_1_54' title='bbox 447 381 619 407; x_wconf 85' lang='eng' dir='ltr'>Yonghaparkia</span> <span class='ocrx_word' id='word_1_55' title='bbox 629 381 752 407; x_wconf 89' lang='eng' dir='ltr'><em>alkaliphila</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 763 378 884 402; x_wconf 84' lang='eng' dir='ltr'>KSL—113T</span> <span class='ocrx_word' id='word_1_57' title='bbox 894 380 1048 408; x_wconf 87' lang='eng' dir='ltr'>(DQ256087)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 316 416 960 445; baseline 0.008 -11"><span class='ocrx_word' id='word_1_58' title='bbox 316 418 351 435; x_wconf 90' lang='eng'>100</span> <span class='ocrx_word' id='word_1_59' title='bbox 486 418 612 439; x_wconf 84' lang='eng' dir='ltr'>Microce/Ia</span> <span class='ocrx_word' id='word_1_60' title='bbox 621 418 720 444; x_wconf 85' lang='eng' dir='ltr'>putealis</span> <span class='ocrx_word' id='word_1_61' title='bbox 729 416 805 439; x_wconf 91' lang='eng' dir='ltr'>CV-2T</span> <span class='ocrx_word' id='word_1_62' title='bbox 815 418 960 445; x_wconf 84' lang='eng' dir='ltr'>(AJ717388)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 380 453 929 482; baseline -0.002 -5"><span class='ocrx_word' id='word_1_63' title='bbox 380 455 557 482; x_wconf 85' lang='eng' dir='ltr'>Rathayibacter</span> <span class='ocrx_word' id='word_1_64' title='bbox 564 455 650 482; x_wconf 81' lang='eng' dir='ltr'>rathayi</span> <span class='ocrx_word' id='word_1_65' title='bbox 659 455 719 477; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_66' title='bbox 730 453 804 477; x_wconf 89' lang='eng' dir='ltr'>7485T</span> <span class='ocrx_word' id='word_1_67' title='bbox 814 455 929 482; x_wconf 88' lang='eng' dir='ltr'>(X77439)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 422 491 1030 520; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 422 493 544 514; x_wconf 86' lang='eng' dir='ltr'>Labedella</span> <span class='ocrx_word' id='word_1_69' title='bbox 553 493 699 520; x_wconf 84' lang='eng' dir='ltr'>gwakjiensis</span> <span class='ocrx_word' id='word_1_70' title='bbox 708 493 764 514; x_wconf 83' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_71' title='bbox 777 491 865 514; x_wconf 82' lang='eng' dir='ltr'>14008T</span> <span class='ocrx_word' id='word_1_72' title='bbox 876 493 1030 520; x_wconf 85' lang='eng' dir='ltr'>(DQ533552)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 243 528 1300 557; baseline 0 -6"><span class='ocrx_word' id='word_1_73' title='bbox 243 530 267 547; x_wconf 80' lang='eng'>36</span> <span class='ocrx_word' id='word_1_74' title='bbox 647 530 830 557; x_wconf 84' lang='eng' dir='ltr'>Cryobacterium</span> <span class='ocrx_word' id='word_1_75' title='bbox 838 530 1023 557; x_wconf 85' lang='eng' dir='ltr'>psychrophi/um</span> <span class='ocrx_word' id='word_1_76' title='bbox 1032 530 1089 551; x_wconf 89' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_77' title='bbox 1102 528 1174 551; x_wconf 77' lang='eng' dir='ltr'>1463T</span> <span class='ocrx_word' id='word_1_78' title='bbox 1184 530 1300 557; x_wconf 89' lang='eng' dir='ltr'>(D45058)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 377 565 968 594; baseline -0.002 -5"><span class='ocrx_word' id='word_1_79' title='bbox 377 567 570 589; x_wconf 73' lang='eng' dir='ltr'>Cunobacterium</span> <span class='ocrx_word' id='word_1_80' title='bbox 580 568 672 589; x_wconf 85' lang='eng' dir='ltr'>citreum</span> <span class='ocrx_word' id='word_1_81' title='bbox 683 567 742 589; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_82' title='bbox 753 565 843 589; x_wconf 90' lang='eng' dir='ltr'>20528T</span> <span class='ocrx_word' id='word_1_83' title='bbox 853 567 968 594; x_wconf 87' lang='eng' dir='ltr'>(X77436)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 276 603 929 632; baseline -0.003 -4"><span class='ocrx_word' id='word_1_84' title='bbox 276 611 311 628; x_wconf 87' lang='eng'>100</span> <span class='ocrx_word' id='word_1_85' title='bbox 360 605 442 632; x_wconf 81' lang='eng' dir='ltr'>Agreia</span> <span class='ocrx_word' id='word_1_86' title='bbox 452 605 574 626; x_wconf 82' lang='eng' dir='ltr'>bicolorata</span> <span class='ocrx_word' id='word_1_87' title='bbox 583 605 643 626; x_wconf 92' lang='eng' dir='ltr'>VKM</span> <span class='ocrx_word' id='word_1_88' title='bbox 653 603 771 626; x_wconf 82' lang='eng' dir='ltr'>Ac-1804T</span> <span class='ocrx_word' id='word_1_89' title='bbox 781 605 929 632; x_wconf 85' lang='eng' dir='ltr'>(AF159363)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 204 639 871 670; baseline 0 -6"><span class='ocrx_word' id='word_1_90' title='bbox 204 639 228 656; x_wconf 72' lang='eng'>38</span> <span class='ocrx_word' id='word_1_91' title='bbox 338 643 420 670; x_wconf 85' lang='eng' dir='ltr'>Agreia</span> <span class='ocrx_word' id='word_1_92' title='bbox 428 643 545 669; x_wconf 87' lang='eng' dir='ltr'>pratensis</span> <span class='ocrx_word' id='word_1_93' title='bbox 555 643 615 664; x_wconf 92' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_94' title='bbox 627 641 716 664; x_wconf 89' lang='eng' dir='ltr'>14246T</span> <span class='ocrx_word' id='word_1_95' title='bbox 726 643 871 670; x_wconf 83' lang='eng' dir='ltr'>(AJ310412)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 165 678 885 707; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 165 682 188 698; x_wconf 87' lang='eng'>72</span> <span class='ocrx_word' id='word_1_97' title='bbox 411 680 545 701; x_wconf 82' lang='eng' dir='ltr'>Subtercola</span> <span class='ocrx_word' id='word_1_98' title='bbox 554 680 641 701; x_wconf 87' lang='eng' dir='ltr'>boreus</span> <span class='ocrx_word' id='word_1_99' title='bbox 650 678 727 701; x_wconf 88' lang='eng' dir='ltr'>K300T</span> <span class='ocrx_word' id='word_1_100' title='bbox 737 680 885 707; x_wconf 89' lang='eng' dir='ltr'>(AF224722)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 388 717 765 744; baseline 0 -6"><span class='ocrx_word' id='word_1_101' title='bbox 388 717 467 739; x_wconf 84' lang='eng' dir='ltr'><strong>Strain</strong></span> <span class='ocrx_word' id='word_1_102' title='bbox 477 718 601 739; x_wconf 88' lang='eng' dir='ltr'>AHU1810</span> <span class='ocrx_word' id='word_1_103' title='bbox 612 717 765 744; x_wconf 83' lang='eng' dir='ltr'>(AB378302)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 310 753 777 782; baseline 0 -6"><span class='ocrx_word' id='word_1_104' title='bbox 310 755 345 772; x_wconf 88' lang='eng'>100</span> <span class='ocrx_word' id='word_1_105' title='bbox 389 755 467 776; x_wconf 84' lang='eng' dir='ltr'>Strain</span> <span class='ocrx_word' id='word_1_106' title='bbox 477 753 614 776; x_wconf 81' lang='eng' dir='ltr'>AHU1791T</span> <span class='ocrx_word' id='word_1_107' title='bbox 624 755 777 782; x_wconf 87' lang='eng' dir='ltr'>(AB378301)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 215 790 970 819; baseline -0.004 -3"><span class='ocrx_word' id='word_1_108' title='bbox 215 799 237 816; x_wconf 87' lang='eng'>61</span> <span class='ocrx_word' id='word_1_109' title='bbox 412 793 564 814; x_wconf 86' lang='eng' dir='ltr'>Plantibacter</span> <span class='ocrx_word' id='word_1_110' title='bbox 571 792 644 814; x_wconf 86' lang='eng' dir='ltr'><em>ﬂavus</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 655 792 714 814; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_112' title='bbox 727 790 815 814; x_wconf 88' lang='eng' dir='ltr'>14012T</span> <span class='ocrx_word' id='word_1_113' title='bbox 825 792 970 819; x_wconf 82' lang='eng' dir='ltr'>(AJ310417)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 380 827 1026 857; baseline 0 -6"><span class='ocrx_word' id='word_1_114' title='bbox 380 830 546 851; x_wconf 84' lang='eng' dir='ltr'>Okibacterium</span> <span class='ocrx_word' id='word_1_115' title='bbox 556 830 669 851; x_wconf 82' lang='eng' dir='ltr'>friti/lariae</span> <span class='ocrx_word' id='word_1_116' title='bbox 678 830 738 851; x_wconf 94' lang='eng' dir='ltr'>VKM</span> <span class='ocrx_word' id='word_1_117' title='bbox 748 827 866 851; x_wconf 79' lang='eng' dir='ltr'>Ac—2059T</span> <span class='ocrx_word' id='word_1_118' title='bbox 876 830 1026 857; x_wconf 84' lang='eng' dir='ltr'>(AB042094)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 306 865 987 894; baseline -0.004 -3"><span class='ocrx_word' id='word_1_119' title='bbox 306 874 342 891; x_wconf 88' lang='eng'>100</span> <span class='ocrx_word' id='word_1_120' title='bbox 499 868 666 894; x_wconf 87' lang='eng' dir='ltr'><em>Rhodoglobus</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 676 868 762 889; x_wconf 86' lang='eng' dir='ltr'>vestalii</span> <span class='ocrx_word' id='word_1_122' title='bbox 771 865 832 889; x_wconf 85' lang='eng' dir='ltr'>LV3T</span> <span class='ocrx_word' id='word_1_123' title='bbox 842 867 987 894; x_wconf 88' lang='eng' dir='ltr'>(AJ459101)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 350 876 1117 932; baseline 0 -6"><span class='ocrx_word' id='word_1_124' title='bbox 350 876 415 917; x_wconf 66' lang='eng' dir='ltr'>E</span> <span class='ocrx_word' id='word_1_125' title='bbox 428 905 621 926; x_wconf 82' lang='eng' dir='ltr'>Salinibacterium</span> <span class='ocrx_word' id='word_1_126' title='bbox 630 905 799 932; x_wconf 84' lang='eng' dir='ltr'>amurskyense</span> <span class='ocrx_word' id='word_1_127' title='bbox 810 905 873 926; x_wconf 93' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_128' title='bbox 884 903 958 926; x_wconf 78' lang='eng' dir='ltr'>3673T</span> <span class='ocrx_word' id='word_1_129' title='bbox 968 905 1117 932; x_wconf 86' lang='eng' dir='ltr'>(AF539697)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 366 940 912 969; baseline 0 -6"><span class='ocrx_word' id='word_1_130' title='bbox 366 943 537 964; x_wconf 81' lang='eng' dir='ltr'>Microterricola</span> <span class='ocrx_word' id='word_1_131' title='bbox 548 943 638 964; x_wconf 84' lang='eng' dir='ltr'>vlrldarii</span> <span class='ocrx_word' id='word_1_132' title='bbox 646 940 752 964; x_wconf 81' lang='eng' dir='ltr'>KV—677T</span> <span class='ocrx_word' id='word_1_133' title='bbox 762 942 912 969; x_wconf 81' lang='eng' dir='ltr'>(A3282862)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 458 978 982 1007; baseline 0 -6"><span class='ocrx_word' id='word_1_134' title='bbox 458 980 570 1001; x_wconf 84' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 579 980 686 1007; x_wconf 78' lang='eng' dir='ltr'>aquatica</span> <span class='ocrx_word' id='word_1_136' title='bbox 697 980 756 1001; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_137' title='bbox 767 978 857 1001; x_wconf 77' lang='eng' dir='ltr'>20146T</span> <span class='ocrx_word' id='word_1_138' title='bbox 867 980 982 1007; x_wconf 90' lang='eng' dir='ltr'>(X77450)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 39 1015 1051 1057; baseline -0.001 -18"><span class='ocrx_word' id='word_1_139' title='bbox 39 1040 79 1057; x_wconf 32' lang='eng'>0-01</span> <span class='ocrx_word' id='word_1_140' title='bbox 509 1018 659 1044; x_wconf 84' lang='eng' dir='ltr'>Agrococcus</span> <span class='ocrx_word' id='word_1_141' title='bbox 664 1018 772 1044; x_wconf 79' lang='eng' dir='ltr'>jenensis</span> <span class='ocrx_word' id='word_1_142' title='bbox 782 1017 841 1039; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_143' title='bbox 852 1015 927 1039; x_wconf 79' lang='eng' dir='ltr'>9580T</span> <span class='ocrx_word' id='word_1_144' title='bbox 937 1017 1051 1044; x_wconf 89' lang='eng' dir='ltr'>(X92492)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 8 1052 1145 1119">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 8 1052 1145 1119">
+     <span class='ocr_line' id='line_1_29' title="bbox 8 1052 1145 1082; baseline 0 -6"><span class='ocrx_word' id='word_1_145' title='bbox 8 1059 113 1072; x_wconf 83' lang='eng' dir='ltr'>I—I</span> <span class='ocrx_word' id='word_1_146' title='bbox 541 1055 735 1076; x_wconf 82' lang='eng' dir='ltr'>Microbacterium</span> <span class='ocrx_word' id='word_1_147' title='bbox 745 1055 848 1076; x_wconf 83' lang='eng' dir='ltr'>Iacticum</span> <span class='ocrx_word' id='word_1_148' title='bbox 859 1055 919 1076; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_149' title='bbox 930 1052 1020 1076; x_wconf 84' lang='eng' dir='ltr'>20427T</span> <span class='ocrx_word' id='word_1_150' title='bbox 1030 1055 1145 1082; x_wconf 92' lang='eng' dir='ltr'>(X77441)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 422 1090 1139 1119; baseline 0.006 -10"><span class='ocrx_word' id='word_1_151' title='bbox 422 1093 457 1110; x_wconf 88' lang='eng'>100</span> <span class='ocrx_word' id='word_1_152' title='bbox 509 1092 703 1113; x_wconf 82' lang='eng' dir='ltr'><em>Microbacterium</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 713 1092 826 1113; x_wconf 84' lang='eng' dir='ltr'>sch/eiferi</span> <span class='ocrx_word' id='word_1_154' title='bbox 835 1092 880 1113; x_wconf 91' lang='eng' dir='ltr'>IFO</span> <span class='ocrx_word' id='word_1_155' title='bbox 892 1090 980 1113; x_wconf 91' lang='eng' dir='ltr'>15075T</span> <span class='ocrx_word' id='word_1_156' title='bbox 990 1092 1139 1119; x_wconf 83' lang='eng' dir='ltr'>(ABOO4723)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 57 399 81 416">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 57 399 81 416">
+     <span class='ocr_line' id='line_1_31' title="bbox 57 399 81 416; baseline 0 0"><span class='ocrx_word' id='word_1_157' title='bbox 57 399 81 416; x_wconf 88' lang='eng'>65</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001362-0-002.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001362-0-002.pbm.png
new file mode 100644
index 00000000..bdb07af2
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001362-0-002.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001362-0-002.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001362-0-002.pbm.png.hocr
new file mode 100644
index 00000000..ab1ca466
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001362-0-002.pbm.png.hocr
@@ -0,0 +1,131 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001362-0-002.pbm.png"; bbox 0 0 1302 898; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 0 1302 898">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 430 0 1180 234">
+     <span class='ocr_line' id='line_1_1' title="bbox 504 0 1054 27; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 504 1 652 21; x_wconf 84' lang='eng' dir='ltr'><em>Ha/obacillus</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 661 1 785 27; x_wconf 87' lang='eng' dir='ltr'><em>halophilus</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 794 1 852 21; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 862 0 933 21; x_wconf 77' lang='eng' dir='ltr'><em>2266T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 943 1 1054 27; x_wconf 89' lang='eng' dir='ltr'><em>(X62174)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 573 42 1161 68; baseline 0 -5"><span class='ocrx_word' id='word_1_6' title='bbox 573 43 743 63; x_wconf 84' lang='eng' dir='ltr'><em>Marinococcus</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 752 43 876 68; x_wconf 82' lang='eng' dir='ltr'><em>ha/ophi/us</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 886 42 943 63; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 954 42 1039 63; x_wconf 89' lang='eng' dir='ltr'><em>20408T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 1049 42 1161 68; x_wconf 86' lang='eng' dir='ltr'><em>(X90835)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 546 83 1171 110; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 546 84 769 109; x_wconf 81' lang='eng' dir='ltr'><em>SporalactobaciI/us</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 778 84 871 104; x_wconf 84' lang='eng' dir='ltr'><em>inu/inus</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 877 84 950 104; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 961 83 1045 104; x_wconf 77' lang='eng' dir='ltr'><em>15538T</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1055 84 1171 110; x_wconf 83' lang='eng' dir='ltr'><em>(M58838)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 524 124 1180 151; baseline -0.002 -5"><span class='ocrx_word' id='word_1_16' title='bbox 524 125 729 151; x_wconf 82' lang='eng' dir='ltr'><em>Exiguobacterium</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 739 125 890 146; x_wconf 87' lang='eng' dir='ltr'><em>aurantiacum</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 900 125 979 146; x_wconf 88' lang='eng' dir='ltr'>NCDO</span> <span class='ocrx_word' id='word_1_19' title='bbox 988 124 1059 146; x_wconf 85' lang='eng' dir='ltr'><em>2321T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1068 125 1180 151; x_wconf 84' lang='eng' dir='ltr'><em>(X70316)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 430 166 1078 193; baseline 0 -6"><span class='ocrx_word' id='word_1_21' title='bbox 430 167 625 187; x_wconf 84' lang='eng' dir='ltr'><em>Aneurinibacillus</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 634 167 808 193; x_wconf 81' lang='eng' dir='ltr'><em>aneurinilyticus</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 818 166 876 187; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 887 166 957 187; x_wconf 74' lang='eng' dir='ltr'><em>5562T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 967 166 1078 193; x_wconf 85' lang='eng' dir='ltr'><em>(X94194)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 492 207 995 234; baseline 0.002 -6"><span class='ocrx_word' id='word_1_26' title='bbox 492 208 646 228; x_wconf 87' lang='eng' dir='ltr'><em>Brevibaci/lus</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 655 208 728 228; x_wconf 83' lang='eng' dir='ltr'><em>brevis</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 737 208 791 229; x_wconf 92' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 802 207 872 229; x_wconf 84' lang='eng' dir='ltr'><em>2503T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 882 208 995 234; x_wconf 90' lang='eng' dir='ltr'><em>(D78457)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 330 249 1302 442">
+     <span class='ocr_line' id='line_1_7' title="bbox 499 249 1057 275; baseline 0 -5"><span class='ocrx_word' id='word_1_31' title='bbox 499 250 661 270; x_wconf 86' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 669 250 785 275; x_wconf 84' lang='eng' dir='ltr'><em>polymyxa</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 796 250 841 270; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 854 249 1057 275; x_wconf 70' lang='eng' dir='ltr'><em>13419T(D16276)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 634 290 1302 317; baseline 0 -5"><span class='ocrx_word' id='word_1_35' title='bbox 634 291 821 317; x_wconf 87' lang='eng' dir='ltr'><em>Alicyc/obaciI/us</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 830 291 1003 312; x_wconf 82' lang='eng' dir='ltr'><em>acidoterrestris</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1013 291 1070 312; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1081 290 1151 312; x_wconf 79' lang='eng' dir='ltr'><em>3922T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1161 291 1302 317; x_wconf 85' lang='eng' dir='ltr'><em>(AJ133631)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 657 332 1274 359; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 657 333 811 353; x_wconf 84' lang='eng' dir='ltr'><em>SulfobaciI/us</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 820 333 1081 353; x_wconf 82' lang='eng' dir='ltr'><em>thermosu/ﬁdooxidans</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1087 332 1153 353; x_wconf 76' lang='eng' dir='ltr'><em>AT-1T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1163 333 1215 359; x_wconf 85' lang='eng' dir='ltr'><em>(X91</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1221 333 1274 359; x_wconf 89' lang='eng'><em>080)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 330 374 1105 400; baseline -0.001 -5"><span class='ocrx_word' id='word_1_45' title='bbox 330 374 562 400; x_wconf 80' lang='eng' dir='ltr'><em>Mechercharimyces</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 571 374 807 400; x_wconf 82' lang='eng' dir='ltr'><em>asporophorigenens</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 815 374 949 395; x_wconf 75' lang='eng' dir='ltr'><em>YM11-542T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 960 374 1105 400; x_wconf 86' lang='eng' dir='ltr'><em>(AB239532)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 333 415 993 442; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 333 416 564 442; x_wconf 81' lang='eng' dir='ltr'><em>Mechercharimyces</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 573 416 712 441; x_wconf 85' lang='eng' dir='ltr'><em>mesophilus</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 720 415 841 436; x_wconf 77' lang='eng' dir='ltr'><em>YM3-251T</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 848 415 993 442; x_wconf 86' lang='eng' dir='ltr'><em>(AB239529)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 361 456 900 483">
+     <span class='ocr_line' id='line_1_12' title="bbox 361 456 900 483; baseline 0.002 -6"><span class='ocrx_word' id='word_1_53' title='bbox 361 457 509 478; x_wconf 86' lang='eng' dir='ltr'><em>Shimazuella</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 519 457 643 478; x_wconf 87' lang='eng' dir='ltr'><em>kribbensis</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 649 457 667 477; x_wconf 97' lang='eng' dir='ltr'>A</span> <span class='ocrx_word' id='word_1_56' title='bbox 675 456 745 478; x_wconf 78' lang='eng' dir='ltr'><em>9500T</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 755 457 900 483; x_wconf 81' lang='eng' dir='ltr'><em>(ABO49939)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 217 498 999 649">
+     <span class='ocr_line' id='line_1_13' title="bbox 389 498 999 524; baseline 0 -5"><span class='ocrx_word' id='word_1_58' title='bbox 389 498 516 519; x_wconf 88' lang='eng' dir='ltr'><em>Seinonella</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 524 499 682 524; x_wconf 80' lang='eng' dir='ltr'><em>peptonophila</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 693 498 765 519; x_wconf 90' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 775 498 845 519; x_wconf 79' lang='eng' dir='ltr'><em>9740T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 855 498 999 524; x_wconf 86' lang='eng' dir='ltr'><em>(AF138735)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 217 539 990 566; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 217 540 495 560; x_wconf 85' lang='eng' dir='ltr'><em>Thermof/avomicrobium</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 505 540 674 560; x_wconf 83' lang='eng' dir='ltr'><em>dichotomicum</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 684 540 756 560; x_wconf 92' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 767 539 837 560; x_wconf 82' lang='eng' dir='ltr'><em>3667T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 846 540 990 566; x_wconf 83' lang='eng' dir='ltr'><em>(AF138733)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 242 581 964 608; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 242 582 489 608; x_wconf 83' lang='eng' dir='ltr'><em>Thermoactinomyces</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 497 582 639 602; x_wconf 79' lang='eng' dir='ltr'><em>intermedius</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 646 581 718 602; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 728 581 814 602; x_wconf 83' lang='eng' dir='ltr'><em>33205T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 823 581 964 608; x_wconf 88' lang='eng' dir='ltr'><em>(AJ251775)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 224 623 890 649; baseline 0.002 -6"><span class='ocrx_word' id='word_1_73' title='bbox 224 623 470 649; x_wconf 85' lang='eng' dir='ltr'><em>Thermoactinomyces</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 480 623 573 649; x_wconf 87' lang='eng' dir='ltr'><em>vulgaris</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 583 623 656 644; x_wconf 93' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 666 623 735 644; x_wconf 80' lang='eng' dir='ltr'><em>9076T</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 745 623 890 649; x_wconf 86' lang='eng' dir='ltr'><em>(AF138739)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 240 664 755 691">
+     <span class='ocr_line' id='line_1_17' title="bbox 240 664 755 691; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 240 665 355 691; x_wconf 84' lang='eng' dir='ltr'><em>Laceye/Ia</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 363 665 439 690; x_wconf 85' lang='eng' dir='ltr'><em>putida</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 449 664 521 685; x_wconf 89' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 532 664 601 685; x_wconf 89' lang='eng' dir='ltr'><em>3666T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 611 665 755 691; x_wconf 86' lang='eng' dir='ltr'><em>(AF138736)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 233 705 800 732">
+     <span class='ocr_line' id='line_1_18' title="bbox 233 705 800 732; baseline -0.002 -5"><span class='ocrx_word' id='word_1_83' title='bbox 233 706 348 732; x_wconf 85' lang='eng' dir='ltr'><em>Laceyella</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 358 706 461 727; x_wconf 87' lang='eng' dir='ltr'><em>sacchari</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 470 706 556 727; x_wconf 91' lang='eng' dir='ltr'><strong>NCIMB</strong></span> <span class='ocrx_word' id='word_1_86' title='bbox 568 705 649 727; x_wconf 80' lang='eng' dir='ltr'><em>11367T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 659 706 800 732; x_wconf 83' lang='eng' dir='ltr'><em>(AJ251777)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 219 747 828 773">
+     <span class='ocr_line' id='line_1_19' title="bbox 219 747 828 773; baseline 0 -5"><span class='ocrx_word' id='word_1_88' title='bbox 219 748 385 773; x_wconf 86' lang='eng' dir='ltr'><em>Desmospora</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 395 748 472 768; x_wconf 86' lang='eng' dir='ltr'><em>activa</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 482 748 560 768; x_wconf 93' lang='eng' dir='ltr'><strong>IMMIB</strong></span> <span class='ocrx_word' id='word_1_91' title='bbox 572 747 667 768; x_wconf 77' lang='eng' dir='ltr'><em>L-1269T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 677 747 828 773; x_wconf 88' lang='eng' dir='ltr'><em>(AM940019)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 0 786 756 815">
+     <span class='ocr_line' id='line_1_20' title="bbox 0 786 756 815; baseline 0 -6"><span class='ocrx_word' id='word_1_93' title='bbox 0 786 22 801; x_wconf 75' lang='eng'><em>73</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 261 789 379 809; x_wconf 89' lang='eng' dir='ltr'><em>PIaniﬁ/um</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 389 789 504 809; x_wconf 82' lang='eng' dir='ltr'><em>fimeticola</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 515 788 756 815; x_wconf 75' lang='eng' dir='ltr'><em>HO165T(A3088364)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 259 830 755 856">
+     <span class='ocr_line' id='line_1_21' title="bbox 259 830 755 856; baseline 0.002 -6"><span class='ocrx_word' id='word_1_97' title='bbox 259 830 377 851; x_wconf 88' lang='eng' dir='ltr'><em>Planifilum</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 386 830 490 856; x_wconf 83' lang='eng' dir='ltr'><em>fulgidum</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 499 830 600 851; x_wconf 84' lang='eng' dir='ltr'><em>500275T</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 610 830 755 856; x_wconf 80' lang='eng' dir='ltr'><em>(A8088362)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 185 870 761 898">
+     <span class='ocr_line' id='line_1_22' title="bbox 185 870 761 898; baseline 0 -6"><span class='ocrx_word' id='word_1_101' title='bbox 185 870 217 885; x_wconf 44' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 259 872 377 892; x_wconf 85' lang='eng' dir='ltr'><em>Planifi/um</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 385 877 536 898; x_wconf 83' lang='eng' dir='ltr'><em>yunnanense</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 546 871 603 892; x_wconf 75' lang='eng' dir='ltr'><em>LA5T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 613 872 761 898; x_wconf 84' lang='eng' dir='ltr'><em>(DQ119659)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 4 5 652 884">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 4 5 652 884">
+     <span class='ocr_line' id='line_1_23' title="bbox 188 5 570 70; baseline 0 -30"><span class='ocrx_word' id='word_1_106' title='bbox 188 5 570 70; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 155 70 546 123; baseline 0 -42"><span class='ocrx_word' id='word_1_107' title='bbox 155 70 546 123; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 143 123 519 164; baseline 0 0"><span class='ocrx_word' id='word_1_108' title='bbox 143 123 519 164; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 88 164 430 206; baseline 0 692"><span class='ocrx_word' id='word_1_109' title='bbox 88 164 430 206; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 38 206 492 247; baseline 0 651"><span class='ocrx_word' id='word_1_110' title='bbox 38 206 492 247; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 38 247 499 288; baseline 0 610"><span class='ocrx_word' id='word_1_111' title='bbox 38 247 499 288; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 38 288 634 330; baseline 0 568"><span class='ocrx_word' id='word_1_112' title='bbox 38 288 634 330; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 22 330 652 361; baseline 0 537"><span class='ocrx_word' id='word_1_113' title='bbox 22 330 652 361; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 22 361 330 413; baseline 0 485"><span class='ocrx_word' id='word_1_114' title='bbox 22 361 330 413; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 22 413 333 455; baseline 0 443"><span class='ocrx_word' id='word_1_115' title='bbox 22 413 333 455; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 22 455 361 496; baseline 0 402"><span class='ocrx_word' id='word_1_116' title='bbox 22 455 361 496; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 4 496 378 526; baseline 0 372"><span class='ocrx_word' id='word_1_117' title='bbox 4 496 378 526; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 4 526 228 662; baseline 0 -52"><span class='ocrx_word' id='word_1_118' title='bbox 4 526 228 662; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 4 662 232 745; baseline 0 -11"><span class='ocrx_word' id='word_1_119' title='bbox 4 662 232 745; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 4 745 252 884; baseline 0 -98"><span class='ocrx_word' id='word_1_120' title='bbox 4 745 252 884; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 88 16 140 32">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 88 16 140 32">
+     <span class='ocr_line' id='line_1_38' title="bbox 88 16 140 32; baseline 0 0"><span class='ocrx_word' id='word_1_121' title='bbox 88 17 116 32; x_wconf 29' lang='eng'><em>2‘0</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 124 16 140 32; x_wconf 87' lang='eng'>%</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001420-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001420-0-000.pbm.png
new file mode 100644
index 00000000..c9996573
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001420-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001420-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001420-0-000.pbm.png.hocr
new file mode 100644
index 00000000..8cebf9f7
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001420-0-000.pbm.png.hocr
@@ -0,0 +1,260 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001420-0-000.pbm.png"; bbox 0 0 1124 538; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 18 29 68 44">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 18 29 68 44">
+     <span class='ocr_line' id='line_1_1' title="bbox 18 29 68 44; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 18 29 68 44; x_wconf 87' lang='eng'>0.005</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 136 82 157 97">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 136 82 157 97">
+     <span class='ocr_line' id='line_1_2' title="bbox 136 82 157 97; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 136 82 157 97; x_wconf 88' lang='eng'>75</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 294 9 348 51">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 294 9 348 51">
+     <span class='ocr_line' id='line_1_3' title="bbox 321 9 348 30; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 321 9 348 30; x_wconf 59' lang='eng'>5‘1</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 294 36 325 51; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 294 36 325 51; x_wconf 82' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 349 10 351 48">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 349 10 351 48">
+     <span class='ocr_line' id='line_1_5' title="bbox 349 10 351 48; baseline 0 490"><span class='ocrx_word' id='word_1_5' title='bbox 349 10 351 48; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 164 55 332 57">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 164 55 332 57">
+     <span class='ocr_line' id='line_1_6' title="bbox 164 55 332 57; baseline 0 481"><span class='ocrx_word' id='word_1_6' title='bbox 164 55 332 57; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 103 101 166 103">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 103 101 166 103">
+     <span class='ocr_line' id='line_1_7' title="bbox 103 101 166 103; baseline 0 435"><span class='ocrx_word' id='word_1_7' title='bbox 103 101 166 103; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 71 165 105 167">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 71 165 105 167">
+     <span class='ocr_line' id='line_1_8' title="bbox 71 165 105 167; baseline 0 371"><span class='ocrx_word' id='word_1_8' title='bbox 71 165 105 167; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 53 224 73 226">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 53 224 73 226">
+     <span class='ocr_line' id='line_1_9' title="bbox 53 224 73 226; baseline 0 312"><span class='ocrx_word' id='word_1_9' title='bbox 53 224 73 226; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 0 290 54 292">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 0 290 54 292">
+     <span class='ocr_line' id='line_1_10' title="bbox 0 290 54 292; baseline 0 246"><span class='ocrx_word' id='word_1_10' title='bbox 0 290 54 292; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 53 224 54 359">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 53 224 54 359">
+     <span class='ocr_line' id='line_1_11' title="bbox 53 224 54 359; baseline 0 179"><span class='ocrx_word' id='word_1_11' title='bbox 53 224 54 359; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 0 290 2 445">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 0 290 2 445">
+     <span class='ocr_line' id='line_1_12' title="bbox 0 290 2 445; baseline 0 93"><span class='ocrx_word' id='word_1_12' title='bbox 0 290 2 445; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 58 411 60 477">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 58 411 60 477">
+     <span class='ocr_line' id='line_1_13' title="bbox 58 411 60 477; baseline 0 61"><span class='ocrx_word' id='word_1_13' title='bbox 58 411 60 477; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 30 451 51 466">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 30 451 51 466">
+     <span class='ocr_line' id='line_1_14' title="bbox 30 451 51 466; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 30 451 51 466; x_wconf 84' lang='eng'><strong>85</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 71 165 73 285">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 71 165 73 285">
+     <span class='ocr_line' id='line_1_15' title="bbox 71 165 73 285; baseline 0 253"><span class='ocrx_word' id='word_1_15' title='bbox 71 165 73 285; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 103 101 105 230">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 103 101 105 230">
+     <span class='ocr_line' id='line_1_16' title="bbox 103 101 105 230; baseline 0 308"><span class='ocrx_word' id='word_1_16' title='bbox 103 101 105 230; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 71 283 133 285">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 71 283 133 285">
+     <span class='ocr_line' id='line_1_17' title="bbox 71 283 133 285; baseline 0 253"><span class='ocrx_word' id='word_1_17' title='bbox 71 283 133 285; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 78 338 80 377">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 78 338 80 377">
+     <span class='ocr_line' id='line_1_18' title="bbox 78 338 80 377; baseline 0 161"><span class='ocrx_word' id='word_1_18' title='bbox 78 338 80 377; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 103 291 124 307">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 103 291 124 307">
+     <span class='ocr_line' id='line_1_19' title="bbox 103 291 124 307; baseline 0 0"><span class='ocrx_word' id='word_1_19' title='bbox 103 291 124 307; x_wconf 79' lang='eng'>67</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 131 265 133 304">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 131 265 133 304">
+     <span class='ocr_line' id='line_1_20' title="bbox 131 265 133 304; baseline 0 234"><span class='ocrx_word' id='word_1_20' title='bbox 131 265 133 304; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 164 55 166 148">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 164 55 166 148">
+     <span class='ocr_line' id='line_1_21' title="bbox 164 55 166 148; baseline 0 390"><span class='ocrx_word' id='word_1_21' title='bbox 164 55 166 148; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 330 28 332 84">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 330 28 332 84">
+     <span class='ocr_line' id='line_1_22' title="bbox 330 28 332 84; baseline 0 454"><span class='ocrx_word' id='word_1_22' title='bbox 330 28 332 84; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 206 119 303 121">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 206 119 303 121">
+     <span class='ocr_line' id='line_1_23' title="bbox 206 119 303 121; baseline 0 417"><span class='ocrx_word' id='word_1_23' title='bbox 206 119 303 121; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 164 146 206 148">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 164 146 206 148">
+     <span class='ocr_line' id='line_1_24' title="bbox 164 146 206 148; baseline 0 390"><span class='ocrx_word' id='word_1_24' title='bbox 164 146 206 148; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 58 475 166 477">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 58 475 166 477">
+     <span class='ocr_line' id='line_1_25' title="bbox 58 475 166 477; baseline 0 61"><span class='ocrx_word' id='word_1_25' title='bbox 58 475 166 477; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 136 483 157 498">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 136 483 157 498">
+     <span class='ocr_line' id='line_1_26' title="bbox 136 483 157 498; baseline 0 0"><span class='ocrx_word' id='word_1_26' title='bbox 136 483 157 498; x_wconf 81' lang='eng'>98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 164 448 166 504">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 164 448 166 504">
+     <span class='ocr_line' id='line_1_27' title="bbox 164 448 166 504; baseline 0 34"><span class='ocrx_word' id='word_1_27' title='bbox 164 448 166 504; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 176 154 197 169">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 176 154 197 169">
+     <span class='ocr_line' id='line_1_28' title="bbox 176 154 197 169; baseline 0 0"><span class='ocrx_word' id='word_1_28' title='bbox 176 154 197 169; x_wconf 81' lang='eng'>73</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 204 119 206 176">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 204 119 206 176">
+     <span class='ocr_line' id='line_1_29' title="bbox 204 119 206 176; baseline 0 362"><span class='ocrx_word' id='word_1_29' title='bbox 204 119 206 176; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 463 0 1068 101">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 463 0 1068 101">
+     <span class='ocr_line' id='line_1_30' title="bbox 562 0 1040 28; baseline 0 -6"><span class='ocrx_word' id='word_1_30' title='bbox 562 1 585 22; x_wconf 91' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_31' title='bbox 598 1 753 28; x_wconf 87' lang='eng' dir='ltr'>chlororaphis</span> <span class='ocrx_word' id='word_1_32' title='bbox 764 1 810 22; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_33' title='bbox 824 0 912 23; x_wconf 83' lang='eng' dir='ltr'>12354T</span> <span class='ocrx_word' id='word_1_34' title='bbox 922 1 1040 28; x_wconf 80' lang='eng'>(084011)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 590 37 1068 64; baseline 0 -5"><span class='ocrx_word' id='word_1_35' title='bbox 590 38 614 58; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_36' title='bbox 626 37 772 59; x_wconf 85' lang='eng' dir='ltr'>ﬂuorescens</span> <span class='ocrx_word' id='word_1_37' title='bbox 782 37 842 59; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_38' title='bbox 854 37 943 59; x_wconf 81' lang='eng' dir='ltr'>50090T</span> <span class='ocrx_word' id='word_1_39' title='bbox 954 37 1068 64; x_wconf 89' lang='eng'>(276662)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 463 73 884 101; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 463 74 485 95; x_wconf 91' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_41' title='bbox 498 74 605 101; x_wconf 87' lang='eng' dir='ltr'>syringae</span> <span class='ocrx_word' id='word_1_42' title='bbox 616 74 675 95; x_wconf 89' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_43' title='bbox 687 73 759 95; x_wconf 91' lang='eng' dir='ltr'>1247T</span> <span class='ocrx_word' id='word_1_44' title='bbox 769 74 884 101; x_wconf 86' lang='eng'>(276669)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 307 109 684 137">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 307 109 684 137">
+     <span class='ocr_line' id='line_1_33' title="bbox 307 109 684 137; baseline 0.003 -6"><span class='ocrx_word' id='word_1_45' title='bbox 307 110 330 131; x_wconf 94' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_46' title='bbox 341 110 419 137; x_wconf 87' lang='eng' dir='ltr'><em>putida</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 430 110 490 132; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_48' title='bbox 501 109 559 132; x_wconf 81' lang='eng' dir='ltr'>291T</span> <span class='ocrx_word' id='word_1_49' title='bbox 570 110 684 137; x_wconf 89' lang='eng'>(276667)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 206 146 789 210">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 206 146 789 210">
+     <span class='ocr_line' id='line_1_34' title="bbox 206 146 774 194; baseline 0 -26"><span class='ocrx_word' id='word_1_50' title='bbox 206 147 358 194; x_wconf 79' lang='eng' dir='ltr'>_|_—P.</span> <span class='ocrx_word' id='word_1_51' title='bbox 369 146 487 173; x_wconf 84' lang='eng' dir='ltr'><em>parafu/va</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 496 147 527 168; x_wconf 90' lang='eng' dir='ltr'>AJ</span> <span class='ocrx_word' id='word_1_53' title='bbox 538 146 613 168; x_wconf 77' lang='eng' dir='ltr'>2129T</span> <span class='ocrx_word' id='word_1_54' title='bbox 623 146 774 174; x_wconf 89' lang='eng' dir='ltr'>(ABO60132)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 265 182 789 210; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 265 183 288 204; x_wconf 92' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_56' title='bbox 299 183 494 210; x_wconf 86' lang='eng' dir='ltr'>p/ecoglossicida</span> <span class='ocrx_word' id='word_1_57' title='bbox 505 183 559 204; x_wconf 89' lang='eng' dir='ltr'>FPC</span> <span class='ocrx_word' id='word_1_58' title='bbox 570 182 627 204; x_wconf 81' lang='eng' dir='ltr'>951T</span> <span class='ocrx_word' id='word_1_59' title='bbox 638 183 789 210; x_wconf 88' lang='eng' dir='ltr'>(AB009457)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 420 219 899 246">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 420 219 899 246">
+     <span class='ocr_line' id='line_1_36' title="bbox 420 219 899 246; baseline 0 -6"><span class='ocrx_word' id='word_1_60' title='bbox 420 219 443 240; x_wconf 62' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_61' title='bbox 455 219 629 241; x_wconf 86' lang='eng' dir='ltr'>nitroreducens</span> <span class='ocrx_word' id='word_1_62' title='bbox 640 219 686 240; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_63' title='bbox 699 219 771 241; x_wconf 81' lang='eng' dir='ltr'>1439T</span> <span class='ocrx_word' id='word_1_64' title='bbox 781 219 899 246; x_wconf 78' lang='eng'>(084021)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 273 255 687 283">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 273 255 687 283">
+     <span class='ocr_line' id='line_1_37' title="bbox 273 255 687 283; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 273 256 297 277; x_wconf 89' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_66' title='bbox 309 256 402 277; x_wconf 82' lang='eng' dir='ltr'>stutzeri</span> <span class='ocrx_word' id='word_1_67' title='bbox 411 256 458 277; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_68' title='bbox 471 255 559 277; x_wconf 82' lang='eng' dir='ltr'>12668T</span> <span class='ocrx_word' id='word_1_69' title='bbox 569 256 687 283; x_wconf 89' lang='eng' dir='ltr'>(D84024)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 432 292 887 320">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 432 292 887 320">
+     <span class='ocr_line' id='line_1_38' title="bbox 432 292 887 320; baseline 0 -6"><span class='ocrx_word' id='word_1_70' title='bbox 432 292 455 314; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_71' title='bbox 467 292 608 320; x_wconf 88' lang='eng' dir='ltr'>aeruginosa</span> <span class='ocrx_word' id='word_1_72' title='bbox 619 292 677 314; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_73' title='bbox 690 292 762 314; x_wconf 88' lang='eng' dir='ltr'>1242T</span> <span class='ocrx_word' id='word_1_74' title='bbox 772 292 887 320; x_wconf 88' lang='eng'>(276651)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 346 328 856 429">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 346 328 856 429">
+     <span class='ocr_line' id='line_1_39' title="bbox 346 328 751 356; baseline 0 -6"><span class='ocrx_word' id='word_1_75' title='bbox 346 329 369 350; x_wconf 94' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_76' title='bbox 381 329 464 350; x_wconf 83' lang='eng' dir='ltr'>Iuteo/a</span> <span class='ocrx_word' id='word_1_77' title='bbox 476 329 522 350; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_78' title='bbox 535 328 624 350; x_wconf 84' lang='eng' dir='ltr'>13000T</span> <span class='ocrx_word' id='word_1_79' title='bbox 634 329 751 356; x_wconf 87' lang='eng' dir='ltr'>(D84002)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 348 365 830 392; baseline 0 -6"><span class='ocrx_word' id='word_1_80' title='bbox 348 366 371 386; x_wconf 96' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_81' title='bbox 381 366 545 392; x_wconf 86' lang='eng' dir='ltr'>pohangensis</span> <span class='ocrx_word' id='word_1_82' title='bbox 556 365 664 387; x_wconf 76' lang='eng' dir='ltr'>H3—R18T</span> <span class='ocrx_word' id='word_1_83' title='bbox 674 365 830 392; x_wconf 76' lang='eng' dir='ltr'>(D0339144)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 347 401 856 429; baseline 0 -6"><span class='ocrx_word' id='word_1_84' title='bbox 347 402 370 423; x_wconf 91' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_85' title='bbox 381 402 551 429; x_wconf 86' lang='eng' dir='ltr'>pachastreI/ae</span> <span class='ocrx_word' id='word_1_86' title='bbox 563 402 626 423; x_wconf 92' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_87' title='bbox 637 401 695 423; x_wconf 84' lang='eng' dir='ltr'>330T</span> <span class='ocrx_word' id='word_1_88' title='bbox 705 402 856 429; x_wconf 85' lang='eng' dir='ltr'>(AB125366)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 352 510 374 525">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 352 510 374 525">
+     <span class='ocr_line' id='line_1_42' title="bbox 352 510 374 525; baseline 0 0"><span class='ocrx_word' id='word_1_89' title='bbox 352 510 374 525; x_wconf 86' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 381 484 383 522">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 381 484 383 522">
+     <span class='ocr_line' id='line_1_43' title="bbox 381 484 383 522; baseline 0 16"><span class='ocrx_word' id='word_1_90' title='bbox 381 484 383 522; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 392 437 1124 538">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 392 437 1124 538">
+     <span class='ocr_line' id='line_1_44' title="bbox 392 437 712 465; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 392 438 471 459; x_wconf 90' lang='eng' dir='ltr'><strong>Strain</strong></span> <span class='ocrx_word' id='word_1_92' title='bbox 482 437 552 459; x_wconf 83' lang='eng' dir='ltr'>83-3T</span> <span class='ocrx_word' id='word_1_93' title='bbox 559 438 712 465; x_wconf 86' lang='eng' dir='ltr'>(EU286805)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 591 474 1100 502; baseline 0 -7"><span class='ocrx_word' id='word_1_94' title='bbox 591 475 620 495; x_wconf 88' lang='eng' dir='ltr'>‘P.</span> <span class='ocrx_word' id='word_1_95' title='bbox 633 474 790 496; x_wconf 78' lang='eng' dir='ltr'>denitriﬂcans‘</span> <span class='ocrx_word' id='word_1_96' title='bbox 803 475 850 495; x_wconf 94' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_97' title='bbox 863 475 939 496; x_wconf 86' lang='eng'>12023</span> <span class='ocrx_word' id='word_1_98' title='bbox 949 474 1100 502; x_wconf 77' lang='eng' dir='ltr'>(ABOZ1419)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 591 510 1124 538; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 591 511 614 532; x_wconf 93' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_100' title='bbox 625 511 807 538; x_wconf 83' lang='eng' dir='ltr'>pertucinogena</span> <span class='ocrx_word' id='word_1_101' title='bbox 818 511 863 532; x_wconf 93' lang='eng' dir='ltr'>IFO</span> <span class='ocrx_word' id='word_1_102' title='bbox 875 510 963 532; x_wconf 79' lang='eng' dir='ltr'>14163T</span> <span class='ocrx_word' id='word_1_103' title='bbox 973 511 1124 538; x_wconf 88' lang='eng' dir='ltr'>(AB021380)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001461-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001461-0-000.pbm.png
new file mode 100644
index 00000000..86401253
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001461-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001461-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001461-0-000.pbm.png.hocr
new file mode 100644
index 00000000..faf2ae42
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001461-0-000.pbm.png.hocr
@@ -0,0 +1,148 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001461-0-000.pbm.png"; bbox 0 0 1535 855; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 85 58 124 73">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 85 58 124 73">
+     <span class='ocr_line' id='line_1_1' title="bbox 85 58 124 73; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 85 58 124 73; x_wconf 65' lang='eng'><em>0,02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 175 0 1535 855">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 703 0 1535 281">
+     <span class='ocr_line' id='line_1_2' title="bbox 854 0 1470 26; baseline 0 -5"><span class='ocrx_word' id='word_1_2' title='bbox 854 0 994 21; x_wconf 84' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 1003 0 1150 26; x_wconf 88' lang='eng' dir='ltr'><em>aquamarina</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 1161 0 1219 21; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 1230 0 1318 21; x_wconf 79' lang='eng' dir='ltr'><em>30161T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1328 0 1470 26; x_wconf 86' lang='eng' dir='ltr'>(AJ306888)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 864 32 1439 58; baseline 0 -5"><span class='ocrx_word' id='word_1_7' title='bbox 864 32 1004 53; x_wconf 85' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 1013 32 1134 53; x_wconf 83' lang='eng' dir='ltr'><em>meridiana</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 1145 32 1203 53; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 1215 32 1287 53; x_wconf 87' lang='eng' dir='ltr'>5425T</span> <span class='ocrx_word' id='word_1_11' title='bbox 1297 32 1439 58; x_wconf 85' lang='eng' dir='ltr'>(AJ306891)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 1004 64 1522 90; baseline -0.002 -5"><span class='ocrx_word' id='word_1_12' title='bbox 1004 64 1144 85; x_wconf 88' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1154 64 1311 90; x_wconf 85' lang='eng' dir='ltr'><em>magadiensis</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 1320 64 1345 84; x_wconf 90' lang='eng'><em>21</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1360 64 1400 84; x_wconf 82' lang='eng' dir='ltr'><em>MIT</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 1410 64 1522 90; x_wconf 84' lang='eng' dir='ltr'><em>(X92150)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 974 96 1535 122; baseline 0.002 -6"><span class='ocrx_word' id='word_1_17' title='bbox 974 96 1114 117; x_wconf 89' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1124 96 1231 117; x_wconf 88' lang='eng' dir='ltr'><em>variabilis</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1242 96 1300 117; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1311 96 1383 117; x_wconf 86' lang='eng' dir='ltr'>3051T</span> <span class='ocrx_word' id='word_1_21' title='bbox 1393 96 1535 122; x_wconf 86' lang='eng' dir='ltr'>(AJ306893)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 873 127 1438 153; baseline 0 -5"><span class='ocrx_word' id='word_1_22' title='bbox 873 128 1013 148; x_wconf 89' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 1023 127 1148 148; x_wconf 83' lang='eng' dir='ltr'><em>sulfidaeris</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 1159 127 1283 148; x_wconf 86' lang='eng' dir='ltr'><em>Esulfide1T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1292 128 1438 153; x_wconf 91' lang='eng' dir='ltr'>(AF212204)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 768 159 1319 185; baseline 0 -5"><span class='ocrx_word' id='word_1_26' title='bbox 768 160 909 180; x_wconf 87' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 919 160 1015 180; x_wconf 85' lang='eng' dir='ltr'><em>venusta</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1026 159 1084 180; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1094 160 1167 180; x_wconf 91' lang='eng' dir='ltr'><em>4743T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1177 160 1319 185; x_wconf 83' lang='eng' dir='ltr'>(AJ306894)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 766 191 1345 217; baseline -0.002 -5"><span class='ocrx_word' id='word_1_31' title='bbox 766 191 907 212; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 916 191 1099 217; x_wconf 86' lang='eng' dir='ltr'><em>hydrothermalis</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 1109 191 1190 212; x_wconf 88' lang='eng' dir='ltr'><em>Slthf2T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1200 191 1345 217; x_wconf 85' lang='eng' dir='ltr'>(AF212218)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 822 224 1294 249; baseline 0 -5"><span class='ocrx_word' id='word_1_35' title='bbox 822 224 962 244; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 971 224 1101 244; x_wconf 86' lang='eng' dir='ltr'><em>desiderata</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1112 224 1172 244; x_wconf 84' lang='eng' dir='ltr'>FB2T</span> <span class='ocrx_word' id='word_1_38' title='bbox 1182 224 1294 249; x_wconf 86' lang='eng' dir='ltr'><em>(X92417)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 703 255 1334 281; baseline 0 -5"><span class='ocrx_word' id='word_1_39' title='bbox 703 255 843 276; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 852 255 982 281; x_wconf 80' lang='eng' dir='ltr'><em>campisalis</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 991 255 1065 276; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1075 255 1179 276; x_wconf 79' lang='eng' dir='ltr'><em>700597T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1189 255 1334 281; x_wconf 90' lang='eng' dir='ltr'>(AF054286)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 398 287 1402 568">
+     <span class='ocr_line' id='line_1_11' title="bbox 721 287 1339 313; baseline 0 -5"><span class='ocrx_word' id='word_1_44' title='bbox 721 287 861 308; x_wconf 89' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 870 287 1005 313; x_wconf 84' lang='eng' dir='ltr'><em>halmophi/a</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1014 287 1088 308; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1100 287 1187 308; x_wconf 73' lang='eng' dir='ltr'><em>19717T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 1197 287 1339 313; x_wconf 85' lang='eng' dir='ltr'>(AJ306889)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 547 319 1121 345; baseline 0.002 -6"><span class='ocrx_word' id='word_1_49' title='bbox 547 319 687 340; x_wconf 90' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 697 319 817 340; x_wconf 85' lang='eng' dir='ltr'><em>eurihalina</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 826 319 900 340; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 910 319 999 340; x_wconf 79' lang='eng' dir='ltr'><em>49336T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1009 319 1121 345; x_wconf 85' lang='eng' dir='ltr'>(X87218)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 564 349 1124 375; baseline 0 -5"><span class='ocrx_word' id='word_1_54' title='bbox 564 350 704 370; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 714 350 820 375; x_wconf 81' lang='eng' dir='ltr'><em>elongata</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 829 349 904 370; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 914 350 1002 370; x_wconf 84' lang='eng' dir='ltr'>33173T</span> <span class='ocrx_word' id='word_1_58' title='bbox 1012 350 1124 375; x_wconf 86' lang='eng' dir='ltr'>(X67023)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 570 382 1114 408; baseline 0 -5"><span class='ocrx_word' id='word_1_59' title='bbox 570 383 710 403; x_wconf 89' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 720 383 831 408; x_wconf 84' lang='eng' dir='ltr'><em>ha/ophila</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 842 382 899 403; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_62' title='bbox 910 383 971 403; x_wconf 91' lang='eng'><em>4770</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 978 383 988 396; x_wconf 87' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_64' title='bbox 998 383 1114 408; x_wconf 87' lang='eng' dir='ltr'>(M93353)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 398 414 966 440; baseline 0 -5"><span class='ocrx_word' id='word_1_65' title='bbox 398 415 538 435; x_wconf 88' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 548 415 709 440; x_wconf 86' lang='eng' dir='ltr'><em>organivorans</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 719 414 814 435; x_wconf 82' lang='eng' dir='ltr'><em>G-16.1T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 823 415 966 440; x_wconf 85' lang='eng' dir='ltr'><em>(AJ616910)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 581 446 1255 472; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 581 446 812 467; x_wconf 75' lang='eng' dir='ltr'><em>Chromoha/obacter</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 819 447 951 472; x_wconf 81' lang='eng' dir='ltr'><em>sa/exigens</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 961 446 1019 467; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1031 447 1103 467; x_wconf 84' lang='eng' dir='ltr'><em>3043T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1113 447 1255 472; x_wconf 84' lang='eng' dir='ltr'><em>(AJ295146)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 556 478 1259 504; baseline 0 -5"><span class='ocrx_word' id='word_1_74' title='bbox 556 478 788 499; x_wconf 80' lang='eng' dir='ltr'><em>Chromoha/obacter</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 794 479 926 499; x_wconf 84' lang='eng' dir='ltr'><em>israe/ensis</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 935 478 1009 499; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1018 479 1107 499; x_wconf 83' lang='eng' dir='ltr'>43985T</span> <span class='ocrx_word' id='word_1_78' title='bbox 1117 479 1259 504; x_wconf 85' lang='eng' dir='ltr'>(AJ295144)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 689 510 1402 536; baseline 0 -5"><span class='ocrx_word' id='word_1_79' title='bbox 689 510 920 531; x_wconf 85' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 927 510 1068 531; x_wconf 87' lang='eng' dir='ltr'><em>canadensis</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 1077 510 1151 531; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 1161 510 1250 531; x_wconf 78' lang='eng' dir='ltr'><em>43984T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1259 510 1402 536; x_wconf 86' lang='eng' dir='ltr'>(AJ295143)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 662 542 1348 568; baseline -0.001 -5"><span class='ocrx_word' id='word_1_84' title='bbox 662 542 893 563; x_wconf 86' lang='eng' dir='ltr'><em>Chromoha/obacter</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 900 542 1046 563; x_wconf 75' lang='eng' dir='ltr'><em>marismon‘ui</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1053 542 1127 563; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 1140 542 1226 563; x_wconf 84' lang='eng' dir='ltr'><em>17056T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 1236 542 1348 568; x_wconf 88' lang='eng' dir='ltr'>(X87219)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 175 573 1331 855">
+     <span class='ocr_line' id='line_1_20' title="bbox 678 573 1268 599; baseline 0 -5"><span class='ocrx_word' id='word_1_89' title='bbox 678 575 697 590; x_wconf 84' lang='eng'><em>71</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 752 574 892 594; x_wconf 84' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 901 573 1020 594; x_wconf 83' lang='eng' dir='ltr'><em>marisﬂavi</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1028 573 1113 594; x_wconf 84' lang='eng' dir='ltr'><em>SW32T</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 1123 574 1208 599; x_wconf 88' lang='eng' dir='ltr'><em>(AF251</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1216 574 1268 599; x_wconf 88' lang='eng'>143)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 811 605 1331 632; baseline 0 -6"><span class='ocrx_word' id='word_1_95' title='bbox 811 606 951 626; x_wconf 90' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 961 606 1078 626; x_wconf 85' lang='eng' dir='ltr'><em>indalinina</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 1088 605 1179 626; x_wconf 93' lang='eng' dir='ltr'><em>CG2.1T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1189 606 1331 632; x_wconf 86' lang='eng' dir='ltr'><em>(AJ427627)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 741 637 1285 663; baseline 0 -5"><span class='ocrx_word' id='word_1_99' title='bbox 741 637 881 658; x_wconf 81' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 891 637 1023 658; x_wconf 78' lang='eng' dir='ltr'><em>avicenniae</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 1034 637 1124 658; x_wconf 82' lang='eng' dir='ltr'><em>MWZaT</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 1134 637 1285 663; x_wconf 89' lang='eng' dir='ltr'><em>(DQ888315)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 759 669 1070 695; baseline -0.003 -5"><span class='ocrx_word' id='word_1_103' title='bbox 759 669 836 690; x_wconf 90' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 846 669 907 690; x_wconf 91' lang='eng' dir='ltr'><em>A10T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 917 669 1070 695; x_wconf 86' lang='eng' dir='ltr'>(AM941746)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 600 701 1175 727; baseline -0.002 -5"><span class='ocrx_word' id='word_1_106' title='bbox 600 701 803 722; x_wconf 82' lang='eng' dir='ltr'><em>Modicisalibacter</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 810 701 939 722; x_wconf 86' lang='eng' dir='ltr'><em>tunisiensis</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 950 701 1014 721; x_wconf 88' lang='eng' dir='ltr'><em>LIT2T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 1024 701 1175 727; x_wconf 86' lang='eng' dir='ltr'>(DQ641495)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 406 733 897 759; baseline 0 -5"><span class='ocrx_word' id='word_1_110' title='bbox 406 733 499 754; x_wconf 84' lang='eng' dir='ltr'><em>Cobetia</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 509 733 593 754; x_wconf 86' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 604 733 662 754; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 673 733 745 753; x_wconf 95' lang='eng' dir='ltr'><em>4741T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 755 733 897 759; x_wconf 84' lang='eng' dir='ltr'>(AJ306890)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 290 764 824 790; baseline 0 -5"><span class='ocrx_word' id='word_1_115' title='bbox 290 764 438 785; x_wconf 83' lang='eng' dir='ltr'><em>Carnimonas</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 448 764 573 790; x_wconf 87' lang='eng' dir='ltr'><em>nigrificans</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 583 764 702 785; x_wconf 88' lang='eng' dir='ltr'><em>CTCBS1T</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 712 765 824 790; x_wconf 85' lang='eng' dir='ltr'>(Y13299)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 175 796 676 822; baseline 0 -5"><span class='ocrx_word' id='word_1_119' title='bbox 175 797 292 817; x_wconf 76' lang='eng' dir='ltr'><em>Ha/otalea</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 302 797 425 817; x_wconf 77' lang='eng' dir='ltr'><em>alkali/enta</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 434 797 514 817; x_wconf 76' lang='eng' dir='ltr'><em>AW—7T</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 524 796 676 822; x_wconf 89' lang='eng' dir='ltr'>(DQ421388)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 307 828 891 855; baseline 0 -6"><span class='ocrx_word' id='word_1_123' title='bbox 307 829 457 855; x_wconf 76' lang='eng' dir='ltr'><em>Zymobacter</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 462 829 554 855; x_wconf 87' lang='eng' dir='ltr'><em>palmae</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 563 828 638 849; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 648 829 736 849; x_wconf 84' lang='eng' dir='ltr'><em>51623T</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 746 829 891 855; x_wconf 90' lang='eng' dir='ltr'>(AF211871)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 0 2 987 841">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 0 2 987 841">
+     <span class='ocr_line' id='line_1_29' title="bbox 756 2 846 39; baseline 0 816"><span class='ocrx_word' id='word_1_128' title='bbox 756 2 846 39; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 681 39 987 83; baseline 0 -12"><span class='ocrx_word' id='word_1_129' title='bbox 681 39 987 83; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 681 83 974 114; baseline 0 741"><span class='ocrx_word' id='word_1_130' title='bbox 681 83 974 114; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 444 114 873 146; baseline 0 -11"><span class='ocrx_word' id='word_1_131' title='bbox 444 114 873 146; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 444 146 768 178; baseline 0 677"><span class='ocrx_word' id='word_1_132' title='bbox 444 146 768 178; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 352 178 750 198; baseline 0 657"><span class='ocrx_word' id='word_1_133' title='bbox 352 178 750 198; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 279 198 802 242; baseline 0 0"><span class='ocrx_word' id='word_1_134' title='bbox 279 198 802 242; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 182 242 703 294; baseline 0 561"><span class='ocrx_word' id='word_1_135' title='bbox 182 242 703 294; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 182 294 703 326; baseline 0 -20"><span class='ocrx_word' id='word_1_136' title='bbox 182 294 703 326; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 182 326 546 358; baseline 0 497"><span class='ocrx_word' id='word_1_137' title='bbox 182 326 546 358; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 182 358 553 388; baseline 0 467"><span class='ocrx_word' id='word_1_138' title='bbox 182 358 553 388; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 147 388 562 465; baseline 0 -12"><span class='ocrx_word' id='word_1_139' title='bbox 147 388 562 465; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 147 465 556 485; baseline 0 370"><span class='ocrx_word' id='word_1_140' title='bbox 147 465 556 485; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 147 485 538 517; baseline 0 0"><span class='ocrx_word' id='word_1_141' title='bbox 147 485 538 517; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 147 517 517 533; baseline 0 322"><span class='ocrx_word' id='word_1_142' title='bbox 147 517 517 533; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 147 533 643 549; baseline 0 306"><span class='ocrx_word' id='word_1_143' title='bbox 147 533 643 549; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 147 549 643 581; baseline 0 274"><span class='ocrx_word' id='word_1_144' title='bbox 147 549 643 581; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 147 581 752 612; baseline 0 -15"><span class='ocrx_word' id='word_1_145' title='bbox 147 581 752 612; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 147 624 741 676; baseline 0 179"><span class='ocrx_word' id='word_1_146' title='bbox 147 624 741 676; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 0 676 742 720; baseline 0 -32"><span class='ocrx_word' id='word_1_147' title='bbox 0 676 742 720; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 0 720 406 751; baseline 0 0"><span class='ocrx_word' id='word_1_148' title='bbox 0 720 406 751; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 0 751 290 783; baseline 0 72"><span class='ocrx_word' id='word_1_149' title='bbox 0 751 290 783; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 0 783 298 841; baseline 0 -6"><span class='ocrx_word' id='word_1_150' title='bbox 0 783 298 841; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 517 511 539 526">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 517 511 539 526">
+     <span class='ocr_line' id='line_1_52' title="bbox 517 511 539 526; baseline 0 0"><span class='ocrx_word' id='word_1_151' title='bbox 517 511 539 526; x_wconf 79' lang='eng'>98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 539 517 670 533">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 539 517 670 533">
+     <span class='ocr_line' id='line_1_53' title="bbox 539 517 670 533; baseline 0 -4"><span class='ocrx_word' id='word_1_152' title='bbox 539 517 670 533; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001479-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001479-0-001.pbm.png
new file mode 100644
index 00000000..db6bc1e8
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001479-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001479-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001479-0-001.pbm.png.hocr
new file mode 100644
index 00000000..1b77a1b2
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001479-0-001.pbm.png.hocr
@@ -0,0 +1,168 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001479-0-001.pbm.png"; bbox 0 0 1242 1333; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 17 1234 36 1248">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 17 1234 36 1248">
+     <span class='ocr_line' id='line_1_1' title="bbox 17 1234 36 1248; baseline -0.105 0"><span class='ocrx_word' id='word_1_1' title='bbox 17 1234 36 1248; x_wconf 85' lang='eng'><em>7</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 96 11 141 30">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 96 11 141 30">
+     <span class='ocr_line' id='line_1_2' title="bbox 96 11 141 30; baseline -0.022 0"><span class='ocrx_word' id='word_1_2' title='bbox 96 11 141 30; x_wconf 86' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 272 97 292 111">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 272 97 292 111">
+     <span class='ocr_line' id='line_1_3' title="bbox 272 97 292 111; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 272 97 292 111; x_wconf 81' lang='eng'><em>87</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 213 155 293 209">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 213 155 293 209">
+     <span class='ocr_line' id='line_1_4' title="bbox 213 155 234 170; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 213 155 234 170; x_wconf 83' lang='eng'>88</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 272 195 293 209; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 272 195 293 209; x_wconf 81' lang='eng'><em>85</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 233 450 253 464">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 233 450 253 464">
+     <span class='ocr_line' id='line_1_6' title="bbox 233 450 253 464; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 233 450 253 464; x_wconf 77' lang='eng'>89</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 291 548 312 562">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 291 548 312 562">
+     <span class='ocr_line' id='line_1_7' title="bbox 291 548 312 562; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 291 548 312 562; x_wconf 79' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 135 1096 155 1111">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 135 1096 155 1111">
+     <span class='ocr_line' id='line_1_8' title="bbox 135 1096 155 1111; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 135 1096 155 1111; x_wconf 76' lang='eng'>93</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 389 0 906 299">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 389 0 906 299">
+     <span class='ocr_line' id='line_1_9' title="bbox 428 0 906 24; baseline 0 -4"><span class='ocrx_word' id='word_1_9' title='bbox 428 0 450 19; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 461 0 652 20; x_wconf 82' lang='eng' dir='ltr'><em>Iuteof/uorescens</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 661 0 702 20; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 713 0 793 20; x_wconf 79' lang='eng' dir='ltr'><em>13057T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 800 0 906 24; x_wconf 86' lang='eng' dir='ltr'>(U49008)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 408 39 798 63; baseline 0 -4"><span class='ocrx_word' id='word_1_14' title='bbox 408 39 430 59; x_wconf 69' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 442 39 540 59; x_wconf 86' lang='eng' dir='ltr'><em>coeru/ea</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 551 39 592 59; x_wconf 91' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 603 39 683 59; x_wconf 77' lang='eng' dir='ltr'><em>14679T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 692 39 798 63; x_wconf 85' lang='eng' dir='ltr'><em>(U49002)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 389 78 831 103; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 389 79 411 98; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 423 83 573 103; x_wconf 82' lang='eng' dir='ltr'><em>verrucospora</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 584 78 624 98; x_wconf 96' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 636 79 716 98; x_wconf 91' lang='eng' dir='ltr'><em>14100T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 725 79 831 103; x_wconf 86' lang='eng' dir='ltr'>(U49011)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 408 118 762 142; baseline 0 -5"><span class='ocrx_word' id='word_1_24' title='bbox 408 118 430 137; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 442 118 504 137; x_wconf 84' lang='eng' dir='ltr'><em>citrea</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 515 118 555 137; x_wconf 95' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 566 118 646 137; x_wconf 82' lang='eng' dir='ltr'><em>14678T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 656 118 762 142; x_wconf 86' lang='eng' dir='ltr'><em>(U49001)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 447 157 882 181; baseline 0 -5"><span class='ocrx_word' id='word_1_29' title='bbox 447 157 469 176; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 481 157 603 181; x_wconf 85' lang='eng' dir='ltr'><em>glauciﬂava</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 611 157 737 176; x_wconf 81' lang='eng' dir='ltr'><em>AS41202T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 746 157 882 181; x_wconf 84' lang='eng' dir='ltr'><em>(AF153881)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 487 196 848 220; baseline 0.003 -5"><span class='ocrx_word' id='word_1_33' title='bbox 487 196 509 215; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 520 201 591 216; x_wconf 88' lang='eng' dir='ltr'><em>macra</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 601 196 641 216; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 653 196 733 216; x_wconf 83' lang='eng' dir='ltr'><em>14102T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 742 196 848 220; x_wconf 84' lang='eng' dir='ltr'><em>(U49009)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 428 235 816 259; baseline 0 -4"><span class='ocrx_word' id='word_1_38' title='bbox 428 235 450 255; x_wconf 69' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 461 235 563 255; x_wconf 85' lang='eng' dir='ltr'><em>madurae</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 572 235 623 255; x_wconf 93' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 634 235 701 255; x_wconf 81' lang='eng' dir='ltr'><em>7436T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 710 235 816 259; x_wconf 87' lang='eng' dir='ltr'><em>(U58527)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 389 274 844 299; baseline 0 -5"><span class='ocrx_word' id='word_1_43' title='bbox 389 275 411 294; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 422 274 563 294; x_wconf 84' lang='eng' dir='ltr'><em>formosensis</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 570 274 622 294; x_wconf 87' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 632 275 699 294; x_wconf 78' lang='eng' dir='ltr'><em>7474T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 708 275 844 299; x_wconf 88' lang='eng' dir='ltr'><em>(AF002263)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 352 314 1100 369">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 352 314 1100 369">
+     <span class='ocr_line' id='line_1_17' title="bbox 467 314 878 338; baseline 0 -5"><span class='ocrx_word' id='word_1_48' title='bbox 467 314 489 333; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 499 314 599 338; x_wconf 76' lang='eng' dir='ltr'><em>pellet/er]</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 605 314 656 333; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 667 314 878 338; x_wconf 77' lang='eng' dir='ltr'><em>3388T(AF163119)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 352 345 1100 369; baseline -0.001 -3"><span class='ocrx_word' id='word_1_52' title='bbox 352 352 382 366; x_wconf 83' lang='eng'>100</span> <span class='ocrx_word' id='word_1_53' title='bbox 523 345 544 364; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 556 350 641 365; x_wconf 85' lang='eng' dir='ltr'><em>cremea</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 650 345 725 369; x_wconf 83' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 736 350 821 365; x_wconf 86' lang='eng' dir='ltr'><em>cremea</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 830 345 881 365; x_wconf 87' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 892 345 1100 369; x_wconf 84' lang='eng' dir='ltr'><em>3308T(AF134067)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 632 381 1208 436">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 632 381 1208 436">
+     <span class='ocr_line' id='line_1_19' title="bbox 632 381 1208 405; baseline 0 -5"><span class='ocrx_word' id='word_1_59' title='bbox 632 381 654 400; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 666 386 751 400; x_wconf 83' lang='eng' dir='ltr'><em>cremea</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 760 381 834 405; x_wconf 87' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 845 381 955 405; x_wconf 82' lang='eng' dir='ltr'><em>rifamycini</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 964 381 1004 400; x_wconf 90' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1016 381 1208 405; x_wconf 81' lang='eng' dir='ltr'><em>14183T(U49003)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 683 412 1148 436; baseline 0 -5"><span class='ocrx_word' id='word_1_65' title='bbox 683 412 704 431; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 716 412 869 436; x_wconf 80' lang='eng' dir='ltr'><em>catellat/spora</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 877 412 1003 431; x_wconf 71' lang='eng' dir='ltr'><em>AS41522T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1012 412 1148 436; x_wconf 89' lang='eng' dir='ltr'><em>(AF154127)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 428 451 867 514">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 428 451 867 514">
+     <span class='ocr_line' id='line_1_21' title="bbox 448 451 821 475; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 448 451 469 470; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 480 451 539 470; x_wconf 79' lang='eng' dir='ltr'><em>livida</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 548 451 599 470; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 609 451 676 470; x_wconf 83' lang='eng' dir='ltr'><em>3387T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 685 451 821 475; x_wconf 83' lang='eng' dir='ltr'><em>(AF163116)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 428 490 867 514; baseline -0.002 -4"><span class='ocrx_word' id='word_1_74' title='bbox 428 490 450 509; x_wconf 95' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 460 490 586 514; x_wconf 83' lang='eng' dir='ltr'><em>yumaensis</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 594 490 645 510; x_wconf 87' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 655 490 722 510; x_wconf 75' lang='eng' dir='ltr'>3369T</span> <span class='ocrx_word' id='word_1_78' title='bbox 731 490 867 514; x_wconf 85' lang='eng' dir='ltr'><em>(AF163122)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 389 529 814 588">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 389 529 814 588">
+     <span class='ocr_line' id='line_1_23' title="bbox 389 529 793 553; baseline 0 -4"><span class='ocrx_word' id='word_1_79' title='bbox 389 530 411 549; x_wconf 88' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 423 530 511 549; x_wconf 86' lang='eng' dir='ltr'><em>vinacea</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 520 529 571 549; x_wconf 89' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 581 530 648 549; x_wconf 73' lang='eng' dir='ltr'><em>3325T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 658 530 793 553; x_wconf 84' lang='eng' dir='ltr'><em>(AF134070)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 458 563 814 588; baseline 0 -5"><span class='ocrx_word' id='word_1_84' title='bbox 458 564 480 583; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 493 564 558 583; x_wconf 76' lang='eng' dir='ltr'><em>Viridis</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 567 563 608 583; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 619 564 699 583; x_wconf 80' lang='eng' dir='ltr'><em>15238T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 708 564 814 588; x_wconf 89' lang='eng' dir='ltr'><em>(D85467)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 349 601 1242 1220">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 349 601 1242 1220">
+     <span class='ocr_line' id='line_1_25' title="bbox 793 601 1242 625; baseline 0.002 -5"><span class='ocrx_word' id='word_1_89' title='bbox 793 602 1011 625; x_wconf 87' lang='eng' dir='ltr'><em>Thermomonospora</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1020 602 1104 621; x_wconf 77' lang='eng' dir='ltr'><em>sun/eta</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1113 601 1164 621; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1175 602 1242 621; x_wconf 84' lang='eng' dir='ltr'>3096T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 585 633 1241 671; baseline 0 -5"><span class='ocrx_word' id='word_1_93' title='bbox 585 647 606 666; x_wconf 89' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 619 647 711 666; x_wconf 85' lang='eng' dir='ltr'><em>umbrina</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 720 647 771 666; x_wconf 93' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 781 647 848 666; x_wconf 67' lang='eng'><em>68377</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 857 647 993 671; x_wconf 86' lang='eng' dir='ltr'><em>(AF163121)</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1106 633 1241 657; x_wconf 68' lang='eng' dir='ltr'><em>(AF002262)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 565 686 998 710; baseline 0.002 -5"><span class='ocrx_word' id='word_1_99' title='bbox 565 686 587 705; x_wconf 98' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 599 686 740 710; x_wconf 86' lang='eng' dir='ltr'><em>echinospora</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 750 686 791 706; x_wconf 90' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 802 686 882 706; x_wconf 83' lang='eng' dir='ltr'><em>14042T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 892 686 998 710; x_wconf 83' lang='eng' dir='ltr'>(U49004)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 800 725 1190 749; baseline 0 -4"><span class='ocrx_word' id='word_1_104' title='bbox 800 726 822 745; x_wconf 75' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 834 726 908 749; x_wconf 77' lang='eng' dir='ltr'><em>spadix</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 917 725 968 745; x_wconf 83' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 978 726 1045 745; x_wconf 78' lang='eng' dir='ltr'><em>3146T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1054 726 1190 749; x_wconf 85' lang='eng' dir='ltr'><em>(AF163120)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 567 764 1056 789; baseline 0 -5"><span class='ocrx_word' id='word_1_109' title='bbox 567 764 708 789; x_wconf 76' lang='eng' dir='ltr'><em>Spiri/Iospora</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 718 765 777 784; x_wconf 81' lang='eng' dir='ltr'><em>rubra</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 786 764 837 784; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 847 765 1056 789; x_wconf 70' lang='eng' dir='ltr'><em>6875T(AF163123)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 349 804 774 828; baseline 0 -5"><span class='ocrx_word' id='word_1_113' title='bbox 349 804 371 823; x_wconf 94' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 383 804 460 823; x_wconf 83' lang='eng' dir='ltr'><em>fibrosa</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 468 804 538 823; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 547 804 629 823; x_wconf 83' lang='eng' dir='ltr'><em>49459T</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 639 804 732 828; x_wconf 81' lang='eng' dir='ltr'><em>(AF1631</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 741 804 774 828; x_wconf 93' lang='eng'><em>14)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 369 843 830 867; baseline 0 -5"><span class='ocrx_word' id='word_1_119' title='bbox 369 843 391 862; x_wconf 97' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 403 843 529 867; x_wconf 76' lang='eng' dir='ltr'><em>nitrit/genes</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 538 843 592 862; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 602 843 684 862; x_wconf 86' lang='eng' dir='ltr'><em>44137T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 694 843 830 867; x_wconf 84' lang='eng' dir='ltr'><em>(AYO35999)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 469 882 943 906; baseline 0.002 -5"><span class='ocrx_word' id='word_1_124' title='bbox 469 882 610 906; x_wconf 88' lang='eng' dir='ltr'><em>Spiri/lospora</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 620 882 688 902; x_wconf 86' lang='eng' dir='ltr'><em>albida</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 699 882 739 902; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 750 882 830 902; x_wconf 88' lang='eng' dir='ltr'><em>12248T</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 837 882 943 906; x_wconf 85' lang='eng' dir='ltr'><em>(D85498)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 506 921 904 945; baseline 0 -4"><span class='ocrx_word' id='word_1_129' title='bbox 506 922 528 941; x_wconf 74' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 540 922 601 941; x_wconf 82' lang='eng' dir='ltr'><em>Iatina</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 611 921 665 941; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 675 922 757 941; x_wconf 74' lang='eng' dir='ltr'><em>43382T</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 767 922 904 945; x_wconf 83' lang='eng' dir='ltr'><em>(AY035998)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 369 960 819 985; baseline 0 -5"><span class='ocrx_word' id='word_1_134' title='bbox 369 961 391 980; x_wconf 69' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 403 961 561 985; x_wconf 80' lang='eng' dir='ltr'><em>rugatobispora</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 572 960 612 980; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 623 961 704 980; x_wconf 72' lang='eng' dir='ltr'><em>14382T</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 713 961 819 985; x_wconf 83' lang='eng' dir='ltr'>(U49010)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 389 999 802 1024; baseline 0 -5"><span class='ocrx_word' id='word_1_139' title='bbox 389 1000 411 1019; x_wconf 70' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 422 999 545 1019; x_wconf 83' lang='eng' dir='ltr'><em>fulvescens</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 555 999 595 1019; x_wconf 91' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 607 1000 687 1019; x_wconf 81' lang='eng' dir='ltr'><em>14347T</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 696 1000 802 1024; x_wconf 89' lang='eng' dir='ltr'><em>(U49005)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 467 1039 901 1063; baseline 0 -5"><span class='ocrx_word' id='word_1_144' title='bbox 467 1039 489 1058; x_wconf 98' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 501 1039 646 1058; x_wconf 79' lang='eng' dir='ltr'><em>atramentaria</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 656 1039 697 1058; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 708 1039 901 1063; x_wconf 77' lang='eng' dir='ltr'><em>14695T(U49000)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 430 1077 958 1102; baseline 0.002 -5"><span class='ocrx_word' id='word_1_148' title='bbox 430 1077 460 1091; x_wconf 79' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 506 1078 528 1097; x_wconf 94' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 539 1078 681 1098; x_wconf 87' lang='eng' dir='ltr'><em>rubrobrunea</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 692 1078 732 1098; x_wconf 91' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 744 1078 812 1098; x_wconf 84' lang='eng'>14622</span> <span class='ocrx_word' id='word_1_153' title='bbox 822 1078 958 1102; x_wconf 85' lang='eng' dir='ltr'><em>(AF134069)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 506 1117 907 1142; baseline 0 -5"><span class='ocrx_word' id='word_1_154' title='bbox 506 1118 528 1137; x_wconf 74' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 540 1118 648 1137; x_wconf 81' lang='eng' dir='ltr'><em>viridi/utea</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 659 1117 699 1137; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 711 1118 791 1137; x_wconf 89' lang='eng' dir='ltr'><em>14480T</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 800 1118 907 1142; x_wconf 85' lang='eng' dir='ltr'><em>(D86943)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 352 1156 615 1181; baseline 0 -5"><span class='ocrx_word' id='word_1_159' title='bbox 352 1156 386 1176; x_wconf 86' lang='eng' dir='ltr'><strong>BC</strong></span> <span class='ocrx_word' id='word_1_160' title='bbox 395 1157 473 1176; x_wconf 89' lang='eng' dir='ltr'><em>44T-5T</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 479 1157 615 1181; x_wconf 87' lang='eng' dir='ltr'><em>(EF116925)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 349 1196 817 1220; baseline 0 -5"><span class='ocrx_word' id='word_1_162' title='bbox 349 1196 371 1215; x_wconf 94' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 383 1196 502 1220; x_wconf 85' lang='eng' dir='ltr'><em>oligospora</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 510 1196 580 1215; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 589 1196 672 1215; x_wconf 74' lang='eng' dir='ltr'><em>43269T</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 681 1196 817 1220; x_wconf 89' lang='eng' dir='ltr'><em>(AF163118)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 350 430 371 444">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 350 430 371 444">
+     <span class='ocr_line' id='line_1_41' title="bbox 350 430 371 444; baseline 0 0"><span class='ocrx_word' id='word_1_167' title='bbox 350 430 371 444; x_wconf 83' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 193 1235 656 1298">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 193 1235 656 1298">
+     <span class='ocr_line' id='line_1_42' title="bbox 193 1235 588 1259; baseline 0 -5"><span class='ocrx_word' id='word_1_168' title='bbox 193 1235 215 1254; x_wconf 90' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 226 1235 306 1254; x_wconf 83' lang='eng' dir='ltr'><em>hibisca</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 315 1235 366 1254; x_wconf 87' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 376 1235 443 1254; x_wconf 80' lang='eng' dir='ltr'><em>9627T</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 453 1235 588 1259; x_wconf 87' lang='eng' dir='ltr'><em>(AF163115)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 271 1274 656 1298; baseline 0.003 -5"><span class='ocrx_word' id='word_1_173' title='bbox 271 1274 293 1293; x_wconf 96' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 304 1274 399 1298; x_wconf 82' lang='eng' dir='ltr'><em>kijaniata</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 409 1274 450 1294; x_wconf 93' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 461 1274 541 1294; x_wconf 82' lang='eng' dir='ltr'><em>14229T</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 551 1274 656 1298; x_wconf 83' lang='eng' dir='ltr'><em>(U49006)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 504 1309 1009 1333">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 504 1309 1009 1333">
+     <span class='ocr_line' id='line_1_44' title="bbox 504 1309 1009 1333; baseline 0 -5"><span class='ocrx_word' id='word_1_178' title='bbox 504 1309 660 1328; x_wconf 77' lang='eng' dir='ltr'><em>Actinocora/lia</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 669 1309 755 1328; x_wconf 86' lang='eng' dir='ltr'><em>herbida</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 765 1309 805 1328; x_wconf 88' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 817 1309 897 1328; x_wconf 83' lang='eng' dir='ltr'><em>15485T</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 903 1309 1009 1333; x_wconf 86' lang='eng' dir='ltr'><em>(D85473)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001503-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001503-0-000.pbm.png
new file mode 100644
index 00000000..15ebb3a8
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001503-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001503-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001503-0-000.pbm.png.hocr
new file mode 100644
index 00000000..91e0e642
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001503-0-000.pbm.png.hocr
@@ -0,0 +1,166 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001503-0-000.pbm.png"; bbox 0 0 1302 1334; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 97 1314 144 1334">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 97 1314 144 1334">
+     <span class='ocr_line' id='line_1_1' title="bbox 97 1314 144 1334; baseline -0.021 0"><span class='ocrx_word' id='word_1_1' title='bbox 97 1314 144 1334; x_wconf 92' lang='eng'>0.01</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 395 442 423 462">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 395 442 423 462">
+     <span class='ocr_line' id='line_1_2' title="bbox 395 442 423 462; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 395 442 423 462; x_wconf 86' lang='eng'>97</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 308 506 349 525">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 308 506 349 525">
+     <span class='ocr_line' id='line_1_3' title="bbox 308 506 349 525; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 308 506 349 525; x_wconf 90' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 319 671 380 719">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 319 671 380 719">
+     <span class='ocr_line' id='line_1_4' title="bbox 319 671 347 692; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 319 671 347 692; x_wconf 84' lang='eng'>96</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 351 699 380 719; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 351 699 380 719; x_wconf 82' lang='eng'>53</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 314 792 339 812">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 314 792 339 812">
+     <span class='ocr_line' id='line_1_6' title="bbox 314 792 339 812; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 314 792 339 812; x_wconf 86' lang='eng'>91</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 195 879 223 899">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 195 879 223 899">
+     <span class='ocr_line' id='line_1_7' title="bbox 195 879 223 899; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 195 879 223 899; x_wconf 86' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 447 950 475 970">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 447 950 475 970">
+     <span class='ocr_line' id='line_1_8' title="bbox 447 950 475 970; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 447 950 475 970; x_wconf 85' lang='eng'>88</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 334 1135 375 1155">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 334 1135 375 1155">
+     <span class='ocr_line' id='line_1_9' title="bbox 334 1135 375 1155; baseline 0.024 -1"><span class='ocrx_word' id='word_1_9' title='bbox 334 1135 375 1155; x_wconf 87' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 601 0 1177 28">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 601 0 1177 28">
+     <span class='ocr_line' id='line_1_10' title="bbox 601 0 1177 28; baseline 0 -6"><span class='ocrx_word' id='word_1_10' title='bbox 601 7 628 26; x_wconf 81' lang='eng'>73</span> <span class='ocrx_word' id='word_1_11' title='bbox 723 2 746 22; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_12' title='bbox 757 2 913 28; x_wconf 85' lang='eng' dir='ltr'>gerencseriae</span> <span class='ocrx_word' id='word_1_13' title='bbox 923 2 979 23; x_wconf 84' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_14' title='bbox 989 0 1060 23; x_wconf 88' lang='eng' dir='ltr'>6844T</span> <span class='ocrx_word' id='word_1_15' title='bbox 1070 2 1177 28; x_wconf 86' lang='eng' dir='ltr'>(X80414)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 481 34 1279 209">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 481 34 1279 209">
+     <span class='ocr_line' id='line_1_11' title="bbox 543 34 1184 64; baseline 0.002 -6"><span class='ocrx_word' id='word_1_16' title='bbox 543 34 568 54; x_wconf 89' lang='eng'>51</span> <span class='ocrx_word' id='word_1_17' title='bbox 795 39 817 58; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_18' title='bbox 829 39 906 59; x_wconf 86' lang='eng' dir='ltr'>israelii</span> <span class='ocrx_word' id='word_1_19' title='bbox 914 38 956 59; x_wconf 87' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_20' title='bbox 967 36 1066 59; x_wconf 78' lang='eng' dir='ltr'>103259T</span> <span class='ocrx_word' id='word_1_21' title='bbox 1076 39 1184 64; x_wconf 89' lang='eng' dir='ltr'>(X82450)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 650 73 1120 100; baseline 0.002 -5"><span class='ocrx_word' id='word_1_22' title='bbox 650 75 676 95; x_wconf 89' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_23' title='bbox 686 75 847 96; x_wconf 83' lang='eng' dir='ltr'>massiliensis</span> <span class='ocrx_word' id='word_1_24' title='bbox 855 73 971 96; x_wconf 87' lang='eng' dir='ltr'>4401292T</span> <span class='ocrx_word' id='word_1_25' title='bbox 979 75 1120 100; x_wconf 85' lang='eng' dir='ltr'>(EF558367)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 501 109 1161 137; baseline 0 -5"><span class='ocrx_word' id='word_1_26' title='bbox 501 112 529 132; x_wconf 94' lang='eng'>57</span> <span class='ocrx_word' id='word_1_27' title='bbox 720 111 743 131; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_28' title='bbox 755 111 833 132; x_wconf 83' lang='eng' dir='ltr'>on&#39;cola</span> <span class='ocrx_word' id='word_1_29' title='bbox 843 111 919 132; x_wconf 88' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_30' title='bbox 929 109 1015 132; x_wconf 77' lang='eng' dir='ltr'>46090T</span> <span class='ocrx_word' id='word_1_31' title='bbox 1024 111 1161 137; x_wconf 85' lang='eng' dir='ltr'>(AJ507295)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 481 145 1279 178; baseline 0 -10"><span class='ocrx_word' id='word_1_32' title='bbox 481 158 505 178; x_wconf 66' lang='eng'>81</span> <span class='ocrx_word' id='word_1_33' title='bbox 893 148 916 168; x_wconf 98' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_34' title='bbox 928 148 1020 168; x_wconf 81' lang='eng' dir='ltr'>dental/s</span> <span class='ocrx_word' id='word_1_35' title='bbox 1029 145 1133 168; x_wconf 81' lang='eng' dir='ltr'>R18165T</span> <span class='ocrx_word' id='word_1_36' title='bbox 1143 148 1279 173; x_wconf 85' lang='eng' dir='ltr'>(AJ697609)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 581 182 1242 209; baseline 0 -5"><span class='ocrx_word' id='word_1_37' title='bbox 581 189 609 209; x_wconf 78' lang='eng'>82</span> <span class='ocrx_word' id='word_1_38' title='bbox 864 184 887 204; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_39' title='bbox 898 184 1020 204; x_wconf 85' lang='eng' dir='ltr'>ruminicola</span> <span class='ocrx_word' id='word_1_40' title='bbox 1030 182 1087 204; x_wconf 85' lang='eng' dir='ltr'>B71T</span> <span class='ocrx_word' id='word_1_41' title='bbox 1097 184 1242 209; x_wconf 89' lang='eng' dir='ltr'>(DQO72005)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 614 218 1166 355">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 614 218 1166 355">
+     <span class='ocr_line' id='line_1_16' title="bbox 702 218 1166 246; baseline -0.002 -5"><span class='ocrx_word' id='word_1_42' title='bbox 702 221 724 240; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_43' title='bbox 736 221 872 241; x_wconf 83' lang='eng' dir='ltr'>denticolens</span> <span class='ocrx_word' id='word_1_44' title='bbox 882 220 954 241; x_wconf 90' lang='eng' dir='ltr'>NCTC</span> <span class='ocrx_word' id='word_1_45' title='bbox 966 218 1048 241; x_wconf 78' lang='eng' dir='ltr'>11490T</span> <span class='ocrx_word' id='word_1_46' title='bbox 1059 221 1166 246; x_wconf 89' lang='eng' dir='ltr'>(X80412)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 647 254 1071 282; baseline 0 -5"><span class='ocrx_word' id='word_1_47' title='bbox 647 257 670 277; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_48' title='bbox 682 257 746 277; x_wconf 80' lang='eng' dir='ltr'>catuli</span> <span class='ocrx_word' id='word_1_49' title='bbox 753 256 830 277; x_wconf 90' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_50' title='bbox 840 254 925 277; x_wconf 85' lang='eng' dir='ltr'>41709T</span> <span class='ocrx_word' id='word_1_51' title='bbox 935 257 1071 282; x_wconf 84' lang='eng' dir='ltr'>(AJ276805)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 620 291 1034 318; baseline 0 -4"><span class='ocrx_word' id='word_1_52' title='bbox 620 293 643 314; x_wconf 90' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_53' title='bbox 655 293 744 314; x_wconf 88' lang='eng' dir='ltr'>howe/lii</span> <span class='ocrx_word' id='word_1_54' title='bbox 752 293 825 314; x_wconf 90' lang='eng' dir='ltr'>NCTC</span> <span class='ocrx_word' id='word_1_55' title='bbox 837 291 1034 318; x_wconf 69' lang='eng' dir='ltr'>11636T(X80411)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 614 327 1048 355; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 614 330 637 350; x_wconf 88' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_57' title='bbox 649 330 722 350; x_wconf 82' lang='eng' dir='ltr'>slackii</span> <span class='ocrx_word' id='word_1_58' title='bbox 730 330 807 350; x_wconf 87' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_59' title='bbox 817 327 902 350; x_wconf 73' lang='eng' dir='ltr'>32792T</span> <span class='ocrx_word' id='word_1_60' title='bbox 912 330 1048 355; x_wconf 87' lang='eng' dir='ltr'>(AJ234066)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 493 364 1079 391">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 493 364 1079 391">
+     <span class='ocr_line' id='line_1_20' title="bbox 493 364 1079 391; baseline 0.002 -6"><span class='ocrx_word' id='word_1_61' title='bbox 493 368 522 388; x_wconf 30' lang='eng'>1.</span> <span class='ocrx_word' id='word_1_62' title='bbox 611 366 634 386; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_63' title='bbox 646 366 752 386; x_wconf 84' lang='eng' dir='ltr'>bowdenii</span> <span class='ocrx_word' id='word_1_64' title='bbox 760 366 837 386; x_wconf 89' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_65' title='bbox 847 364 932 386; x_wconf 79' lang='eng' dir='ltr'>37421T</span> <span class='ocrx_word' id='word_1_66' title='bbox 942 366 1079 391; x_wconf 84' lang='eng' dir='ltr'>(AJ234039)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 518 400 1302 1155">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 518 400 1302 1155">
+     <span class='ocr_line' id='line_1_21' title="bbox 572 400 1095 428; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 572 412 647 414; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_68' title='bbox 661 403 683 422; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_69' title='bbox 695 402 817 422; x_wconf 81' lang='eng' dir='ltr'><em>naeslundii</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 826 402 881 422; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_71' title='bbox 892 400 978 422; x_wconf 78' lang='eng' dir='ltr'>43013T</span> <span class='ocrx_word' id='word_1_72' title='bbox 987 402 1095 428; x_wconf 86' lang='eng' dir='ltr'>(X53226)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 522 437 1302 464; baseline 0.003 -7"><span class='ocrx_word' id='word_1_73' title='bbox 522 444 563 464; x_wconf 82' lang='eng'>100</span> <span class='ocrx_word' id='word_1_74' title='bbox 572 448 868 450; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_75' title='bbox 882 439 904 458; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_76' title='bbox 916 439 1019 459; x_wconf 80' lang='eng' dir='ltr'><em>viscosus</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1028 439 1084 459; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_78' title='bbox 1094 437 1180 459; x_wconf 79' lang='eng' dir='ltr'>43327T</span> <span class='ocrx_word' id='word_1_79' title='bbox 1190 439 1302 464; x_wconf 86' lang='eng' dir='ltr'>(M33908)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 545 475 1030 500; baseline 0 -5"><span class='ocrx_word' id='word_1_80' title='bbox 545 475 568 495; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_81' title='bbox 580 475 717 500; x_wconf 78' lang='eng' dir='ltr'>urogenitalis</span> <span class='ocrx_word' id='word_1_82' title='bbox 726 475 803 495; x_wconf 88' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_83' title='bbox 813 475 887 495; x_wconf 88' lang='eng'>28744</span> <span class='ocrx_word' id='word_1_84' title='bbox 895 475 1030 500; x_wconf 79' lang='eng' dir='ltr'>(AJ243893)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 587 509 978 537; baseline 0 -6"><span class='ocrx_word' id='word_1_85' title='bbox 587 512 610 531; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_86' title='bbox 622 512 684 531; x_wconf 79' lang='eng' dir='ltr'><em>Davis</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 694 511 765 531; x_wconf 90' lang='eng' dir='ltr'>NCTC</span> <span class='ocrx_word' id='word_1_88' title='bbox 777 509 861 531; x_wconf 79' lang='eng' dir='ltr'>11535T</span> <span class='ocrx_word' id='word_1_89' title='bbox 871 512 978 537; x_wconf 88' lang='eng' dir='ltr'>(X81061)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 554 545 1052 573; baseline 0 -5"><span class='ocrx_word' id='word_1_90' title='bbox 554 548 577 567; x_wconf 97' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_91' title='bbox 589 548 724 568; x_wconf 83' lang='eng' dir='ltr'>radicidentis</span> <span class='ocrx_word' id='word_1_92' title='bbox 733 547 810 568; x_wconf 89' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_93' title='bbox 821 545 906 568; x_wconf 76' lang='eng' dir='ltr'>36733T</span> <span class='ocrx_word' id='word_1_94' title='bbox 915 548 1052 573; x_wconf 85' lang='eng' dir='ltr'>(AJ251986)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 635 582 1134 610; baseline 0.002 -6"><span class='ocrx_word' id='word_1_95' title='bbox 635 584 658 604; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_96' title='bbox 670 584 808 610; x_wconf 78' lang='eng' dir='ltr'>graevenitzii</span> <span class='ocrx_word' id='word_1_97' title='bbox 816 584 892 605; x_wconf 88' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_98' title='bbox 902 582 988 605; x_wconf 83' lang='eng' dir='ltr'>27294T</span> <span class='ocrx_word' id='word_1_99' title='bbox 997 584 1134 610; x_wconf 84' lang='eng' dir='ltr'>(AJ540309)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 601 619 1061 646; baseline 0 -5"><span class='ocrx_word' id='word_1_100' title='bbox 601 621 623 640; x_wconf 89' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_101' title='bbox 635 621 732 641; x_wconf 83' lang='eng' dir='ltr'>nasicola</span> <span class='ocrx_word' id='word_1_102' title='bbox 742 620 819 641; x_wconf 87' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_103' title='bbox 829 619 915 641; x_wconf 77' lang='eng' dir='ltr'>46092T</span> <span class='ocrx_word' id='word_1_104' title='bbox 924 621 1061 646; x_wconf 88' lang='eng' dir='ltr'>(AJ508455)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 686 655 1142 683; baseline 0.002 -6"><span class='ocrx_word' id='word_1_105' title='bbox 686 658 709 677; x_wconf 96' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_106' title='bbox 720 658 901 683; x_wconf 84' lang='eng' dir='ltr'>hongkongensis</span> <span class='ocrx_word' id='word_1_107' title='bbox 912 655 992 678; x_wconf 89' lang='eng' dir='ltr'>HKU8T</span> <span class='ocrx_word' id='word_1_108' title='bbox 1002 658 1142 683; x_wconf 83' lang='eng' dir='ltr'>(AF433168)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 562 691 1124 719; baseline 0 -5"><span class='ocrx_word' id='word_1_109' title='bbox 562 694 585 714; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_110' title='bbox 596 694 796 714; x_wconf 84' lang='eng' dir='ltr'><em>marimammalium</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 805 694 882 714; x_wconf 90' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_112' title='bbox 892 691 977 714; x_wconf 89' lang='eng' dir='ltr'>41710T</span> <span class='ocrx_word' id='word_1_113' title='bbox 987 694 1124 719; x_wconf 86' lang='eng' dir='ltr'>(AJ276405)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 535 728 958 755; baseline 0 -4"><span class='ocrx_word' id='word_1_114' title='bbox 535 730 557 750; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_115' title='bbox 570 730 632 751; x_wconf 81' lang='eng' dir='ltr'><em>canis</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 640 730 716 751; x_wconf 89' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_117' title='bbox 727 728 812 751; x_wconf 87' lang='eng' dir='ltr'>41706T</span> <span class='ocrx_word' id='word_1_118' title='bbox 822 730 958 755; x_wconf 86' lang='eng' dir='ltr'>(AJ243891)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 653 764 991 792; baseline 0 -6"><span class='ocrx_word' id='word_1_119' title='bbox 653 766 676 786; x_wconf 97' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_120' title='bbox 688 766 792 792; x_wconf 83' lang='eng' dir='ltr'>radingae</span> <span class='ocrx_word' id='word_1_121' title='bbox 800 764 877 786; x_wconf 92' lang='eng' dir='ltr'>APL1T</span> <span class='ocrx_word' id='word_1_122' title='bbox 884 766 991 792; x_wconf 85' lang='eng' dir='ltr'>(X78719)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 518 801 920 828; baseline 0.002 -6"><span class='ocrx_word' id='word_1_123' title='bbox 518 803 540 822; x_wconf 90' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_124' title='bbox 552 803 656 828; x_wconf 84' lang='eng' dir='ltr'>georgiae</span> <span class='ocrx_word' id='word_1_125' title='bbox 665 803 722 823; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_126' title='bbox 732 801 802 823; x_wconf 76' lang='eng' dir='ltr'>6843T</span> <span class='ocrx_word' id='word_1_127' title='bbox 813 803 920 828; x_wconf 82' lang='eng' dir='ltr'>(X80413)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 530 837 1049 864; baseline 0 -5"><span class='ocrx_word' id='word_1_128' title='bbox 530 839 553 859; x_wconf 66' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_129' title='bbox 565 839 722 864; x_wconf 78' lang='eng' dir='ltr'>odontolyticus</span> <span class='ocrx_word' id='word_1_130' title='bbox 731 839 807 859; x_wconf 90' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_131' title='bbox 817 837 903 859; x_wconf 81' lang='eng' dir='ltr'>20536T</span> <span class='ocrx_word' id='word_1_132' title='bbox 912 839 1049 864; x_wconf 82' lang='eng' dir='ltr'>(AJ234040)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 545 873 1044 901; baseline 0 -6"><span class='ocrx_word' id='word_1_133' title='bbox 545 876 568 895; x_wconf 90' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_134' title='bbox 580 876 716 895; x_wconf 83' lang='eng' dir='ltr'>cardiffensis</span> <span class='ocrx_word' id='word_1_135' title='bbox 725 876 801 895; x_wconf 88' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_136' title='bbox 811 873 897 895; x_wconf 78' lang='eng' dir='ltr'>44997T</span> <span class='ocrx_word' id='word_1_137' title='bbox 907 876 1044 901; x_wconf 86' lang='eng' dir='ltr'>(AJ421779)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 593 910 1048 937; baseline 0 -5"><span class='ocrx_word' id='word_1_138' title='bbox 593 912 616 932; x_wconf 68' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_139' title='bbox 629 912 788 932; x_wconf 82' lang='eng' dir='ltr'>vaccimaxillae</span> <span class='ocrx_word' id='word_1_140' title='bbox 798 910 901 932; x_wconf 84' lang='eng' dir='ltr'>R10176T</span> <span class='ocrx_word' id='word_1_141' title='bbox 911 912 1048 937; x_wconf 89' lang='eng' dir='ltr'>(AJ427451)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 593 946 958 974; baseline -0.003 -5"><span class='ocrx_word' id='word_1_142' title='bbox 593 948 616 968; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_143' title='bbox 628 948 741 969; x_wconf 80' lang='eng' dir='ltr'>tun&#39;censis</span> <span class='ocrx_word' id='word_1_144' title='bbox 749 946 841 969; x_wconf 93' lang='eng' dir='ltr'>APL10T</span> <span class='ocrx_word' id='word_1_145' title='bbox 851 948 958 974; x_wconf 85' lang='eng' dir='ltr'>(X78720)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 582 982 1014 1010; baseline 0.002 -6"><span class='ocrx_word' id='word_1_146' title='bbox 582 985 604 1004; x_wconf 96' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_147' title='bbox 617 984 688 1005; x_wconf 86' lang='eng' dir='ltr'>funkei</span> <span class='ocrx_word' id='word_1_148' title='bbox 696 984 773 1005; x_wconf 88' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_149' title='bbox 783 982 868 1005; x_wconf 79' lang='eng' dir='ltr'>42773T</span> <span class='ocrx_word' id='word_1_150' title='bbox 879 985 1014 1010; x_wconf 83' lang='eng' dir='ltr'>(AJ404889)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 562 1019 1022 1046; baseline 0 -5"><span class='ocrx_word' id='word_1_151' title='bbox 562 1021 585 1041; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_152' title='bbox 597 1021 746 1046; x_wconf 82' lang='eng' dir='ltr'>hyovaginalis</span> <span class='ocrx_word' id='word_1_153' title='bbox 755 1021 825 1041; x_wconf 90' lang='eng' dir='ltr'>NCFB</span> <span class='ocrx_word' id='word_1_154' title='bbox 835 1019 905 1041; x_wconf 75' lang='eng' dir='ltr'>2983T</span> <span class='ocrx_word' id='word_1_155' title='bbox 915 1021 1022 1046; x_wconf 84' lang='eng' dir='ltr'>(X69616)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 572 1055 1081 1083; baseline 0 -6"><span class='ocrx_word' id='word_1_156' title='bbox 572 1058 595 1077; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_157' title='bbox 607 1058 754 1077; x_wconf 82' lang='eng' dir='ltr'><em>suimastitidis</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 763 1057 840 1077; x_wconf 87' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_159' title='bbox 850 1055 935 1077; x_wconf 77' lang='eng' dir='ltr'>3927GT</span> <span class='ocrx_word' id='word_1_160' title='bbox 945 1058 1081 1083; x_wconf 79' lang='eng' dir='ltr'>(AJ277385)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 674 1092 1163 1119; baseline 0 -5"><span class='ocrx_word' id='word_1_161' title='bbox 674 1094 698 1114; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_162' title='bbox 709 1094 836 1114; x_wconf 85' lang='eng' dir='ltr'>coleocanis</span> <span class='ocrx_word' id='word_1_163' title='bbox 846 1094 922 1114; x_wconf 87' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_164' title='bbox 931 1092 1017 1114; x_wconf 91' lang='eng' dir='ltr'>41708T</span> <span class='ocrx_word' id='word_1_165' title='bbox 1027 1094 1163 1119; x_wconf 84' lang='eng' dir='ltr'>(AJ249326)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 569 1128 1090 1155; baseline 0 -5"><span class='ocrx_word' id='word_1_166' title='bbox 569 1130 592 1150; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_167' title='bbox 604 1135 731 1155; x_wconf 84' lang='eng' dir='ltr'>europaeus</span> <span class='ocrx_word' id='word_1_168' title='bbox 740 1130 816 1150; x_wconf 89' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_169' title='bbox 827 1130 900 1150; x_wconf 86' lang='eng'>32789</span> <span class='ocrx_word' id='word_1_170' title='bbox 909 1128 938 1150; x_wconf 75' lang='eng' dir='ltr'>N</span> <span class='ocrx_word' id='word_1_171' title='bbox 945 1130 1090 1155; x_wconf 87' lang='eng' dir='ltr'>(AM084230)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 570 412 572 450">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 570 412 572 450">
+     <span class='ocr_line' id='line_1_42' title="bbox 570 412 572 450; baseline 0 884"><span class='ocrx_word' id='word_1_172' title='bbox 570 412 572 450; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 301 1164 1061 1265">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 301 1164 1061 1265">
+     <span class='ocr_line' id='line_1_43' title="bbox 469 1164 1061 1192; baseline -0.002 -5"><span class='ocrx_word' id='word_1_173' title='bbox 469 1167 492 1186; x_wconf 96' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_174' title='bbox 503 1167 561 1187; x_wconf 86' lang='eng' dir='ltr'><em>neuii</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 569 1167 644 1192; x_wconf 85' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_176' title='bbox 656 1167 759 1187; x_wconf 78' lang='eng' dir='ltr'>anitratus</span> <span class='ocrx_word' id='word_1_177' title='bbox 768 1166 825 1187; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_178' title='bbox 835 1164 905 1187; x_wconf 84' lang='eng' dir='ltr'>8577T</span> <span class='ocrx_word' id='word_1_179' title='bbox 915 1167 1061 1192; x_wconf 82' lang='eng' dir='ltr'>(AM084229)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 395 1201 1012 1228; baseline 0.005 -8"><span class='ocrx_word' id='word_1_180' title='bbox 395 1201 437 1221; x_wconf 93' lang='eng'>100</span> <span class='ocrx_word' id='word_1_181' title='bbox 470 1203 493 1223; x_wconf 96' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_182' title='bbox 504 1203 562 1223; x_wconf 86' lang='eng' dir='ltr'><em>neuii</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 570 1203 646 1228; x_wconf 84' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_184' title='bbox 656 1203 714 1223; x_wconf 90' lang='eng' dir='ltr'><em>neuii</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 723 1203 778 1223; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_186' title='bbox 790 1201 1012 1228; x_wconf 43' lang='eng' dir='ltr'>85761(AM084228)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 301 1237 932 1265; baseline 0 -5"><span class='ocrx_word' id='word_1_187' title='bbox 301 1240 447 1260; x_wconf 85' lang='eng' dir='ltr'><em>Varibaculum</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 457 1240 595 1260; x_wconf 79' lang='eng' dir='ltr'>cambn&#39;ense</span> <span class='ocrx_word' id='word_1_189' title='bbox 605 1239 682 1260; x_wconf 86' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_190' title='bbox 691 1237 777 1260; x_wconf 78' lang='eng' dir='ltr'>44998T</span> <span class='ocrx_word' id='word_1_191' title='bbox 787 1240 932 1265; x_wconf 88' lang='eng' dir='ltr'>(AM084231)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001529-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001529-0-000.pbm.png
new file mode 100644
index 00000000..1cbac7f3
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001529-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001529-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001529-0-000.pbm.png.hocr
new file mode 100644
index 00000000..6580046c
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001529-0-000.pbm.png.hocr
@@ -0,0 +1,164 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001529-0-000.pbm.png"; bbox 0 0 1420 1054; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 3 18 631 1033">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 3 18 631 1033">
+     <span class='ocr_line' id='line_1_1' title="bbox 392 18 473 92; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 392 18 473 92; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 348 92 469 163; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 348 92 469 163; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 339 163 513 236; baseline 0 -37"><span class='ocrx_word' id='word_1_3' title='bbox 339 163 513 236; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 339 236 455 275; baseline 0 779"><span class='ocrx_word' id='word_1_4' title='bbox 339 236 455 275; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 256 275 436 306; baseline 0 748"><span class='ocrx_word' id='word_1_5' title='bbox 256 275 436 306; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 256 306 491 345; baseline 0 709"><span class='ocrx_word' id='word_1_6' title='bbox 256 306 491 345; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 252 345 517 416; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 252 345 517 416; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 177 416 475 459; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 177 416 475 459; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 177 459 517 488; baseline 0 566"><span class='ocrx_word' id='word_1_9' title='bbox 177 459 517 488; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 177 488 475 531; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 177 488 475 531; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 3 531 454 567; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 3 531 454 567; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 3 567 424 595; baseline 0 459"><span class='ocrx_word' id='word_1_12' title='bbox 3 567 424 595; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 7 595 424 635; baseline 0 419"><span class='ocrx_word' id='word_1_13' title='bbox 7 595 424 635; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 3 635 463 676; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 3 635 463 676; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 3 676 631 710; baseline 0 344"><span class='ocrx_word' id='word_1_15' title='bbox 3 676 631 710; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 3 710 584 746; baseline 0.003 -2"><span class='ocrx_word' id='word_1_16' title='bbox 3 710 584 746; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 3 746 543 853; baseline 0.013 -6"><span class='ocrx_word' id='word_1_17' title='bbox 3 746 543 853; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 7 853 532 884; baseline 0 170"><span class='ocrx_word' id='word_1_18' title='bbox 7 853 532 884; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 3 884 532 928; baseline 0 0"><span class='ocrx_word' id='word_1_19' title='bbox 3 884 532 928; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 3 993 14 1033; baseline 0 21"><span class='ocrx_word' id='word_1_20' title='bbox 3 993 14 1033; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 464 6 1141 220">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 464 6 1141 220">
+     <span class='ocr_line' id='line_1_21' title="bbox 473 6 1120 40; baseline 0 -7"><span class='ocrx_word' id='word_1_21' title='bbox 473 10 627 33; x_wconf 78' lang='eng' dir='ltr'><em>Pedobactcr</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 640 10 764 40; x_wconf 61' lang='eng' dir='ltr'><em>afficanus</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 777 10 847 33; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_24' title='bbox 860 6 955 33; x_wconf 90' lang='eng' dir='ltr'><em>12126T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 964 10 1120 39; x_wconf 87' lang='eng' dir='ltr'>(AJ438171)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 470 43 1062 76; baseline 0 -6"><span class='ocrx_word' id='word_1_26' title='bbox 470 46 623 70; x_wconf 67' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 635 49 706 70; x_wconf 77' lang='eng' dir='ltr'><em>caeni</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 718 47 789 70; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_29' title='bbox 800 43 898 70; x_wconf 83' lang='eng' dir='ltr'><em>22862T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 906 47 1062 76; x_wconf 86' lang='eng' dir='ltr'>(AJ786798)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 469 79 1141 112; baseline -0.001 -6"><span class='ocrx_word' id='word_1_31' title='bbox 469 82 622 106; x_wconf 74' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 631 84 804 112; x_wconf 73' lang='eng' dir='ltr'><em>panaciterrae</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 819 82 888 106; x_wconf 87' lang='eng' dir='ltr'>Gsoil</span> <span class='ocrx_word' id='word_1_34' title='bbox 901 79 964 106; x_wconf 91' lang='eng' dir='ltr'><em>042T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 975 83 1141 111; x_wconf 80' lang='eng' dir='ltr'>(ABZ45368)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 473 114 1112 147; baseline -0.002 -6"><span class='ocrx_word' id='word_1_36' title='bbox 473 117 625 141; x_wconf 74' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 638 117 770 147; x_wconf 68' lang='eng' dir='ltr'><em>hepal‘irzus</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 783 118 853 141; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_39' title='bbox 863 114 945 141; x_wconf 83' lang='eng' dir='ltr'><em>2366T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 956 118 1112 146; x_wconf 83' lang='eng' dir='ltr'>(AJ438172)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 464 150 1125 183; baseline -0.002 -6"><span class='ocrx_word' id='word_1_41' title='bbox 464 153 617 177; x_wconf 71' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 628 153 790 183; x_wconf 73' lang='eng' dir='ltr'><em>ginsengiso/i</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 804 153 872 177; x_wconf 83' lang='eng' dir='ltr'>Gsoil</span> <span class='ocrx_word' id='word_1_44' title='bbox 888 150 948 177; x_wconf 86' lang='eng' dir='ltr'><em>104T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 960 154 1125 183; x_wconf 87' lang='eng' dir='ltr'>(AB24537I)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 513 187 1053 220; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 513 191 666 214; x_wconf 79' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 680 191 773 214; x_wconf 72' lang='eng' dir='ltr'><em>insulae</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 785 187 886 214; x_wconf 86' lang='eng' dir='ltr'><em>DS-39T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 895 191 1053 220; x_wconf 85' lang='eng' dir='ltr'>(EF100697)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 455 221 1184 290">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 455 221 1184 290">
+     <span class='ocr_line' id='line_1_27' title="bbox 455 221 1184 257; baseline 0 -7"><span class='ocrx_word' id='word_1_50' title='bbox 455 221 498 244; x_wconf 70' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 508 227 750 257; x_wconf 62' lang='eng' dir='ltr'><em>Splzingobaclerium</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 766 229 925 250; x_wconf 74' lang='eng' dir='ltr'><em>antarcticum</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 940 227 1016 250; x_wconf 87' lang='eng' dir='ltr'>6BlY</span> <span class='ocrx_word' id='word_1_54' title='bbox 1027 228 1071 255; x_wconf 82' lang='eng' dir='ltr'>(AJ</span> <span class='ocrx_word' id='word_1_55' title='bbox 1076 227 1184 255; x_wconf 85' lang='eng'>576248)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 505 257 1128 290; baseline -0.002 -6"><span class='ocrx_word' id='word_1_56' title='bbox 505 260 656 284; x_wconf 77' lang='eng' dir='ltr'><em>Pedabacter</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 667 263 770 290; x_wconf 76' lang='eng' dir='ltr'><em>piscium</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 783 261 853 284; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_59' title='bbox 869 261 873 283; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 885 257 958 284; x_wconf 88' lang='eng' dir='ltr'><em>1725T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 972 261 1128 290; x_wconf 88' lang='eng' dir='ltr'>(AJ438174)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 424 294 1414 759">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 424 294 1164 653">
+     <span class='ocr_line' id='line_1_29' title="bbox 491 294 1164 328; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 491 298 644 322; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 656 300 803 328; x_wconf 77' lang='eng' dir='ltr'><em>cryocom‘tis</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 816 298 887 322; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_65' title='bbox 901 294 996 322; x_wconf 81' lang='eng' dir='ltr'><em>14825T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 1007 298 1164 328; x_wconf 84' lang='eng' dir='ltr'>(AJ438170)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 522 331 1154 365; baseline -0.002 -7"><span class='ocrx_word' id='word_1_67' title='bbox 522 334 674 358; x_wconf 79' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 687 334 859 365; x_wconf 76' lang='eng' dir='ltr'><em>lzimalayensis</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 872 331 986 358; x_wconf 76' lang='eng' dir='ltr'><em>HHSZ2T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 997 335 1154 364; x_wconf 77' lang='eng' dir='ltr'>(A.1583425)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 518 367 1085 400; baseline -0.002 -6"><span class='ocrx_word' id='word_1_71' title='bbox 518 370 651 394; x_wconf 75' lang='eng' dir='ltr'><em>edabacter</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 663 370 778 400; x_wconf 78' lang='eng' dir='ltr'><em>aquatilis</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 792 367 901 394; x_wconf 80' lang='eng' dir='ltr'><em>ARlO7T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 913 371 987 399; x_wconf 88' lang='eng' dir='ltr'>(AMI</span> <span class='ocrx_word' id='word_1_75' title='bbox 999 371 1085 400; x_wconf 87' lang='eng'>14396)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 475 404 1058 436; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 475 407 628 431; x_wconf 76' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 640 415 725 431; x_wconf 72' lang='eng' dir='ltr'><em>roseus</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 738 404 880 431; x_wconf 75' lang='eng' dir='ltr'><em>CL-GP80T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 890 408 959 436; x_wconf 86' lang='eng' dir='ltr'>(DQl</span> <span class='ocrx_word' id='word_1_80' title='bbox 970 408 1058 436; x_wconf 88' lang='eng'>12353)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 517 439 1117 472; baseline 0 -6"><span class='ocrx_word' id='word_1_81' title='bbox 517 443 671 466; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 682 445 832 466; x_wconf 59' lang='eng' dir='ltr'><em>suwonensz’s</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 850 439 938 466; x_wconf 82' lang='eng' dir='ltr'><em>15-52T</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 949 443 1117 472; x_wconf 84' lang='eng' dir='ltr'>(DQ097274)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 517 475 1155 508; baseline 0 -6"><span class='ocrx_word' id='word_1_85' title='bbox 517 479 670 502; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacrer</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 682 479 860 502; x_wconf 71' lang='eng' dir='ltr'><em>sandarakinus</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 875 475 976 502; x_wconf 87' lang='eng' dir='ltr'><em>DS-27T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 987 479 1155 508; x_wconf 85' lang='eng' dir='ltr'>(DQ235228)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 475 512 1038 544; baseline -0.002 -6"><span class='ocrx_word' id='word_1_89' title='bbox 475 514 627 538; x_wconf 75' lang='eng' dir='ltr'><em>Pedabacrer</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 640 514 755 538; x_wconf 77' lang='eng' dir='ltr'><em>terrico/a</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 767 512 868 538; x_wconf 87' lang='eng' dir='ltr'><em>DS-45T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 879 515 1038 544; x_wconf 86' lang='eng' dir='ltr'>(EF446147)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 454 547 979 579; baseline -0.002 -5"><span class='ocrx_word' id='word_1_93' title='bbox 454 550 606 574; x_wconf 75' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 619 550 697 574; x_wconf 78' lang='eng' dir='ltr'><em>lentus</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 708 547 809 574; x_wconf 88' lang='eng' dir='ltr'><em>DS-40T</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 820 551 979 579; x_wconf 85' lang='eng' dir='ltr'>(EF446146)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 424 584 1094 618; baseline -0.001 -7"><span class='ocrx_word' id='word_1_97' title='bbox 424 587 579 611; x_wconf 82' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 591 587 793 618; x_wconf 78' lang='eng' dir='ltr'><em>(laechungensis</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 807 587 861 610; x_wconf 86' lang='eng' dir='ltr'><em>Dae</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 873 584 918 610; x_wconf 83' lang='eng' dir='ltr'><em>13T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 929 587 1094 616; x_wconf 88' lang='eng' dir='ltr'>(AB267722)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 463 620 1078 653; baseline -0.002 -6"><span class='ocrx_word' id='word_1_102' title='bbox 463 623 615 647; x_wconf 77' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 627 623 720 647; x_wconf 74' lang='eng' dir='ltr'><em>salrans</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 732 624 802 647; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_105' title='bbox 817 620 910 647; x_wconf 91' lang='eng' dir='ltr'><em>12145T</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 922 624 1078 653; x_wconf 85' lang='eng' dir='ltr'>(AJ438173)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 584 658 1414 759">
+     <span class='ocr_line' id='line_1_39' title="bbox 757 658 1262 691; baseline 0 -6"><span class='ocrx_word' id='word_1_107' title='bbox 757 661 907 685; x_wconf 77' lang='eng' dir='ltr'><em>Olivibacter</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 921 664 976 685; x_wconf 77' lang='eng' dir='ltr'><em>itius</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 987 658 1083 685; x_wconf 89' lang='eng' dir='ltr'><em>AW-6T</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 1095 662 1262 691; x_wconf 88' lang='eng' dir='ltr'>(DQ421387)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 631 693 1262 727; baseline 0 -7"><span class='ocrx_word' id='word_1_111' title='bbox 631 696 847 727; x_wconf 76' lang='eng' dir='ltr'><em>Parapedobacler</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 861 696 984 720; x_wconf 79' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 997 693 1083 727; x_wconf 86' lang='eng' dir='ltr'><em>Jipl4T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1095 697 1262 726; x_wconf 84' lang='eng' dir='ltr'>(DQ680836)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 584 726 1414 759; baseline 0 -6"><span class='ocrx_word' id='word_1_115' title='bbox 584 729 920 759; x_wconf 75' lang='eng' dir='ltr'><em>Pseudosphingobacterium</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 937 729 1093 753; x_wconf 67' lang='eng' dir='ltr'><em>domesticum</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1108 726 1230 753; x_wconf 88' lang='eng' dir='ltr'><em>DC-186T</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 1242 730 1414 759; x_wconf 87' lang='eng' dir='ltr'>(AM407725)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 378 762 1368 1048">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 506 762 1300 977">
+     <span class='ocr_line' id='line_1_42' title="bbox 522 762 1249 795; baseline 0 -7"><span class='ocrx_word' id='word_1_119' title='bbox 522 765 764 795; x_wconf 66' lang='eng' dir='ltr'><em>Sphingobuclerium</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 780 765 943 795; x_wconf 76' lang='eng' dir='ltr'><em>daejeonense</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 958 762 1075 788; x_wconf 58' lang='eng' dir='ltr'>&#39;1&#39;R6-04T</span> <span class='ocrx_word' id='word_1_122' title='bbox 1083 765 1249 794; x_wconf 81' lang='eng' dir='ltr'>(ABZ49372)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 527 797 1246 831; baseline 0 -7"><span class='ocrx_word' id='word_1_123' title='bbox 527 801 769 831; x_wconf 72' lang='eng' dir='ltr'><em>Sphingobactcrium</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 785 803 892 824; x_wconf 77' lang='eng' dir='ltr'><em>mizumii</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 904 801 974 824; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_126' title='bbox 988 797 1246 830; x_wconf 73' lang='eng' dir='ltr'>11724T(AJ438175)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 544 835 1182 868; baseline 0 -7"><span class='ocrx_word' id='word_1_127' title='bbox 544 838 771 868; x_wconf 72' lang='eng' dir='ltr'><em>phl’ngobacterium</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 787 840 907 868; x_wconf 77' lang='eng' dir='ltr'><em>composri</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 919 835 1011 861; x_wconf 91' lang='eng' dir='ltr'><em>4M24T</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 1023 839 1070 867; x_wconf 89' lang='eng' dir='ltr'><em>(EF</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 1077 838 1182 865; x_wconf 88' lang='eng'>122436)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 532 870 1294 904; baseline -0.001 -7"><span class='ocrx_word' id='word_1_132' title='bbox 532 873 775 904; x_wconf 73' lang='eng' dir='ltr'><em>Sphingobacterl’um</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 789 875 953 904; x_wconf 75' lang='eng' dir='ltr'><em>spiritivomm</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 968 874 1038 897; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_135' title='bbox 1048 870 1129 897; x_wconf 85' lang='eng' dir='ltr'><em>2582T</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 1138 874 1294 903; x_wconf 86' lang='eng' dir='ltr'>(AJ459411)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 540 907 1262 940; baseline 0 -7"><span class='ocrx_word' id='word_1_137' title='bbox 540 910 902 940; x_wconf 70' lang='eng' dir='ltr'><em>Sphingobaclerhtmfaecium</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 915 910 985 933; x_wconf 85' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_139' title='bbox 1000 907 1090 933; x_wconf 36' lang='eng'><em>11690&#39;1</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 1105 910 1262 938; x_wconf 83' lang='eng' dir='ltr'>(AJ438176)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 506 944 1300 977; baseline -0.001 -6"><span class='ocrx_word' id='word_1_141' title='bbox 506 947 748 977; x_wconf 75' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 765 947 940 977; x_wconf 75' lang='eng' dir='ltr'><em>I‘halpophi/um</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 955 948 1025 971; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_144' title='bbox 1040 944 1130 971; x_wconf 83' lang='eng' dir='ltr'><em>11723T</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 1144 948 1300 977; x_wconf 87' lang='eng' dir='ltr'>(AJ438177)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 378 980 1368 1048">
+     <span class='ocr_line' id='line_1_48' title="bbox 378 980 1289 1011; baseline 0 -6"><span class='ocrx_word' id='word_1_146' title='bbox 378 987 408 1010; x_wconf 82' lang='eng'>98</span> <span class='ocrx_word' id='word_1_147' title='bbox 518 981 761 1011; x_wconf 76' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 776 981 928 1005; x_wconf 75' lang='eng' dir='ltr'><em>multivorum</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 944 982 1003 1004; x_wconf 89' lang='eng' dir='ltr'><em>1AM</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 1019 980 1289 1010; x_wconf 72' lang='eng' dir='ltr'>14316T(A13100738)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 753 1015 1368 1048; baseline 0 -6"><span class='ocrx_word' id='word_1_151' title='bbox 753 1018 910 1042; x_wconf 75' lang='eng' dir='ltr'><em>Bacteroides</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 918 1018 1019 1048; x_wconf 75' lang='eng' dir='ltr'><em>fragilis</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 1031 1019 1101 1042; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_154' title='bbox 1111 1015 1191 1042; x_wconf 86' lang='eng' dir='ltr'><em>2151T</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 1203 1019 1368 1047; x_wconf 87' lang='eng' dir='ltr'>(AB050106)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 59 117 114 140">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 59 117 114 140">
+     <span class='ocr_line' id='line_1_50' title="bbox 59 117 114 140; baseline -0.018 0"><span class='ocrx_word' id='word_1_156' title='bbox 59 117 114 140; x_wconf 88' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 295 261 338 284">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 295 261 338 284">
+     <span class='ocr_line' id='line_1_51' title="bbox 295 261 338 284; baseline 0.023 -1"><span class='ocrx_word' id='word_1_157' title='bbox 295 261 338 284; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 219 392 249 415">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 219 392 249 415">
+     <span class='ocr_line' id='line_1_52' title="bbox 219 392 249 415; baseline 0 0"><span class='ocrx_word' id='word_1_158' title='bbox 219 392 249 415; x_wconf 86' lang='eng'><em>86</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 10 1027 756 1029">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 10 1027 756 1029">
+     <span class='ocr_line' id='line_1_53' title="bbox 10 1027 756 1029; baseline 0 25"><span class='ocrx_word' id='word_1_159' title='bbox 10 1027 756 1029; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001537-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001537-0-001.pbm.png
new file mode 100644
index 00000000..c04865c5
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001537-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001537-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001537-0-001.pbm.png.hocr
new file mode 100644
index 00000000..63de0b1d
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001537-0-001.pbm.png.hocr
@@ -0,0 +1,271 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001537-0-001.pbm.png"; bbox 0 0 1242 840; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 63 0 120 23">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 63 0 120 23">
+     <span class='ocr_line' id='line_1_1' title="bbox 63 0 120 23; baseline -0.018 0"><span class='ocrx_word' id='word_1_1' title='bbox 63 0 120 23; x_wconf 88' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 317 75 1069 148">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 317 75 1069 148">
+     <span class='ocr_line' id='line_1_2' title="bbox 352 75 1069 105; baseline 0.001 -7"><span class='ocrx_word' id='word_1_2' title='bbox 352 76 576 98; x_wconf 87' lang='eng' dir='ltr'><em>Desulfuromonas</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 586 76 750 105; x_wconf 85' lang='eng' dir='ltr'><em>acetexigens</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 767 76 831 99; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 846 75 923 99; x_wconf 80' lang='eng' dir='ltr'><em>1397T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 943 76 1069 105; x_wconf 82' lang='eng' dir='ltr'>(U23140)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 317 119 1001 148; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 317 119 548 142; x_wconf 79' lang='eng' dir='ltr'><em>Desulfuromonas</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 557 119 757 148; x_wconf 77' lang='eng' dir='ltr'><em>michiganensis’</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 773 120 824 142; x_wconf 91' lang='eng' dir='ltr'><em>BB1</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 840 120 1001 148; x_wconf 87' lang='eng' dir='ltr'>(AF357915)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 118 109 177 110">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 118 109 177 110">
+     <span class='ocr_line' id='line_1_4' title="bbox 118 109 177 110; baseline 0 730"><span class='ocrx_word' id='word_1_11' title='bbox 118 109 177 110; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 175 87 177 132">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 175 87 177 132">
+     <span class='ocr_line' id='line_1_5' title="bbox 175 87 177 132; baseline 0 708"><span class='ocrx_word' id='word_1_12' title='bbox 175 87 177 132; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 37 142 120 144">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 37 142 120 144">
+     <span class='ocr_line' id='line_1_6' title="bbox 37 142 120 144; baseline 0 696"><span class='ocrx_word' id='word_1_13' title='bbox 37 142 120 144; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 20 197 39 199">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 20 197 39 199">
+     <span class='ocr_line' id='line_1_7' title="bbox 20 197 39 199; baseline 0 641"><span class='ocrx_word' id='word_1_14' title='bbox 20 197 39 199; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 37 142 39 252">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 37 142 39 252">
+     <span class='ocr_line' id='line_1_8' title="bbox 37 142 39 252; baseline 0 588"><span class='ocrx_word' id='word_1_15' title='bbox 37 142 39 252; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 118 109 119 175">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 118 109 119 175">
+     <span class='ocr_line' id='line_1_9' title="bbox 118 109 119 175; baseline 0 665"><span class='ocrx_word' id='word_1_16' title='bbox 118 109 119 175; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 323 161 1006 234">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 323 161 1006 234">
+     <span class='ocr_line' id='line_1_10' title="bbox 327 161 1006 190; baseline -0.001 -5"><span class='ocrx_word' id='word_1_17' title='bbox 327 162 551 185; x_wconf 84' lang='eng' dir='ltr'><em>Desulfuromonas</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 561 163 760 185; x_wconf 83' lang='eng' dir='ltr'><em>Chloroethenica</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 773 161 860 184; x_wconf 91' lang='eng' dir='ltr'><em>TT4BT</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 880 162 1006 190; x_wconf 88' lang='eng' dir='ltr'>(U49748)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 323 204 935 234; baseline -0.002 -6"><span class='ocrx_word' id='word_1_21' title='bbox 323 206 472 228; x_wconf 83' lang='eng' dir='ltr'><em>Pelobacter</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 480 206 642 228; x_wconf 82' lang='eng' dir='ltr'><em>carbinolicus</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 668 205 717 228; x_wconf 87' lang='eng' dir='ltr'><em>Gra</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 730 204 794 228; x_wconf 83' lang='eng' dir='ltr'><em>Bd1T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 811 205 935 234; x_wconf 84' lang='eng' dir='ltr'>(X79413)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 37 250 125 252">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 37 250 125 252">
+     <span class='ocr_line' id='line_1_12' title="bbox 37 250 125 252; baseline 0 588"><span class='ocrx_word' id='word_1_26' title='bbox 37 250 125 252; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 20 197 21 381">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 20 197 21 381">
+     <span class='ocr_line' id='line_1_13' title="bbox 20 197 21 381; baseline 0 459"><span class='ocrx_word' id='word_1_27' title='bbox 20 197 21 381; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 20 380 49 381">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 20 380 49 381">
+     <span class='ocr_line' id='line_1_14' title="bbox 20 380 49 381; baseline 0 459"><span class='ocrx_word' id='word_1_28' title='bbox 20 380 49 381; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 47 347 49 413">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 47 347 49 413">
+     <span class='ocr_line' id='line_1_15' title="bbox 47 347 49 413; baseline 0 427"><span class='ocrx_word' id='word_1_29' title='bbox 47 347 49 413; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 190 247 1156 407">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 190 247 1156 407">
+     <span class='ocr_line' id='line_1_16' title="bbox 190 247 941 278; baseline 0 -7"><span class='ocrx_word' id='word_1_30' title='bbox 190 260 306 262; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_31' title='bbox 317 249 466 271; x_wconf 81' lang='eng' dir='ltr'><em>Pelobacter</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 474 249 642 278; x_wconf 83' lang='eng' dir='ltr'><em>acetylenicus</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 661 249 758 277; x_wconf 83' lang='eng' dir='ltr'>WoAcy</span> <span class='ocrx_word' id='word_1_34' title='bbox 771 247 797 271; x_wconf 83' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 816 249 941 277; x_wconf 86' lang='eng' dir='ltr'>(X70955)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 307 292 928 322; baseline 0.002 -7"><span class='ocrx_word' id='word_1_36' title='bbox 307 292 456 315; x_wconf 81' lang='eng' dir='ltr'><em>Pelobacter</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 465 292 612 315; x_wconf 84' lang='eng' dir='ltr'><em>venetianus</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 630 293 694 316; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 706 292 786 316; x_wconf 78' lang='eng' dir='ltr'><em>2394T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 802 294 928 322; x_wconf 87' lang='eng' dir='ltr'>(U41562)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 337 334 977 364; baseline -0.002 -6"><span class='ocrx_word' id='word_1_41' title='bbox 337 335 561 358; x_wconf 86' lang='eng' dir='ltr'><em>Desulfuromonas</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 569 336 700 364; x_wconf 79' lang='eng' dir='ltr'><em>palm/tatis</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 721 334 834 357; x_wconf 89' lang='eng' dir='ltr'><em>SDBY1T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 851 335 977 363; x_wconf 86' lang='eng' dir='ltr'><em>(U28172)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 438 377 1156 407; baseline 0 -6"><span class='ocrx_word' id='word_1_45' title='bbox 438 379 653 401; x_wconf 83' lang='eng' dir='ltr'><em>Geoalkalibacter</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 660 379 843 407; x_wconf 80' lang='eng' dir='ltr'><em>ferr/hydriticus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 860 377 969 401; x_wconf 85' lang='eng' dir='ltr'><em>2-0531T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 989 378 1156 407; x_wconf 80' lang='eng' dir='ltr'><em>(DQ309326)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 124 217 125 283">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 124 217 125 283">
+     <span class='ocr_line' id='line_1_20' title="bbox 124 217 125 283; baseline 0 557"><span class='ocrx_word' id='word_1_49' title='bbox 124 217 125 283; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 124 282 190 283">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 124 282 190 283">
+     <span class='ocr_line' id='line_1_21' title="bbox 124 282 190 283; baseline 0 557"><span class='ocrx_word' id='word_1_50' title='bbox 124 282 190 283; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 189 260 190 305">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 189 260 190 305">
+     <span class='ocr_line' id='line_1_22' title="bbox 189 260 190 305; baseline 0 535"><span class='ocrx_word' id='word_1_51' title='bbox 189 260 190 305; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 190 303 296 305">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 190 303 296 305">
+     <span class='ocr_line' id='line_1_23' title="bbox 190 303 296 305; baseline 0 535"><span class='ocrx_word' id='word_1_52' title='bbox 190 303 296 305; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 47 411 275 413">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 47 411 275 413">
+     <span class='ocr_line' id='line_1_24' title="bbox 47 411 275 413; baseline 0 427"><span class='ocrx_word' id='word_1_53' title='bbox 47 411 275 413; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 273 390 275 434">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 273 390 275 434">
+     <span class='ocr_line' id='line_1_25' title="bbox 273 390 275 434; baseline 0 406"><span class='ocrx_word' id='word_1_54' title='bbox 273 390 275 434; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 466 419 1242 495">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 466 419 1242 495">
+     <span class='ocr_line' id='line_1_26' title="bbox 530 419 1242 449; baseline 0 -7"><span class='ocrx_word' id='word_1_55' title='bbox 530 420 761 442; x_wconf 85' lang='eng' dir='ltr'><em>Geoalkalibacter</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 768 420 963 442; x_wconf 86' lang='eng' dir='ltr'><em>subterraneus</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 978 419 1061 443; x_wconf 81' lang='eng' dir='ltr'><em>Red1T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1078 420 1242 449; x_wconf 89' lang='eng' dir='ltr'>(EU182247)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 466 465 990 495; baseline 0.004 -7"><span class='ocrx_word' id='word_1_59' title='bbox 466 465 755 493; x_wconf 85' lang='eng' dir='ltr'><em>Geobacterpelophilus</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 780 466 848 489; x_wconf 88' lang='eng' dir='ltr'><em>Dfr2T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 864 467 990 495; x_wconf 86' lang='eng' dir='ltr'><em>(U96918)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 12 519 485 521">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 12 519 485 521">
+     <span class='ocr_line' id='line_1_28' title="bbox 12 519 485 521; baseline 0 319"><span class='ocrx_word' id='word_1_62' title='bbox 12 519 485 521; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 12 736 14 802">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 12 736 14 802">
+     <span class='ocr_line' id='line_1_29' title="bbox 12 736 14 802; baseline 0 38"><span class='ocrx_word' id='word_1_63' title='bbox 12 736 14 802; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 365 508 1184 798">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 497 508 1057 538">
+     <span class='ocr_line' id='line_1_30' title="bbox 497 508 1057 538; baseline 0.004 -7"><span class='ocrx_word' id='word_1_64' title='bbox 497 508 786 537; x_wconf 80' lang='eng' dir='ltr'><em>Geobacterpickeringii</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 804 509 873 533; x_wconf 89' lang='eng' dir='ltr'><em>G13T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 890 510 1057 538; x_wconf 89' lang='eng' dir='ltr'><em>(DQ145535)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 590 552 1175 582">
+     <span class='ocr_line' id='line_1_31' title="bbox 590 552 1175 582; baseline 0.005 -8"><span class='ocrx_word' id='word_1_67' title='bbox 590 552 734 574; x_wconf 82' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 741 552 943 574; x_wconf 87' lang='eng' dir='ltr'><em>sulfurreducens</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 958 552 1032 576; x_wconf 92' lang='eng' dir='ltr'><em>PCAT</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1048 554 1175 582; x_wconf 87' lang='eng' dir='ltr'>(U13928)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 519 595 1115 625">
+     <span class='ocr_line' id='line_1_32' title="bbox 519 595 1115 625; baseline 0.005 -8"><span class='ocrx_word' id='word_1_71' title='bbox 519 595 663 617; x_wconf 86' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 670 595 896 623; x_wconf 87' lang='eng' dir='ltr'><em>hydrogenophilus</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 913 596 972 619; x_wconf 74' lang='eng' dir='ltr'><em>H-2T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 989 597 1115 625; x_wconf 89' lang='eng' dir='ltr'>(U28173)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 519 638 1116 668">
+     <span class='ocr_line' id='line_1_33' title="bbox 519 638 1116 668; baseline 0.003 -7"><span class='ocrx_word' id='word_1_75' title='bbox 519 649 530 651; x_wconf 52' lang='eng'><em>»</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 542 638 801 667; x_wconf 79' lang='eng' dir='ltr'><em>Geobactergrbiciae</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 817 639 939 663; x_wconf 89' lang='eng' dir='ltr'><em>TACP-2T</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 955 640 1116 668; x_wconf 89' lang='eng' dir='ltr'>(AF335182)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 519 681 1171 712">
+     <span class='ocr_line' id='line_1_34' title="bbox 519 681 1171 712; baseline 0.005 -8"><span class='ocrx_word' id='word_1_79' title='bbox 519 692 540 694; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_80' title='bbox 552 681 697 704; x_wconf 87' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 704 681 919 704; x_wconf 86' lang='eng' dir='ltr'><em>metal/ireducens</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 934 682 1034 706; x_wconf 91' lang='eng' dir='ltr'><em>GS-15T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1050 683 1171 712; x_wconf 86' lang='eng' dir='ltr'>(L07834)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 365 725 1184 798">
+     <span class='ocr_line' id='line_1_35' title="bbox 365 725 1022 755; baseline 0.005 -8"><span class='ocrx_word' id='word_1_84' title='bbox 365 725 606 747; x_wconf 79' lang='eng' dir='ltr'><em>Geothermobacter</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 614 725 718 747; x_wconf 83' lang='eng' dir='ltr'><em>ehrlichii</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 739 725 843 749; x_wconf 83' lang='eng' dir='ltr'><em>88015T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 859 727 1022 755; x_wconf 87' lang='eng' dir='ltr'>(AY155599)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 484 767 1184 798; baseline 0.004 -8"><span class='ocrx_word' id='word_1_88' title='bbox 484 767 708 790; x_wconf 86' lang='eng' dir='ltr'><em>Desulfuromonas</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 718 768 882 790; x_wconf 82' lang='eng' dir='ltr'><em>acetoxidans</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 899 769 963 792; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 975 769 1038 792; x_wconf 83' lang='eng' dir='ltr'><em>684T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1055 770 1184 798; x_wconf 89' lang='eng' dir='ltr'><em>(M26634)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 196 476 199 562">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 196 476 199 562">
+     <span class='ocr_line' id='line_1_37' title="bbox 196 476 199 562; baseline 0 278"><span class='ocrx_word' id='word_1_93' title='bbox 196 476 199 562; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 197 561 577 564">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 197 561 577 564">
+     <span class='ocr_line' id='line_1_38' title="bbox 197 561 577 564; baseline 0 276"><span class='ocrx_word' id='word_1_94' title='bbox 197 561 577 564; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 264 519 265 603">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 264 519 265 603">
+     <span class='ocr_line' id='line_1_39' title="bbox 264 519 265 603; baseline 0 237"><span class='ocrx_word' id='word_1_95' title='bbox 264 519 265 603; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 264 602 318 603">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 264 602 318 603">
+     <span class='ocr_line' id='line_1_40' title="bbox 264 602 318 603; baseline 0 237"><span class='ocrx_word' id='word_1_96' title='bbox 264 602 318 603; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 317 563 318 641">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 317 563 318 641">
+     <span class='ocr_line' id='line_1_41' title="bbox 317 563 318 641; baseline 0 199"><span class='ocrx_word' id='word_1_97' title='bbox 317 563 318 641; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 317 639 377 641">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 317 639 377 641">
+     <span class='ocr_line' id='line_1_42' title="bbox 317 639 377 641; baseline 0 199"><span class='ocrx_word' id='word_1_98' title='bbox 317 639 377 641; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 376 606 377 672">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 376 606 377 672">
+     <span class='ocr_line' id='line_1_43' title="bbox 376 606 377 672; baseline 0 168"><span class='ocrx_word' id='word_1_99' title='bbox 376 606 377 672; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 376 671 519 672">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 376 671 519 672">
+     <span class='ocr_line' id='line_1_44' title="bbox 376 671 519 672; baseline 0 168"><span class='ocrx_word' id='word_1_100' title='bbox 376 671 519 672; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 517 649 519 694">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 517 649 519 694">
+     <span class='ocr_line' id='line_1_45' title="bbox 517 649 519 694; baseline 0 146"><span class='ocrx_word' id='word_1_101' title='bbox 517 649 519 694; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 12 800 175 802">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 12 800 175 802">
+     <span class='ocr_line' id='line_1_46' title="bbox 12 800 175 802; baseline 0 38"><span class='ocrx_word' id='word_1_102' title='bbox 12 800 175 802; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 173 779 176 823">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 173 779 176 823">
+     <span class='ocr_line' id='line_1_47' title="bbox 173 779 176 823; baseline 0 17"><span class='ocrx_word' id='word_1_103' title='bbox 173 779 176 823; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 368 810 960 840">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 368 810 960 840">
+     <span class='ocr_line' id='line_1_48' title="bbox 368 810 960 840; baseline 0.002 -7"><span class='ocrx_word' id='word_1_104' title='bbox 368 811 592 833; x_wconf 89' lang='eng' dir='ltr'><em>Desulfuromonas</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 602 811 715 839; x_wconf 83' lang='eng' dir='ltr'><em>thiophila</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 734 810 819 834; x_wconf 87' lang='eng' dir='ltr'><em>N227T</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 836 811 960 840; x_wconf 89' lang='eng' dir='ltr'>(Y11560)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001552-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001552-0-000.pbm.png
new file mode 100644
index 00000000..56ebe098
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001552-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001552-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001552-0-000.pbm.png.hocr
new file mode 100644
index 00000000..e4167840
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001552-0-000.pbm.png.hocr
@@ -0,0 +1,63 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001552-0-000.pbm.png"; bbox 0 0 994 400; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 355 0 875 30">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 355 0 875 30">
+     <span class='ocr_line' id='line_1_1' title="bbox 355 0 875 30; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 355 3 504 24; x_wconf 82' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 513 3 676 24; x_wconf 81' lang='eng' dir='ltr'><em>borkumensis</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 685 0 750 24; x_wconf 84' lang='eng' dir='ltr'><em>8K2T</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 760 3 875 30; x_wconf 83' lang='eng' dir='ltr'><em>(Y12579)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 11 354 387">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 11 354 387">
+     <span class='ocr_line' id='line_1_2' title="bbox 142 11 354 108; baseline 0 -61"><span class='ocrx_word' id='word_1_5' title='bbox 142 11 354 108; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 0 108 337 171; baseline -0.009 0"><span class='ocrx_word' id='word_1_6' title='bbox 0 108 337 171; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 0 171 334 230; baseline -0.006 0"><span class='ocrx_word' id='word_1_7' title='bbox 0 171 334 230; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 0 230 295 290; baseline 0.014 -4"><span class='ocrx_word' id='word_1_8' title='bbox 0 230 295 290; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 0 290 347 387; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 0 290 347 387; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 33 55 815 92">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 33 55 815 92">
+     <span class='ocr_line' id='line_1_7' title="bbox 33 55 815 92; baseline 0.001 -7"><span class='ocrx_word' id='word_1_10' title='bbox 33 55 83 76; x_wconf 76' lang='eng'><em>0-01</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 342 65 491 86; x_wconf 85' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 496 65 605 92; x_wconf 87' lang='eng' dir='ltr'><em>jadensis</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 614 62 658 86; x_wconf 80' lang='eng' dir='ltr'><em>T9T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 669 65 815 91; x_wconf 88' lang='eng' dir='ltr'><em>(AJOO1150)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 207 123 994 338">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 295 123 994 275">
+     <span class='ocr_line' id='line_1_8' title="bbox 337 123 994 153; baseline 0 -6"><span class='ocrx_word' id='word_1_15' title='bbox 337 126 502 147; x_wconf 84' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 511 126 724 153; x_wconf 83' lang='eng' dir='ltr'><em>hongdengensis</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 732 123 832 147; x_wconf 80' lang='eng' dir='ltr'><em>A-11-3T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 841 126 994 153; x_wconf 86' lang='eng' dir='ltr'><em>(EU438901)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 336 185 890 214; baseline 0 -6"><span class='ocrx_word' id='word_1_19' title='bbox 336 187 485 208; x_wconf 83' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 496 187 646 208; x_wconf 82' lang='eng' dir='ltr'><em>venustensis</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 656 185 731 208; x_wconf 89' lang='eng' dir='ltr'><em>|SO4T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 741 187 890 214; x_wconf 88' lang='eng' dir='ltr'><em>(AF328762)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 295 245 876 275; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 295 248 444 269; x_wconf 83' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 453 248 583 269; x_wconf 84' lang='eng' dir='ltr'><em>balearicus</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 594 248 654 269; x_wconf 89' lang='eng' dir='ltr'><em>MAC</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 659 245 715 269; x_wconf 80' lang='eng' dir='ltr'><em>L04T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 726 248 876 275; x_wconf 84' lang='eng' dir='ltr'><em>(AY686709)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 207 303 770 338">
+     <span class='ocr_line' id='line_1_11' title="bbox 207 303 770 338; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 207 303 251 324; x_wconf 76' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 268 311 417 332; x_wconf 83' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 426 311 546 332; x_wconf 85' lang='eng' dir='ltr'><em>dieselo/ei</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 555 309 609 332; x_wconf 85' lang='eng' dir='ltr'><em>B—5T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 619 311 770 338; x_wconf 85' lang='eng' dir='ltr'><em>(AY683537)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 348 370 973 400">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 348 370 973 400">
+     <span class='ocr_line' id='line_1_12' title="bbox 348 370 973 400; baseline -0.002 -6"><span class='ocrx_word' id='word_1_33' title='bbox 348 373 531 394; x_wconf 88' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 541 372 687 394; x_wconf 89' lang='eng' dir='ltr'><em>ﬂuorescens</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 698 373 744 393; x_wconf 92' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 758 370 846 394; x_wconf 87' lang='eng' dir='ltr'><em>12022T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 856 373 973 400; x_wconf 82' lang='eng' dir='ltr'><em>(D84013)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001651-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001651-0-001.pbm.png
new file mode 100644
index 00000000..38945c51
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001651-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001651-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001651-0-001.pbm.png.hocr
new file mode 100644
index 00000000..b8238fb0
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001651-0-001.pbm.png.hocr
@@ -0,0 +1,198 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001651-0-001.pbm.png"; bbox 0 0 1302 1637; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 138 0 1210 92">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 139 0 1210 88">
+     <span class='ocr_line' id='line_1_1' title="bbox 338 0 831 26; baseline 0 -5"><span class='ocrx_word' id='word_1_1' title='bbox 338 3 505 21; x_wconf 82' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 514 3 631 21; x_wconf 85' lang='eng' dir='ltr'><em>chacoense</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 640 0 697 21; x_wconf 83' lang='eng' dir='ltr'><em>PR5T</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 706 3 831 26; x_wconf 85' lang='eng' dir='ltr'>(AJ278249)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 139 32 967 69; baseline 0 -17"><span class='ocrx_word' id='word_1_5' title='bbox 139 53 149 69; x_wconf 76' lang='eng'>0</span> <span class='ocrx_word' id='word_1_6' title='bbox 159 53 180 69; x_wconf 69' lang='eng'><em>10</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 366 34 573 52; x_wconf 80' lang='eng' dir='ltr'><em>Pseudaminobacter</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 579 34 751 57; x_wconf 76' lang='eng' dir='ltr'><em>salicylatoxidans</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 760 32 830 52; x_wconf 90' lang='eng' dir='ltr'><em>BN12T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 839 34 967 57; x_wconf 87' lang='eng' dir='ltr'>(AF072542)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 152 63 1210 88; baseline 0.002 -6"><span class='ocrx_word' id='word_1_11' title='bbox 152 66 154 69; x_wconf 91' lang='eng'>&#39;</span> <span class='ocrx_word' id='word_1_12' title='bbox 335 65 501 83; x_wconf 80' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 509 65 675 83; x_wconf 78' lang='eng' dir='ltr'><em>mediterraneum</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 684 65 735 83; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 746 63 822 83; x_wconf 78' lang='eng' dir='ltr'><em>11555T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 831 65 928 88; x_wconf 87' lang='eng' dir='ltr'>(L38825)</span> <span class='ocrx_word' id='word_1_17' title='bbox 1069 67 1210 87; x_wconf 84' lang='eng' dir='ltr'><em>Rhizobiales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 117 78 201 83">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 117 78 201 83">
+     <span class='ocr_line' id='line_1_4' title="bbox 117 78 201 83; baseline 0 1554"><span class='ocrx_word' id='word_1_18' title='bbox 117 78 201 83; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 222 90 1302 1637">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 344 95 918 151">
+     <span class='ocr_line' id='line_1_5' title="bbox 344 95 918 120; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 344 97 518 120; x_wconf 78' lang='eng' dir='ltr'><em>PhyI/obacterium</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 526 97 646 120; x_wconf 81' lang='eng' dir='ltr'><em>Ieguminum</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 655 97 706 115; x_wconf 87' lang='eng' dir='ltr'><em>ORS</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 717 95 779 115; x_wconf 79' lang='eng' dir='ltr'><em>1419T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 788 97 918 120; x_wconf 87' lang='eng' dir='ltr'>(AY785323)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 344 126 765 151; baseline 0 -5"><span class='ocrx_word' id='word_1_24' title='bbox 344 128 422 146; x_wconf 83' lang='eng' dir='ltr'><em>Ensifer</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 428 129 524 151; x_wconf 80' lang='eng' dir='ltr'><em>terangae</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 533 128 583 146; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 593 126 657 146; x_wconf 74' lang='eng' dir='ltr'><em>7834T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 666 128 765 151; x_wconf 83' lang='eng' dir='ltr'>(X68388)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 447 158 967 247">
+     <span class='ocr_line' id='line_1_7' title="bbox 476 158 967 184; baseline 0 -5"><span class='ocrx_word' id='word_1_29' title='bbox 476 161 617 179; x_wconf 79' lang='eng' dir='ltr'><em>Roseobacter</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 623 161 699 179; x_wconf 81' lang='eng' dir='ltr'><em>litora/is</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 706 160 772 179; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 781 158 859 179; x_wconf 77' lang='eng' dir='ltr'><em>49566T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 868 161 967 184; x_wconf 83' lang='eng' dir='ltr'>(X78312)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 451 190 964 215; baseline 0 -5"><span class='ocrx_word' id='word_1_34' title='bbox 451 192 550 215; x_wconf 82' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 558 192 718 215; x_wconf 79' lang='eng' dir='ltr'><em>gelatinovorans</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 727 192 768 210; x_wconf 90' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 779 190 855 210; x_wconf 81' lang='eng' dir='ltr'><em>12617T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 863 192 964 215; x_wconf 87' lang='eng' dir='ltr'>(D88523)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 447 221 934 247; baseline -0.002 -5"><span class='ocrx_word' id='word_1_39' title='bbox 447 224 584 242; x_wconf 82' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 592 224 679 242; x_wconf 75' lang='eng' dir='ltr'><em>Iolerans</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 688 223 739 242; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 750 221 826 242; x_wconf 83' lang='eng' dir='ltr'><em>11457T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 835 223 934 247; x_wconf 84' lang='eng' dir='ltr'>(Y11551)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 222 253 1302 1637">
+     <span class='ocr_line' id='line_1_10' title="bbox 411 253 976 278; baseline 0 -5"><span class='ocrx_word' id='word_1_44' title='bbox 411 255 719 273; x_wconf 79' lang='eng' dir='ltr'><em>Silicibacterlacuscaerulensis</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 728 255 779 273; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 791 253 866 273; x_wconf 81' lang='eng' dir='ltr'><em>11314T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 876 255 976 278; x_wconf 85' lang='eng' dir='ltr'><em>(U77644)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 437 284 910 310; baseline 0 -5"><span class='ocrx_word' id='word_1_48' title='bbox 437 287 556 305; x_wconf 79' lang='eng' dir='ltr'><em>Roseivivax</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 563 287 685 305; x_wconf 80' lang='eng' dir='ltr'><em>ha/odurans</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 693 286 741 305; x_wconf 87' lang='eng' dir='ltr'><em>OCh</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 750 284 801 305; x_wconf 80' lang='eng' dir='ltr'><em>239T</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 810 286 910 310; x_wconf 87' lang='eng' dir='ltr'>(D85829)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 381 316 916 342; baseline -0.002 -5"><span class='ocrx_word' id='word_1_53' title='bbox 381 319 509 337; x_wconf 81' lang='eng' dir='ltr'><em>Paracoccus</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 517 318 648 337; x_wconf 84' lang='eng' dir='ltr'><em>denitriﬁcans</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 656 318 722 337; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_56' title='bbox 733 316 808 336; x_wconf 83' lang='eng' dir='ltr'><em>17741T</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 817 318 916 342; x_wconf 86' lang='eng' dir='ltr'>(Y16927)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 250 348 887 373; baseline 0 -5"><span class='ocrx_word' id='word_1_58' title='bbox 250 361 260 371; x_wconf 84' lang='eng'><strong>.</strong></span> <span class='ocrx_word' id='word_1_59' title='bbox 376 350 519 368; x_wconf 81' lang='eng' dir='ltr'><em>Rhodobacter</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 524 350 658 373; x_wconf 84' lang='eng' dir='ltr'><em>sphaeroides</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 667 350 719 368; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 730 348 778 368; x_wconf 80' lang='eng' dir='ltr'><em>158T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 787 350 887 373; x_wconf 87' lang='eng' dir='ltr'>(X53855)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 377 379 995 405; baseline -0.002 -5"><span class='ocrx_word' id='word_1_64' title='bbox 377 382 519 400; x_wconf 83' lang='eng' dir='ltr'><em>Pseudovibrio</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 527 382 680 400; x_wconf 82' lang='eng' dir='ltr'><em>ascidiaceicola</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 689 381 756 400; x_wconf 86' lang='eng' dir='ltr'><em>NRBC</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 767 379 857 400; x_wconf 90' lang='eng' dir='ltr'><em>100514T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 866 381 995 405; x_wconf 85' lang='eng' dir='ltr'><em>(AB175663)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 366 411 865 436; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 366 413 507 431; x_wconf 84' lang='eng' dir='ltr'><em>Pseudovibrio</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 516 413 646 431; x_wconf 81' lang='eng' dir='ltr'><em>denitriﬁcans</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 656 411 727 431; x_wconf 81' lang='eng' dir='ltr'><em>DN34T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 736 413 865 436; x_wconf 85' lang='eng' dir='ltr'><em>(AY486423)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 369 442 894 468; baseline 0 -5"><span class='ocrx_word' id='word_1_73' title='bbox 369 445 523 463; x_wconf 81' lang='eng' dir='ltr'><em>Nesiotobacter</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 529 445 665 463; x_wconf 83' lang='eng' dir='ltr'><em>exalbescens</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 674 442 757 463; x_wconf 81' lang='eng' dir='ltr'><em>LA33BT</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 766 445 894 468; x_wconf 89' lang='eng' dir='ltr'><em>(AF513441)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 329 474 775 499; baseline 0 -5"><span class='ocrx_word' id='word_1_77' title='bbox 329 476 410 499; x_wconf 71' lang='eng' dir='ltr'><em>Stappia</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 419 477 529 499; x_wconf 75' lang='eng' dir='ltr'><em>aggregate</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 538 476 579 494; x_wconf 95' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 590 474 666 494; x_wconf 74' lang='eng' dir='ltr'><em>12614T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 675 476 775 499; x_wconf 88' lang='eng' dir='ltr'>(D88520)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 346 505 778 531; baseline -0.002 -5"><span class='ocrx_word' id='word_1_82' title='bbox 346 507 427 530; x_wconf 79' lang='eng' dir='ltr'><em>Stappia</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 436 508 532 526; x_wconf 78' lang='eng' dir='ltr'><em>stellulata</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 542 508 582 525; x_wconf 90' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 593 505 669 526; x_wconf 83' lang='eng' dir='ltr'><em>12621T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 678 507 778 531; x_wconf 86' lang='eng' dir='ltr'>(D88525)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 351 537 926 562; baseline 0 -5"><span class='ocrx_word' id='word_1_87' title='bbox 351 539 487 557; x_wconf 84' lang='eng' dir='ltr'><em>Kordiimonas</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 495 539 679 562; x_wconf 84' lang='eng' dir='ltr'><em>gwangyangensis</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 687 537 787 557; x_wconf 86' lang='eng' dir='ltr'><em>GW14-5T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 797 539 926 562; x_wconf 85' lang='eng' dir='ltr'><em>(AY682384)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 383 568 946 593; baseline 0 -4"><span class='ocrx_word' id='word_1_91' title='bbox 383 570 519 589; x_wconf 84' lang='eng' dir='ltr'><em>Parvularcula</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 528 570 669 589; x_wconf 79' lang='eng' dir='ltr'><em>bermudensis</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 678 568 809 589; x_wconf 73' lang='eng' dir='ltr'><em>HTCC2503T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 818 570 946 593; x_wconf 84' lang='eng' dir='ltr'>(AF544015)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 399 600 973 626; baseline -0.002 -5"><span class='ocrx_word' id='word_1_95' title='bbox 399 603 542 621; x_wconf 84' lang='eng' dir='ltr'><em>Asticcacaulis</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 550 603 675 621; x_wconf 82' lang='eng' dir='ltr'><em>excentricus</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 682 602 748 621; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 759 600 834 621; x_wconf 83' lang='eng' dir='ltr'><em>15261T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 843 602 973 626; x_wconf 89' lang='eng' dir='ltr'>(ABO16610)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 381 632 892 657; baseline 0 -5"><span class='ocrx_word' id='word_1_100' title='bbox 381 634 514 652; x_wconf 80' lang='eng' dir='ltr'><em>Caulobacter</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 521 634 623 652; x_wconf 82' lang='eng' dir='ltr'><em>vibrioides</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 632 634 684 652; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 694 632 757 652; x_wconf 74' lang='eng' dir='ltr'><em>9893T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 766 634 892 657; x_wconf 88' lang='eng' dir='ltr'>(AJ227754)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 354 663 898 688; baseline 0.002 -5"><span class='ocrx_word' id='word_1_105' title='bbox 354 665 525 684; x_wconf 81' lang='eng' dir='ltr'><em>Brevundimonas</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 533 665 624 684; x_wconf 82' lang='eng' dir='ltr'><em>diminuta</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 632 665 699 684; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 709 663 785 684; x_wconf 84' lang='eng' dir='ltr'><em>11568T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 794 665 898 688; x_wconf 85' lang='eng' dir='ltr'>(M59064)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 404 695 980 720; baseline 0 -5"><span class='ocrx_word' id='word_1_110' title='bbox 404 697 567 720; x_wconf 85' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 574 697 710 720; x_wconf 71' lang='eng' dir='ltr'><em>paucimobilis</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 718 697 784 715; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 793 695 870 715; x_wconf 79' lang='eng' dir='ltr'><em>29837T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 879 697 980 720; x_wconf 87' lang='eng' dir='ltr'><em>(U37337)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 427 726 1302 752; baseline -0.001 -5"><span class='ocrx_word' id='word_1_115' title='bbox 427 729 563 752; x_wconf 87' lang='eng' dir='ltr'><em>Zymomonas</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 571 729 646 747; x_wconf 84' lang='eng' dir='ltr'><em>mobilis</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 654 728 720 747; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 731 727 806 747; x_wconf 77' lang='eng' dir='ltr'><em>10988T</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 815 729 944 752; x_wconf 81' lang='eng' dir='ltr'>(AF281031)</span> <span class='ocrx_word' id='word_1_120' title='bbox 1070 726 1302 751; x_wconf 83' lang='eng' dir='ltr'><em>Sphingomonada/es</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 385 758 828 783; baseline 0 -5"><span class='ocrx_word' id='word_1_121' title='bbox 385 760 527 778; x_wconf 81' lang='eng' dir='ltr'><em>Blastamonas</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 535 760 632 778; x_wconf 84' lang='eng' dir='ltr'><em>ursinco/a</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 641 758 720 778; x_wconf 74' lang='eng' dir='ltr'><em>KR-99T</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 729 760 828 783; x_wconf 92' lang='eng' dir='ltr'>(Y10677)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 579 789 1013 815; baseline 0 -5"><span class='ocrx_word' id='word_1_125' title='bbox 579 791 730 810; x_wconf 84' lang='eng' dir='ltr'><em>Craurococcus</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 737 796 811 810; x_wconf 86' lang='eng' dir='ltr'><em>roseus</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 820 789 903 810; x_wconf 85' lang='eng' dir='ltr'><em>NS13OT</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 912 791 1013 815; x_wconf 86' lang='eng' dir='ltr'>(D85828)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 529 821 980 846; baseline 0 -5"><span class='ocrx_word' id='word_1_129' title='bbox 529 823 727 841; x_wconf 81' lang='eng' dir='ltr'><em>Paracraurococcus</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 735 823 794 841; x_wconf 86' lang='eng' dir='ltr'><em>ruber</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 801 821 870 841; x_wconf 79' lang='eng' dir='ltr'><em>N889T</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 879 823 980 846; x_wconf 85' lang='eng' dir='ltr'>(D85827)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 538 852 1003 877; baseline -0.002 -4"><span class='ocrx_word' id='word_1_133' title='bbox 538 855 682 873; x_wconf 82' lang='eng' dir='ltr'><em>Roseomonas</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 691 855 782 877; x_wconf 74' lang='eng' dir='ltr'><em>aquatica</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 790 852 860 873; x_wconf 80' lang='eng' dir='ltr'><em>TR53T</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 869 854 1003 877; x_wconf 83' lang='eng' dir='ltr'>(AM231587)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 530 884 1043 909; baseline -0.002 -4"><span class='ocrx_word' id='word_1_137' title='bbox 530 886 678 905; x_wconf 82' lang='eng' dir='ltr'><em>Raseococcus</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 686 886 862 909; x_wconf 84' lang='eng' dir='ltr'><em>thiosulfatophilus</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 871 884 935 905; x_wconf 84' lang='eng' dir='ltr'><em>RB-3T</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 944 886 1043 909; x_wconf 81' lang='eng' dir='ltr'>(X72908)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 448 916 940 943; baseline 0 -7"><span class='ocrx_word' id='word_1_141' title='bbox 448 933 458 943; x_wconf 69' lang='eng'>.</span> <span class='ocrx_word' id='word_1_142' title='bbox 482 918 616 936; x_wconf 75' lang='eng' dir='ltr'><em>Acetobacler</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 622 918 720 936; x_wconf 79' lang='eng' dir='ltr'><em>orienta/is</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 728 918 750 936; x_wconf 89' lang='eng'>21</span> <span class='ocrx_word' id='word_1_145' title='bbox 757 916 802 936; x_wconf 91' lang='eng' dir='ltr'><em>F-2T</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 810 918 940 941; x_wconf 78' lang='eng' dir='ltr'>(A3052706)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 494 947 891 972; baseline 0.003 -5"><span class='ocrx_word' id='word_1_147' title='bbox 494 949 580 968; x_wconf 81' lang='eng' dir='ltr'><em>Kozakia</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 588 949 684 968; x_wconf 86' lang='eng' dir='ltr'><em>baliensis</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 691 947 753 968; x_wconf 78' lang='eng' dir='ltr'><em>Yo-3T</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 762 949 891 972; x_wconf 78' lang='eng' dir='ltr'>(A8056321)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 475 979 1034 1004; baseline 0 -5"><span class='ocrx_word' id='word_1_151' title='bbox 475 981 636 999; x_wconf 82' lang='eng' dir='ltr'><em>Gluconobacter</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 642 981 733 1004; x_wconf 86' lang='eng' dir='ltr'><em>oxydans</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 742 981 809 999; x_wconf 88' lang='eng' dir='ltr'><em>NRBC</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 820 979 896 999; x_wconf 79' lang='eng' dir='ltr'><em>14819T</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 905 981 1034 1004; x_wconf 85' lang='eng' dir='ltr'><em>(AB178433)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 371 1010 814 1036; baseline 0 -6"><span class='ocrx_word' id='word_1_156' title='bbox 371 1013 454 1031; x_wconf 84' lang='eng' dir='ltr'><em>Tistrella</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 463 1013 539 1031; x_wconf 85' lang='eng' dir='ltr'><em>mobilis</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 548 1013 588 1030; x_wconf 95' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 599 1010 675 1031; x_wconf 44' lang='eng' dir='ltr'><em>14872.r</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 684 1012 814 1036; x_wconf 87' lang='eng' dir='ltr'><em>(ABO71665)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 407 1042 854 1067; baseline 0 -5"><span class='ocrx_word' id='word_1_161' title='bbox 407 1044 537 1062; x_wconf 86' lang='eng' dir='ltr'><em>Rhodovibrio</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 546 1044 677 1062; x_wconf 86' lang='eng' dir='ltr'><em>sodomensis</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 686 1042 742 1062; x_wconf 89' lang='eng' dir='ltr'><em>DS1T</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 751 1044 854 1067; x_wconf 84' lang='eng' dir='ltr'>(M59072)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 363 1073 878 1099; baseline 0.002 -6"><span class='ocrx_word' id='word_1_165' title='bbox 363 1076 496 1098; x_wconf 86' lang='eng' dir='ltr'><em>Azospin&#39;llum</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 504 1075 605 1098; x_wconf 85' lang='eng' dir='ltr'><em>Iipoferum</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 613 1075 679 1094; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 688 1073 765 1094; x_wconf 81' lang='eng' dir='ltr'><em>29707T</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 774 1075 878 1099; x_wconf 88' lang='eng' dir='ltr'><em>(M59061)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 369 1105 989 1130; baseline 0 -5"><span class='ocrx_word' id='word_1_170' title='bbox 369 1107 555 1130; x_wconf 76' lang='eng' dir='ltr'><em>Magnetospirillum</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 563 1107 746 1130; x_wconf 83' lang='eng' dir='ltr'><em>gryphiswaldense</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 756 1107 807 1125; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 816 1105 881 1125; x_wconf 79' lang='eng' dir='ltr'><em>6361T</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 890 1107 989 1130; x_wconf 82' lang='eng' dir='ltr'>(Y10109)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 361 1136 885 1162; baseline -0.002 -5"><span class='ocrx_word' id='word_1_175' title='bbox 361 1139 485 1161; x_wconf 82' lang='eng' dir='ltr'><em>Rhodospira</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 494 1139 578 1161; x_wconf 84' lang='eng' dir='ltr'><em>trueperi</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 584 1138 650 1157; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 659 1136 750 1157; x_wconf 83' lang='eng' dir='ltr'><em>700224T</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 759 1138 885 1162; x_wconf 87' lang='eng' dir='ltr'>(AJ001276)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 349 1168 795 1193; baseline 0 -5"><span class='ocrx_word' id='word_1_180' title='bbox 349 1170 472 1193; x_wconf 84' lang='eng' dir='ltr'><em>Roseospira</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 481 1170 565 1193; x_wconf 82' lang='eng' dir='ltr'><em>goensis</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 573 1168 652 1188; x_wconf 75' lang='eng' dir='ltr'><em>.JA135T</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 661 1170 795 1193; x_wconf 83' lang='eng' dir='ltr'>(AM283537)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 351 1199 899 1225; baseline 0 -5"><span class='ocrx_word' id='word_1_184' title='bbox 351 1202 513 1225; x_wconf 80' lang='eng' dir='ltr'><em>Rhodaspiril/urn</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 522 1202 599 1220; x_wconf 82' lang='eng' dir='ltr'><em>rubrum</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 606 1202 673 1220; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 683 1199 759 1220; x_wconf 89' lang='eng' dir='ltr'><em>11170T</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 768 1202 899 1225; x_wconf 86' lang='eng' dir='ltr'>(CP000230)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 333 1231 832 1264; baseline 0 -13"><span class='ocrx_word' id='word_1_189' title='bbox 333 1253 344 1264; x_wconf 62' lang='eng'><strong>.</strong></span> <span class='ocrx_word' id='word_1_190' title='bbox 366 1234 516 1256; x_wconf 86' lang='eng' dir='ltr'><em>Thalassospira</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 525 1234 634 1252; x_wconf 77' lang='eng' dir='ltr'><em>xiamensis</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 643 1231 694 1252; x_wconf 87' lang='eng' dir='ltr'><em>M-5T</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 703 1233 832 1257; x_wconf 85' lang='eng' dir='ltr'>(AY189753)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 366 1263 938 1288; baseline 0 -5"><span class='ocrx_word' id='word_1_194' title='bbox 366 1265 516 1288; x_wconf 71' lang='eng' dir='ltr'><em>Thalessospira</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 525 1265 648 1283; x_wconf 79' lang='eng' dir='ltr'><em>Iucentensis</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 657 1265 709 1283; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 720 1263 795 1283; x_wconf 89' lang='eng' dir='ltr'><em>14000T</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 804 1265 938 1288; x_wconf 82' lang='eng' dir='ltr'><em>(AM294944)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 358 1294 917 1320; baseline -0.002 -5"><span class='ocrx_word' id='word_1_199' title='bbox 358 1297 509 1319; x_wconf 85' lang='eng' dir='ltr'><em>Thalassospira</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 516 1296 666 1319; x_wconf 83' lang='eng' dir='ltr'><em>profundimaris</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 674 1297 750 1315; x_wconf 89' lang='eng' dir='ltr'>WP021</span> <span class='ocrx_word' id='word_1_202' title='bbox 757 1294 778 1314; x_wconf 96' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_203' title='bbox 787 1296 917 1320; x_wconf 85' lang='eng' dir='ltr'>(AY186195)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 366 1326 1052 1351; baseline 0 -5"><span class='ocrx_word' id='word_1_204' title='bbox 366 1328 496 1346; x_wconf 81' lang='eng' dir='ltr'><em>Terasak/e/la</em></span> <span class='ocrx_word' id='word_1_205' title='bbox 503 1328 573 1351; x_wconf 87' lang='eng' dir='ltr'><em>pusiI/a</em></span> <span class='ocrx_word' id='word_1_206' title='bbox 583 1328 621 1346; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_207' title='bbox 631 1326 708 1346; x_wconf 79' lang='eng' dir='ltr'><em>13613T</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 716 1328 846 1351; x_wconf 84' lang='eng' dir='ltr'>(AB006768)</span> <span class='ocrx_word' id='word_1_209' title='bbox 1038 1346 1052 1349; x_wconf 99' lang='eng'><strong>_</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 327 1359 692 1383; baseline 0 -6"><span class='ocrx_word' id='word_1_210' title='bbox 327 1359 388 1378; x_wconf 81' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 399 1359 472 1378; x_wconf 85' lang='eng' dir='ltr'>KOPRI</span> <span class='ocrx_word' id='word_1_212' title='bbox 484 1360 549 1378; x_wconf 88' lang='eng'>13522</span> <span class='ocrx_word' id='word_1_213' title='bbox 558 1359 692 1383; x_wconf 87' lang='eng' dir='ltr'>(DQ167245)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 338 1389 797 1414; baseline 0 -5"><span class='ocrx_word' id='word_1_214' title='bbox 338 1391 447 1409; x_wconf 88' lang='eng' dir='ltr'><em>Kiloniella</em></span> <span class='ocrx_word' id='word_1_215' title='bbox 455 1391 576 1409; x_wconf 86' lang='eng' dir='ltr'><em>Iaminariae</em></span> <span class='ocrx_word' id='word_1_216' title='bbox 585 1389 654 1409; x_wconf 90' lang='eng' dir='ltr'><em>LD81T</em></span> <span class='ocrx_word' id='word_1_217' title='bbox 663 1391 797 1414; x_wconf 87' lang='eng' dir='ltr'><em>(AM749667)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 347 1420 804 1446; baseline -0.002 -5"><span class='ocrx_word' id='word_1_218' title='bbox 347 1422 430 1441; x_wconf 85' lang='eng' dir='ltr'><em>Orientia</em></span> <span class='ocrx_word' id='word_1_219' title='bbox 440 1423 599 1445; x_wconf 82' lang='eng' dir='ltr'><em>tsutsugamushi</em></span> <span class='ocrx_word' id='word_1_220' title='bbox 607 1420 667 1445; x_wconf 77' lang='eng' dir='ltr'><em>KarpT</em></span> <span class='ocrx_word' id='word_1_221' title='bbox 676 1422 804 1446; x_wconf 88' lang='eng' dir='ltr'>(AFO62074)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 306 1452 1222 1477; baseline 0.003 -5"><span class='ocrx_word' id='word_1_222' title='bbox 306 1454 411 1472; x_wconf 74' lang='eng' dir='ltr'><em>Rickettsia</em></span> <span class='ocrx_word' id='word_1_223' title='bbox 419 1454 537 1477; x_wconf 82' lang='eng' dir='ltr'><em>prowazekii</em></span> <span class='ocrx_word' id='word_1_224' title='bbox 545 1452 616 1472; x_wconf 69' lang='eng' dir='ltr'><em>Breian</em></span> <span class='ocrx_word' id='word_1_225' title='bbox 625 1454 729 1477; x_wconf 80' lang='eng' dir='ltr'>(M21789)</span> <span class='ocrx_word' id='word_1_226' title='bbox 1069 1455 1222 1475; x_wconf 82' lang='eng' dir='ltr'><em>Rickettsia/es</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 406 1485 726 1509; baseline 0 -5"><span class='ocrx_word' id='word_1_227' title='bbox 406 1486 518 1504; x_wconf 74' lang='eng' dir='ltr'><em>Wo/bachia</em></span> <span class='ocrx_word' id='word_1_228' title='bbox 526 1486 616 1509; x_wconf 74' lang='eng' dir='ltr'><em>pipientis</em></span> <span class='ocrx_word' id='word_1_229' title='bbox 625 1485 726 1509; x_wconf 82' lang='eng' dir='ltr'>(U23709)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 263 1515 841 1541; baseline 0.002 -6"><span class='ocrx_word' id='word_1_230' title='bbox 263 1518 447 1540; x_wconf 85' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_231' title='bbox 456 1518 539 1536; x_wconf 82' lang='eng' dir='ltr'><em>indicum</em></span> <span class='ocrx_word' id='word_1_232' title='bbox 549 1517 616 1536; x_wconf 88' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_233' title='bbox 627 1515 703 1536; x_wconf 78' lang='eng' dir='ltr'><em>14233T</em></span> <span class='ocrx_word' id='word_1_234' title='bbox 712 1517 841 1541; x_wconf 85' lang='eng' dir='ltr'>(AB159513)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 274 1547 664 1572; baseline 0 -5"><span class='ocrx_word' id='word_1_235' title='bbox 274 1549 334 1567; x_wconf 71' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_236' title='bbox 342 1549 433 1572; x_wconf 73' lang='eng' dir='ltr'><em>chagasii</em></span> <span class='ocrx_word' id='word_1_237' title='bbox 441 1547 530 1567; x_wconf 78' lang='eng' dir='ltr'><em>R-3712T</em></span> <span class='ocrx_word' id='word_1_238' title='bbox 539 1549 664 1572; x_wconf 84' lang='eng' dir='ltr'><em>(AJ316199)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 284 1580 678 1604; baseline 0 -5"><span class='ocrx_word' id='word_1_239' title='bbox 284 1581 410 1599; x_wconf 74' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_240' title='bbox 419 1581 456 1599; x_wconf 83' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_241' title='bbox 462 1581 508 1599; x_wconf 88' lang='eng' dir='ltr'><em>W31</em></span> <span class='ocrx_word' id='word_1_242' title='bbox 515 1581 539 1599; x_wconf 91' lang='eng'><em>10</em></span> <span class='ocrx_word' id='word_1_243' title='bbox 549 1580 678 1604; x_wconf 81' lang='eng' dir='ltr'>(AP009048)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 222 1610 1052 1637; baseline 0 -7"><span class='ocrx_word' id='word_1_244' title='bbox 222 1612 441 1630; x_wconf 76' lang='eng' dir='ltr'><em>Pseudoalteromonas</em></span> <span class='ocrx_word' id='word_1_245' title='bbox 449 1612 568 1630; x_wconf 84' lang='eng' dir='ltr'><em>maricaloris</em></span> <span class='ocrx_word' id='word_1_246' title='bbox 576 1612 630 1630; x_wconf 94' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_247' title='bbox 640 1610 690 1630; x_wconf 82' lang='eng' dir='ltr'><em>636T</em></span> <span class='ocrx_word' id='word_1_248' title='bbox 699 1612 827 1635; x_wconf 87' lang='eng' dir='ltr'><em>(AF144036)</em></span> <span class='ocrx_word' id='word_1_249' title='bbox 1038 1633 1052 1637; x_wconf 99' lang='eng'><strong>_</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 1069 333 1275 356">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 1069 334 1275 354">
+     <span class='ocr_line' id='line_1_54' title="bbox 1069 334 1275 354; baseline 0 0"><span class='ocrx_word' id='word_1_250' title='bbox 1069 334 1275 354; x_wconf 83' lang='eng' dir='ltr'><em>Rhodobacterales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 1068 532 1272 590">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 1069 533 1272 588">
+     <span class='ocr_line' id='line_1_55' title="bbox 1069 533 1272 553; baseline 0 0"><span class='ocrx_word' id='word_1_251' title='bbox 1069 533 1272 553; x_wconf 84' lang='eng' dir='ltr'><em>Kordiimonada/es</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 1069 567 1266 588; baseline 0.005 -1"><span class='ocrx_word' id='word_1_252' title='bbox 1069 567 1266 588; x_wconf 79' lang='eng' dir='ltr'><em>‘Parvu/arculales’</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 330 615 1266 653">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 330 615 1266 651">
+     <span class='ocr_line' id='line_1_57' title="bbox 330 615 340 625; baseline 0 0"><span class='ocrx_word' id='word_1_253' title='bbox 330 615 340 625; x_wconf 73' lang='eng' dir='ltr'><strong>I</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 1070 631 1266 651; baseline 0 0"><span class='ocrx_word' id='word_1_254' title='bbox 1070 631 1266 651; x_wconf 82' lang='eng' dir='ltr'><em>Caulobactera/es</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 1034 521 1054 696">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 1036 521 1052 696">
+     <span class='ocr_line' id='line_1_59' title="bbox 1036 521 1052 696; textangle 90"><span class='ocrx_word' id='word_1_255' title='bbox 1036 693 1051 696; x_wconf 99' lang='eng' dir='ltr'><strong>I</strong></span> <span class='ocrx_word' id='word_1_256' title='bbox 1036 521 1052 590; x_wconf 82' lang='eng' dir='ltr'>III”</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 1036 775 1052 791">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 1036 775 1052 791">
+     <span class='ocr_line' id='line_1_60' title="bbox 1036 775 1052 791; textangle 90"><span class='ocrx_word' id='word_1_257' title='bbox 1036 788 1051 791; x_wconf 90' lang='eng' dir='ltr'>I</span> <span class='ocrx_word' id='word_1_258' title='bbox 1038 775 1052 778; x_wconf 99' lang='eng' dir='ltr'>I</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 1069 1057 1262 1085">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 1069 1058 1262 1084">
+     <span class='ocr_line' id='line_1_61' title="bbox 1069 1058 1262 1084; baseline 0 -6"><span class='ocrx_word' id='word_1_259' title='bbox 1069 1058 1262 1084; x_wconf 85' lang='eng' dir='ltr'><em>Rhodospirillales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 1036 1504 1051 1523">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 1036 1504 1051 1523">
+     <span class='ocr_line' id='line_1_62' title="bbox 1036 1504 1051 1523; textangle 90"><span class='ocrx_word' id='word_1_260' title='bbox 1036 1520 1051 1523; x_wconf 99' lang='eng' dir='ltr'>I</span> <span class='ocrx_word' id='word_1_261' title='bbox 1038 1504 1051 1507; x_wconf 97' lang='eng' dir='ltr'><strong>l</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 1068 1569 1181 1596">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 1069 1569 1181 1595">
+     <span class='ocr_line' id='line_1_63' title="bbox 1069 1569 1181 1595; baseline 0 -6"><span class='ocrx_word' id='word_1_262' title='bbox 1069 1569 1181 1595; x_wconf 89' lang='eng' dir='ltr'><em>Outgroup</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 1036 163 1068 1635">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 1036 163 1068 1635">
+     <span class='ocr_line' id='line_1_64' title="bbox 1036 163 1068 1635; baseline 0 2"><span class='ocrx_word' id='word_1_263' title='bbox 1036 163 1068 1635; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001677-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001677-0-001.pbm.png
new file mode 100644
index 00000000..bb2dc2bc
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001677-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001677-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001677-0-001.pbm.png.hocr
new file mode 100644
index 00000000..6cb13a9b
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001677-0-001.pbm.png.hocr
@@ -0,0 +1,134 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001677-0-001.pbm.png"; bbox 0 0 1302 826; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 292 27 1082 84">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 292 27 1082 84">
+     <span class='ocr_line' id='line_1_1' title="bbox 526 27 1082 62; baseline -0.002 -6"><span class='ocrx_word' id='word_1_1' title='bbox 526 34 709 56; x_wconf 84' lang='eng' dir='ltr'><em>Methanolobus</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 718 34 891 61; x_wconf 84' lang='eng' dir='ltr'><em>bombayensis</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 901 27 954 55; x_wconf 93' lang='eng' dir='ltr'><em>B-1T</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 963 34 1082 62; x_wconf 89' lang='eng' dir='ltr'><em>(U20148)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 292 68 376 84; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 292 68 376 84; x_wconf 80' lang='eng'><em>68/71/73</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 370 91 387 93">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 370 91 387 93">
+     <span class='ocr_line' id='line_1_3' title="bbox 370 91 387 93; baseline 0 733"><span class='ocrx_word' id='word_1_6' title='bbox 370 91 387 93; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 385 47 387 134">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 385 47 387 134">
+     <span class='ocr_line' id='line_1_4' title="bbox 385 47 387 134; baseline 0 692"><span class='ocrx_word' id='word_1_7' title='bbox 385 47 387 134; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 282 116 1055 152">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 282 116 1055 152">
+     <span class='ocr_line' id='line_1_5' title="bbox 282 116 1055 152; baseline 0 -7"><span class='ocrx_word' id='word_1_8' title='bbox 282 136 365 152; x_wconf 69' lang='eng'><em>82,70,54</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 388 135 456 137; x_wconf 96' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_10' title='bbox 464 123 647 145; x_wconf 87' lang='eng' dir='ltr'><em>Methanolobus</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 658 123 767 145; x_wconf 80' lang='eng' dir='ltr'><em>tinder/us</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 778 123 839 145; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 850 116 1055 151; x_wconf 74' lang='eng' dir='ltr'><em>2278T(M59135)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 0 153 460 765">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 0 153 460 765">
+     <span class='ocr_line' id='line_1_6' title="bbox 332 153 374 206; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 332 153 374 206; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 330 206 342 239; baseline 0 587"><span class='ocrx_word' id='word_1_15' title='bbox 330 206 342 239; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 292 239 342 257; baseline 0 569"><span class='ocrx_word' id='word_1_16' title='bbox 292 239 342 257; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 292 257 342 277; baseline 0 549"><span class='ocrx_word' id='word_1_17' title='bbox 292 257 342 277; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 140 277 441 369; baseline 0 -27"><span class='ocrx_word' id='word_1_18' title='bbox 140 277 441 369; x_wconf 95' lang='eng' dir='ltr'><em>     </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 140 369 441 454; baseline 0 -20"><span class='ocrx_word' id='word_1_19' title='bbox 140 369 441 454; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 47 454 460 548; baseline 0 -61"><span class='ocrx_word' id='word_1_20' title='bbox 47 454 460 548; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 0 613 455 727; baseline 0 -69"><span class='ocrx_word' id='word_1_21' title='bbox 0 613 455 727; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 47 727 429 765; baseline 0 61"><span class='ocrx_word' id='word_1_22' title='bbox 47 727 429 765; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 370 91 372 224">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 370 91 372 224">
+     <span class='ocr_line' id='line_1_15' title="bbox 370 91 372 224; baseline 0 602"><span class='ocrx_word' id='word_1_23' title='bbox 370 91 372 224; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 246 206 979 240">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 246 206 979 240">
+     <span class='ocr_line' id='line_1_16' title="bbox 246 206 979 240; baseline 0.004 -9"><span class='ocrx_word' id='word_1_24' title='bbox 246 214 330 231; x_wconf 85' lang='eng'><em>88/80/80</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 370 224 431 227; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_26' title='bbox 439 213 622 234; x_wconf 84' lang='eng' dir='ltr'><em>Methanolobus</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 632 213 723 234; x_wconf 82' lang='eng' dir='ltr'><em>vulcani</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 732 206 979 240; x_wconf 74' lang='eng' dir='ltr'><em>PL-12/MT(U20155)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 1107 243 1302 266">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 1107 243 1302 266">
+     <span class='ocr_line' id='line_1_17' title="bbox 1107 243 1302 266; baseline 0 0"><span class='ocrx_word' id='word_1_29' title='bbox 1107 243 1302 266; x_wconf 82' lang='eng' dir='ltr'><em>Methanolobus</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 183 294 1026 334">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 183 294 1026 334">
+     <span class='ocr_line' id='line_1_18' title="bbox 183 294 1026 334; baseline 0 -11"><span class='ocrx_word' id='word_1_30' title='bbox 183 318 290 334; x_wconf 64' lang='eng'><em>100,100,97</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 435 302 632 323; x_wconf 84' lang='eng' dir='ltr'><em>Methanolobus</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 641 301 762 329; x_wconf 88' lang='eng' dir='ltr'><em>profundi</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 771 294 863 323; x_wconf 90' lang='eng' dir='ltr'><em>MobMT</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 872 301 1026 329; x_wconf 88' lang='eng' dir='ltr'><em>(AB370245)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 445 385 953 418">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 445 385 953 418">
+     <span class='ocr_line' id='line_1_19' title="bbox 445 385 953 418; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 445 391 628 412; x_wconf 84' lang='eng' dir='ltr'><em>Methanolobus</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 638 391 723 418; x_wconf 85' lang='eng' dir='ltr'><em>taylorii</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 731 385 953 418; x_wconf 74' lang='eng' dir='ltr'><em>GS-16T(U20154)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 55 462 1043 508">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 55 462 1043 508">
+     <span class='ocr_line' id='line_1_20' title="bbox 55 462 916 488; baseline 0 -9"><span class='ocrx_word' id='word_1_38' title='bbox 55 462 139 479; x_wconf 83' lang='eng'>66/59/50</span> <span class='ocrx_word' id='word_1_39' title='bbox 801 480 804 483; x_wconf 48' lang='eng'><strong><em>.</em></strong></span> <span class='ocrx_word' id='word_1_40' title='bbox 905 474 916 488; x_wconf 71' lang='eng' dir='ltr'>T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 465 480 1043 508; baseline -0.002 -6"><span class='ocrx_word' id='word_1_41' title='bbox 465 480 649 502; x_wconf 86' lang='eng' dir='ltr'><em>Methanolobus</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 659 486 817 507; x_wconf 79' lang='eng' dir='ltr'><em>oregonen3/s</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 826 480 900 501; x_wconf 94' lang='eng' dir='ltr'>WAL1</span> <span class='ocrx_word' id='word_1_44' title='bbox 923 480 1043 508; x_wconf 88' lang='eng' dir='ltr'><em>(U20152)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 1094 3 1096 534">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 1094 3 1096 534">
+     <span class='ocr_line' id='line_1_22' title="bbox 1094 3 1096 534; baseline 0 292"><span class='ocrx_word' id='word_1_45' title='bbox 1094 3 1096 534; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 443 564 1056 597">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 443 564 1056 597">
+     <span class='ocr_line' id='line_1_23' title="bbox 443 564 1056 597; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 443 570 689 597; x_wconf 85' lang='eng' dir='ltr'><em>Methanohalophilus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 698 570 769 591; x_wconf 76' lang='eng' dir='ltr'><em>mahii</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 778 569 839 591; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 851 564 1056 597; x_wconf 66' lang='eng' dir='ltr'><em>5219T(M59133)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 63 633 1164 687">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 63 633 1164 687">
+     <span class='ocr_line' id='line_1_24' title="bbox 63 633 144 650; baseline -0.012 0"><span class='ocrx_word' id='word_1_50' title='bbox 63 633 144 650; x_wconf 85' lang='eng'>57/56/51</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 464 653 1164 687; baseline 0 -6"><span class='ocrx_word' id='word_1_51' title='bbox 464 659 708 681; x_wconf 80' lang='eng' dir='ltr'><em>Methanococcoides</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 717 659 875 687; x_wconf 80' lang='eng' dir='ltr'><em>methylutens</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 886 659 947 681; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 958 653 1164 687; x_wconf 74' lang='eng' dir='ltr'><em>2657T(M59127)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 429 743 1033 775">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 429 743 1033 775">
+     <span class='ocr_line' id='line_1_26' title="bbox 429 743 1033 775; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 429 748 635 769; x_wconf 87' lang='eng' dir='ltr'><em>Methanosarcina</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 646 748 736 769; x_wconf 87' lang='eng' dir='ltr'><em>barkeri</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 745 747 806 769; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 818 743 1033 775; x_wconf 71' lang='eng' dir='ltr'><em>800T(AJO12094)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 128 809 169 826">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 128 809 169 826">
+     <span class='ocr_line' id='line_1_27' title="bbox 128 809 169 826; baseline 0 0"><span class='ocrx_word' id='word_1_59' title='bbox 128 809 169 826; x_wconf 60' lang='eng'><em>0,02</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001685-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001685-0-001.pbm.png
new file mode 100644
index 00000000..db529a33
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001685-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001685-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001685-0-001.pbm.png.hocr
new file mode 100644
index 00000000..de50ab7b
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001685-0-001.pbm.png.hocr
@@ -0,0 +1,120 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001685-0-001.pbm.png"; bbox 0 0 1243 1002; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 1 734 965">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 0 1 734 965">
+     <span class='ocr_line' id='line_1_1' title="bbox 0 1 118 47; baseline 0 955"><span class='ocrx_word' id='word_1_1' title='bbox 0 1 118 47; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 0 47 180 89; baseline 0 913"><span class='ocrx_word' id='word_1_2' title='bbox 0 47 180 89; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 0 89 410 129; baseline 0 873"><span class='ocrx_word' id='word_1_3' title='bbox 0 89 410 129; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 0 129 567 171; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 0 129 567 171; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 0 171 339 211; baseline 0 791"><span class='ocrx_word' id='word_1_5' title='bbox 0 171 339 211; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 0 211 390 253; baseline 0 749"><span class='ocrx_word' id='word_1_6' title='bbox 0 211 390 253; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 25 253 453 295; baseline 0 707"><span class='ocrx_word' id='word_1_7' title='bbox 25 253 453 295; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 25 295 492 324; baseline 0 678"><span class='ocrx_word' id='word_1_8' title='bbox 25 295 492 324; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 25 324 434 417; baseline 0 -81"><span class='ocrx_word' id='word_1_9' title='bbox 25 324 434 417; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 96 417 426 500; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 96 417 426 500; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 96 500 426 542; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 96 500 426 542; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 96 542 431 626; baseline 0 -42"><span class='ocrx_word' id='word_1_12' title='bbox 96 542 431 626; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 191 626 400 668; baseline 0 334"><span class='ocrx_word' id='word_1_13' title='bbox 191 626 400 668; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 191 668 477 748; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 191 668 477 748; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 192 748 482 790; baseline 0 212"><span class='ocrx_word' id='word_1_15' title='bbox 192 748 482 790; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 192 790 544 834; baseline 0 168"><span class='ocrx_word' id='word_1_16' title='bbox 192 790 544 834; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 218 834 547 874; baseline 0 128"><span class='ocrx_word' id='word_1_17' title='bbox 218 834 547 874; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 218 874 565 916; baseline 0 86"><span class='ocrx_word' id='word_1_18' title='bbox 218 874 565 916; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 218 916 734 965; baseline 0 -25"><span class='ocrx_word' id='word_1_19' title='bbox 218 916 734 965; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 5 977 137 999">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 5 977 137 999">
+     <span class='ocr_line' id='line_1_20' title="bbox 5 977 137 999; baseline 0 0"><span class='ocrx_word' id='word_1_20' title='bbox 5 982 57 987; x_wconf 86' lang='eng'>—</span> <span class='ocrx_word' id='word_1_21' title='bbox 69 977 137 999; x_wconf 91' lang='eng'>0.005</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 118 4 720 34">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 118 4 720 33">
+     <span class='ocr_line' id='line_1_21' title="bbox 118 4 720 33; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 118 6 244 33; x_wconf 87' lang='eng' dir='ltr'><em>Dugane/la</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 255 6 409 33; x_wconf 86' lang='eng' dir='ltr'><em>violaceinigra</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 418 6 466 27; x_wconf 94' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 477 4 720 33; x_wconf 75' lang='eng' dir='ltr'><em>31327T(AY376163)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 180 46 1241 983">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 180 46 1241 983">
+     <span class='ocr_line' id='line_1_22' title="bbox 180 46 625 75; baseline 0.002 -6"><span class='ocrx_word' id='word_1_26' title='bbox 180 48 281 69; x_wconf 78' lang='eng' dir='ltr'><em>Mass/lie</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 291 48 415 69; x_wconf 87' lang='eng' dir='ltr'><em>albidiﬂava</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 423 46 467 70; x_wconf 92' lang='eng' dir='ltr'><em>45T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 476 48 625 75; x_wconf 84' lang='eng' dir='ltr'><em>(AY965999)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 410 86 1033 115; baseline -0.002 -5"><span class='ocrx_word' id='word_1_30' title='bbox 410 89 548 110; x_wconf 86' lang='eng' dir='ltr'><em>Naxibacter</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 554 89 718 110; x_wconf 86' lang='eng' dir='ltr'><em>alkalitolerans</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 726 89 775 109; x_wconf 95' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 786 86 875 110; x_wconf 82' lang='eng' dir='ltr'>31775T</span> <span class='ocrx_word' id='word_1_34' title='bbox 884 88 1033 115; x_wconf 88' lang='eng' dir='ltr'><em>(AY679161)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 577 128 1020 157; baseline 0.002 -6"><span class='ocrx_word' id='word_1_35' title='bbox 577 130 666 152; x_wconf 86' lang='eng' dir='ltr'><em>Telluria</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 676 130 742 152; x_wconf 81' lang='eng' dir='ltr'><em>mixta</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 750 130 812 152; x_wconf 92' lang='eng' dir='ltr'><em>ACM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 824 128 897 152; x_wconf 89' lang='eng' dir='ltr'><em>1762T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 906 130 1020 157; x_wconf 86' lang='eng' dir='ltr'><em>(X65589)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 339 168 1012 197; baseline 0 -5"><span class='ocrx_word' id='word_1_40' title='bbox 339 171 570 192; x_wconf 83' lang='eng' dir='ltr'><em>Janthinobacterium</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 579 171 802 197; x_wconf 85' lang='eng' dir='ltr'><em>agaricidamnosum</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 810 168 888 192; x_wconf 67' lang='eng' dir='ltr'><em>W1r1’:T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 898 170 1012 197; x_wconf 93' lang='eng' dir='ltr'><em>(Y08845)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 390 210 991 239; baseline 0 -5"><span class='ocrx_word' id='word_1_44' title='bbox 390 213 560 239; x_wconf 86' lang='eng' dir='ltr'><em>Aquaspin&#39;llum</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 570 213 676 234; x_wconf 85' lang='eng' dir='ltr'><em>arcticum</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 686 213 732 234; x_wconf 94' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 745 210 833 234; x_wconf 82' lang='eng' dir='ltr'><em>14963T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 842 213 991 239; x_wconf 89' lang='eng' dir='ltr'><em>(ABO74523)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 453 252 1029 281; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 453 254 658 275; x_wconf 85' lang='eng' dir='ltr'><em>Herminiimonas</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 666 254 755 281; x_wconf 88' lang='eng' dir='ltr'><em>glaciei</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 762 252 869 275; x_wconf 82' lang='eng' dir='ltr'><em>UMB49T</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 878 254 1029 281; x_wconf 82' lang='eng' dir='ltr'><em>(EU489741)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 501 294 1060 322; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 501 295 752 316; x_wconf 85' lang='eng' dir='ltr'><em>Ultramicrobacterium</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 764 294 899 316; x_wconf 85' lang='eng' dir='ltr'><em>ISSDS-831</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 913 294 1060 322; x_wconf 88' lang='eng' dir='ltr'><em>(EF620474)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 434 337 992 363; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 434 337 664 358; x_wconf 80' lang='eng' dir='ltr'><em>Janthinobacterium</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 673 343 707 363; x_wconf 92' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 720 337 831 358; x_wconf 83' lang='eng' dir='ltr'><em>Marseille</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 841 337 992 363; x_wconf 86' lang='eng' dir='ltr'><em>(CP000269)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 356 377 916 404; baseline 0 -6"><span class='ocrx_word' id='word_1_60' title='bbox 356 377 399 398; x_wconf 92' lang='eng'>100</span> <span class='ocrx_word' id='word_1_61' title='bbox 437 377 688 399; x_wconf 84' lang='eng' dir='ltr'><em>Ultramicrobacterium</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 699 377 753 399; x_wconf 95' lang='eng' dir='ltr'><em>Um1</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 767 377 916 404; x_wconf 84' lang='eng' dir='ltr'><em>(AY387012)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 435 419 934 446; baseline 0 -6"><span class='ocrx_word' id='word_1_64' title='bbox 435 419 686 440; x_wconf 87' lang='eng' dir='ltr'><em>Ultramicrobacterium</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 698 419 770 440; x_wconf 93' lang='eng' dir='ltr'><em>HI-G4</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 781 419 934 446; x_wconf 87' lang='eng' dir='ltr'><em>(DQ205303)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 435 461 911 487; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 435 461 686 482; x_wconf 87' lang='eng' dir='ltr'><em>Ultramicrobacterium</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 698 461 751 482; x_wconf 94' lang='eng' dir='ltr'><em>ND5</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 762 461 911 487; x_wconf 78' lang='eng' dir='ltr'><em>(ABOOB506)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 428 499 1033 528; baseline 0 -5"><span class='ocrx_word' id='word_1_70' title='bbox 428 502 616 523; x_wconf 85' lang='eng' dir='ltr'><em>Herm/niimonas</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 625 502 782 523; x_wconf 83' lang='eng' dir='ltr'><em>saxobsidens</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 791 501 840 523; x_wconf 83' lang='eng' dir='ltr'><em>N81</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 847 499 872 523; x_wconf 93' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 879 502 1033 528; x_wconf 86' lang='eng' dir='ltr'><em>(AM493906)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 425 541 1099 570; baseline 0 -6"><span class='ocrx_word' id='word_1_75' title='bbox 425 543 614 564; x_wconf 88' lang='eng' dir='ltr'><em>Herminiimonas</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 623 543 819 570; x_wconf 83' lang='eng' dir='ltr'><em>arsenicoxydans</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 828 541 941 564; x_wconf 89' lang='eng' dir='ltr'><em>ULPAs1T</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 951 543 1099 570; x_wconf 87' lang='eng' dir='ltr'><em>(AY728038)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 438 583 1092 612; baseline 0.002 -6"><span class='ocrx_word' id='word_1_79' title='bbox 438 585 627 606; x_wconf 88' lang='eng' dir='ltr'><em>Herminiimonas</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 636 585 739 612; x_wconf 85' lang='eng' dir='ltr'><em>aquatilis</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 748 585 829 607; x_wconf 91' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_82' title='bbox 840 583 929 607; x_wconf 79' lang='eng' dir='ltr'><em>36956T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 938 585 1092 612; x_wconf 82' lang='eng' dir='ltr'><em>(AM085762)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 408 623 948 653; baseline 0 -6"><span class='ocrx_word' id='word_1_84' title='bbox 408 626 597 647; x_wconf 86' lang='eng' dir='ltr'><em>Herminiimonas</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 606 626 710 647; x_wconf 83' lang='eng' dir='ltr'><em>fonticola</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 719 623 790 647; x_wconf 77' lang='eng' dir='ltr'><em>S-94T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 799 626 948 653; x_wconf 88' lang='eng' dir='ltr'><em>(AY676462)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 407 664 1052 694; baseline 0 -5"><span class='ocrx_word' id='word_1_88' title='bbox 407 664 451 685; x_wconf 84' lang='eng'>100</span> <span class='ocrx_word' id='word_1_89' title='bbox 489 668 670 694; x_wconf 86' lang='eng' dir='ltr'><em>HerbaspiriI/um</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 680 668 800 689; x_wconf 83' lang='eng' dir='ltr'><em>Iusitanum</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 809 665 895 689; x_wconf 70' lang='eng' dir='ltr'><em>PIS—12T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 905 667 1052 694; x_wconf 81' lang='eng' dir='ltr'><em>(AF543312)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 477 706 968 734; baseline 0 -5"><span class='ocrx_word' id='word_1_93' title='bbox 477 708 657 734; x_wconf 83' lang='eng' dir='ltr'><em>Herbaspin&#39;llum</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 667 708 751 729; x_wconf 86' lang='eng' dir='ltr'><em>hiltneri</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 759 706 805 729; x_wconf 81' lang='eng' dir='ltr'><em>N3T</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 814 708 968 734; x_wconf 86' lang='eng' dir='ltr'><em>(DQ150563)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 489 747 1145 776; baseline 0 -5"><span class='ocrx_word' id='word_1_97' title='bbox 489 750 670 776; x_wconf 87' lang='eng' dir='ltr'><em>Herbaspirillum</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 679 750 858 776; x_wconf 85' lang='eng' dir='ltr'><em>rhizosphaerae</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 867 747 982 771; x_wconf 77' lang='eng' dir='ltr'><em>UMS-37T</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 991 750 1145 776; x_wconf 86' lang='eng' dir='ltr'><em>(DQ188986)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 557 789 1081 819; baseline 0 -6"><span class='ocrx_word' id='word_1_101' title='bbox 557 792 695 813; x_wconf 84' lang='eng' dir='ltr'><em>Collimonas</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 704 792 850 819; x_wconf 86' lang='eng' dir='ltr'><em>fungivorans</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 858 789 928 813; x_wconf 68' lang='eng' dir='ltr'><em>TerﬁT</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 937 792 1081 818; x_wconf 83' lang='eng' dir='ltr'><em>(AJ310394)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 547 829 1107 859; baseline 0 -6"><span class='ocrx_word' id='word_1_105' title='bbox 547 832 702 853; x_wconf 85' lang='eng' dir='ltr'><em>Paucimonas</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 711 832 833 859; x_wconf 86' lang='eng' dir='ltr'><em>Iemoignei</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 841 832 899 853; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 909 829 983 853; x_wconf 90' lang='eng' dir='ltr'><em>2207T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 992 832 1107 858; x_wconf 86' lang='eng' dir='ltr'><em>(X92555)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 565 871 1190 901; baseline 0 -6"><span class='ocrx_word' id='word_1_110' title='bbox 565 874 772 895; x_wconf 83' lang='eng' dir='ltr'><em>Oxalicibacterium</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 782 874 864 895; x_wconf 85' lang='eng' dir='ltr'><em>ﬂavum</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 874 874 932 895; x_wconf 94' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 942 871 1032 895; x_wconf 88' lang='eng' dir='ltr'><em>21571T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1042 874 1190 901; x_wconf 83' lang='eng' dir='ltr'><em>(AY061962)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 743 912 1241 941; baseline 0 -5"><span class='ocrx_word' id='word_1_115' title='bbox 743 914 896 936; x_wconf 84' lang='eng' dir='ltr'><em>Oxalobacter</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 902 914 1042 941; x_wconf 81' lang='eng' dir='ltr'><em>form/genes</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1050 912 1116 936; x_wconf 92' lang='eng' dir='ltr'><em>OXBT</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 1126 915 1241 941; x_wconf 87' lang='eng' dir='ltr'><em>(U49757)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 487 954 1115 983; baseline 0 -5"><span class='ocrx_word' id='word_1_119' title='bbox 487 957 667 978; x_wconf 84' lang='eng' dir='ltr'><em>Undibacterium</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 675 957 761 983; x_wconf 87' lang='eng' dir='ltr'><em>pigrum</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 770 956 852 978; x_wconf 91' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_122' title='bbox 862 954 952 978; x_wconf 81' lang='eng' dir='ltr'><em>49009T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 961 956 1115 983; x_wconf 84' lang='eng' dir='ltr'><em>(AM397630)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001693-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001693-0-001.pbm.png
new file mode 100644
index 00000000..df4e89d6
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001693-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001693-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001693-0-001.pbm.png.hocr
new file mode 100644
index 00000000..c9a85dce
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001693-0-001.pbm.png.hocr
@@ -0,0 +1,485 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001693-0-001.pbm.png"; bbox 0 0 1302 1124; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 43 846 69 864">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 43 846 69 864">
+     <span class='ocr_line' id='line_1_1' title="bbox 43 846 69 864; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 43 846 69 864; x_wconf 90' lang='eng'><em>80</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 78 546 122 565">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 78 546 122 565">
+     <span class='ocr_line' id='line_1_2' title="bbox 78 546 122 565; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 78 546 122 565; x_wconf 89' lang='eng'>0.01</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 257 747 296 766">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 257 747 296 766">
+     <span class='ocr_line' id='line_1_3' title="bbox 257 747 296 766; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 257 747 296 766; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 343 417 384 419">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 343 417 384 419">
+     <span class='ocr_line' id='line_1_4' title="bbox 343 417 384 419; baseline 0 705"><span class='ocrx_word' id='word_1_4' title='bbox 343 417 384 419; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 307 624 345 625">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 307 624 345 625">
+     <span class='ocr_line' id='line_1_5' title="bbox 307 624 345 625; baseline 0 499"><span class='ocrx_word' id='word_1_5' title='bbox 307 624 345 625; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 80 771 309 773">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 80 771 309 773">
+     <span class='ocr_line' id='line_1_6' title="bbox 80 771 309 773; baseline 0 351"><span class='ocrx_word' id='word_1_6' title='bbox 80 771 309 773; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 28 870 82 872">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 28 870 82 872">
+     <span class='ocr_line' id='line_1_7' title="bbox 28 870 82 872; baseline 0 252"><span class='ocrx_word' id='word_1_7' title='bbox 28 870 82 872; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 4 944 29 946">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 4 944 29 946">
+     <span class='ocr_line' id='line_1_8' title="bbox 4 944 29 946; baseline 0 178"><span class='ocrx_word' id='word_1_8' title='bbox 4 944 29 946; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 28 870 29 1020">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 28 870 29 1020">
+     <span class='ocr_line' id='line_1_9' title="bbox 28 870 29 1020; baseline 0 104"><span class='ocrx_word' id='word_1_9' title='bbox 28 870 29 1020; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 80 771 82 971">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 80 771 82 971">
+     <span class='ocr_line' id='line_1_10' title="bbox 80 771 82 971; baseline 0 153"><span class='ocrx_word' id='word_1_10' title='bbox 80 771 82 971; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 28 1019 291 1020">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 28 1019 291 1020">
+     <span class='ocr_line' id='line_1_11' title="bbox 28 1019 291 1020; baseline 0 104"><span class='ocrx_word' id='word_1_11' title='bbox 28 1019 291 1020; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 4 944 6 1086">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 4 944 6 1086">
+     <span class='ocr_line' id='line_1_12' title="bbox 4 944 6 1086; baseline 0 38"><span class='ocrx_word' id='word_1_12' title='bbox 4 944 6 1086; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 4 1084 188 1086">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 4 1084 188 1086">
+     <span class='ocr_line' id='line_1_13' title="bbox 4 1084 188 1086; baseline 0 38"><span class='ocrx_word' id='word_1_13' title='bbox 4 1084 188 1086; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 143 1094 182 1113">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 143 1094 182 1113">
+     <span class='ocr_line' id='line_1_14' title="bbox 143 1094 182 1113; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 143 1094 182 1113; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 187 1068 188 1103">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 187 1068 188 1103">
+     <span class='ocr_line' id='line_1_15' title="bbox 187 1068 188 1103; baseline 0 21"><span class='ocrx_word' id='word_1_15' title='bbox 187 1068 188 1103; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 289 1002 291 1037">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 289 1002 291 1037">
+     <span class='ocr_line' id='line_1_16' title="bbox 289 1002 291 1037; baseline 0 87"><span class='ocrx_word' id='word_1_16' title='bbox 289 1002 291 1037; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 239 1028 278 1047">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 239 1028 278 1047">
+     <span class='ocr_line' id='line_1_17' title="bbox 239 1028 278 1047; baseline 0 0"><span class='ocrx_word' id='word_1_17' title='bbox 239 1028 278 1047; x_wconf 88' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 343 417 345 829">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 343 417 345 829">
+     <span class='ocr_line' id='line_1_18' title="bbox 343 417 345 829; baseline 0 295"><span class='ocrx_word' id='word_1_18' title='bbox 343 417 345 829; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 380 161 537 411">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 380 161 537 411">
+     <span class='ocr_line' id='line_1_19' title="bbox 422 161 463 206; baseline 0 -14"><span class='ocrx_word' id='word_1_19' title='bbox 422 161 463 206; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 422 206 463 239; baseline 0 885"><span class='ocrx_word' id='word_1_20' title='bbox 422 206 463 239; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 413 239 467 304; baseline 0 0"><span class='ocrx_word' id='word_1_21' title='bbox 413 239 467 304; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 380 304 500 339; baseline 0 785"><span class='ocrx_word' id='word_1_22' title='bbox 380 304 500 339; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 380 339 537 386; baseline 0 0"><span class='ocrx_word' id='word_1_23' title='bbox 380 339 537 386; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 413 386 507 411; baseline 0 713"><span class='ocrx_word' id='word_1_24' title='bbox 413 386 507 411; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 459 1 1235 458">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 467 1 1235 94">
+     <span class='ocr_line' id='line_1_25' title="bbox 467 1 1094 27; baseline 0 -5"><span class='ocrx_word' id='word_1_25' title='bbox 467 7 497 26; x_wconf 78' lang='eng'><em>_—</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 507 3 706 27; x_wconf 74' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 714 3 809 22; x_wconf 79' lang='eng' dir='ltr'><em>zatmam&#39;i</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 817 3 896 22; x_wconf 92' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 907 1 986 22; x_wconf 84' lang='eng' dir='ltr'><em>12243T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 994 3 1094 27; x_wconf 87' lang='eng' dir='ltr'><em>(L20804)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 551 34 1073 61; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 551 37 750 61; x_wconf 82' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 757 37 863 60; x_wconf 85' lang='eng' dir='ltr'><em>podarium</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 873 34 932 55; x_wconf 82' lang='eng' dir='ltr'><em>FM4T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 941 36 1073 61; x_wconf 86' lang='eng' dir='ltr'><em>(AF514774)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 610 68 1235 94; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 610 70 809 94; x_wconf 77' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 818 70 1024 88; x_wconf 83' lang='eng' dir='ltr'><em>chloromethanicum</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1033 68 1097 88; x_wconf 88' lang='eng' dir='ltr'><em>CM4T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1104 69 1235 94; x_wconf 85' lang='eng' dir='ltr'><em>(AF198624)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 591 100 1121 126">
+     <span class='ocr_line' id='line_1_28' title="bbox 591 100 1121 126; baseline 0 -5"><span class='ocrx_word' id='word_1_39' title='bbox 591 103 791 126; x_wconf 80' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 799 103 907 121; x_wconf 80' lang='eng' dir='ltr'><em>Iusitanum</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 916 100 982 121; x_wconf 92' lang='eng' dir='ltr'><em>RXMT</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 988 102 1121 126; x_wconf 83' lang='eng' dir='ltr'><em>(AY009403)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 459 133 1116 193">
+     <span class='ocr_line' id='line_1_29' title="bbox 459 133 985 175; baseline 0 -21"><span class='ocrx_word' id='word_1_43' title='bbox 459 136 679 175; x_wconf 72' lang='eng' dir='ltr'><em>LMethy/obacterium</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 686 136 755 159; x_wconf 87' lang='eng' dir='ltr'><em>populi</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 763 133 844 154; x_wconf 81' lang='eng' dir='ltr'><em>BJ001T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 852 135 985 160; x_wconf 88' lang='eng' dir='ltr'>(AY251818)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 497 167 1116 193; baseline 0 -5"><span class='ocrx_word' id='word_1_47' title='bbox 497 169 696 193; x_wconf 81' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 705 169 854 193; x_wconf 79' lang='eng' dir='ltr'><em>thiocyanatum</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 862 167 1004 188; x_wconf 76' lang='eng' dir='ltr'><em>ALL/SCN-PT</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1012 169 1116 193; x_wconf 85' lang='eng' dir='ltr'><em>(U58018)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 466 200 1095 226">
+     <span class='ocr_line' id='line_1_31' title="bbox 466 200 1095 226; baseline 0 -5"><span class='ocrx_word' id='word_1_51' title='bbox 466 202 665 226; x_wconf 80' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 674 202 818 221; x_wconf 82' lang='eng' dir='ltr'><em>aminovorans</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 826 202 882 221; x_wconf 90' lang='eng' dir='ltr'><em>CCM</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 891 200 958 221; x_wconf 80' lang='eng' dir='ltr'><em>4612T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 967 202 1095 226; x_wconf 87' lang='eng' dir='ltr'><em>(AJ851086)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 467 233 1069 259">
+     <span class='ocr_line' id='line_1_32' title="bbox 467 233 1069 259; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 467 239 484 241; x_wconf 74' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_57' title='bbox 491 235 691 259; x_wconf 79' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 699 236 824 259; x_wconf 81' lang='eng' dir='ltr'><em>extorquens</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 831 235 882 254; x_wconf 89' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 891 233 957 254; x_wconf 83' lang='eng' dir='ltr'><em>2802T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 966 235 1069 259; x_wconf 86' lang='eng' dir='ltr'><em>(D32224)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 467 268 1109 292">
+     <span class='ocr_line' id='line_1_33' title="bbox 467 268 1109 292; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 467 272 511 274; x_wconf 86' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_63' title='bbox 520 268 719 292; x_wconf 80' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 728 268 874 287; x_wconf 76' lang='eng' dir='ltr'><em>rhodes/anum</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 882 268 932 287; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 941 268 996 287; x_wconf 91' lang='eng'>2810</span> <span class='ocrx_word' id='word_1_67' title='bbox 1005 268 1109 292; x_wconf 85' lang='eng' dir='ltr'><em>(D32228)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 500 299 1032 326">
+     <span class='ocr_line' id='line_1_34' title="bbox 500 299 1032 326; baseline 0 -5"><span class='ocrx_word' id='word_1_68' title='bbox 500 302 699 326; x_wconf 78' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 707 302 829 321; x_wconf 84' lang='eng' dir='ltr'><em>suomiense</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 838 299 891 321; x_wconf 88' lang='eng' dir='ltr'><em>F20T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 900 302 1032 326; x_wconf 86' lang='eng' dir='ltr'><em>(AY009404)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 530 333 1047 359">
+     <span class='ocr_line' id='line_1_35' title="bbox 530 333 1047 359; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 530 335 730 359; x_wconf 80' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 738 335 849 359; x_wconf 87' lang='eng' dir='ltr'><em>salsuginis</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 857 333 906 353; x_wconf 82' lang='eng' dir='ltr'><em>MRT</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 915 334 1047 359; x_wconf 88' lang='eng' dir='ltr'><em>(EF015478)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 541 366 1187 392">
+     <span class='ocr_line' id='line_1_36' title="bbox 541 366 1187 392; baseline -0.002 -5"><span class='ocrx_word' id='word_1_76' title='bbox 541 368 740 392; x_wconf 77' lang='eng' dir='ltr'><em>Methylobacterlum</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 748 368 975 387; x_wconf 79' lang='eng' dir='ltr'><em>dichloromethanicum</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 984 366 1047 386; x_wconf 90' lang='eng' dir='ltr'><em>DM4T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1055 368 1187 392; x_wconf 87' lang='eng' dir='ltr'><em>(AF227128)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 507 399 1065 425">
+     <span class='ocr_line' id='line_1_37' title="bbox 507 399 1065 425; baseline 0 -5"><span class='ocrx_word' id='word_1_80' title='bbox 507 401 706 425; x_wconf 81' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 714 401 819 420; x_wconf 86' lang='eng' dir='ltr'><em>rhodinum</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 827 401 877 420; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 887 399 953 420; x_wconf 82' lang='eng' dir='ltr'><em>2811T</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 962 401 1065 425; x_wconf 83' lang='eng' dir='ltr'><em>(D32229)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 470 432 1151 458">
+     <span class='ocr_line' id='line_1_38' title="bbox 470 432 1151 458; baseline 0.003 -7"><span class='ocrx_word' id='word_1_85' title='bbox 470 432 496 451; x_wconf 84' lang='eng'>99</span> <span class='ocrx_word' id='word_1_86' title='bbox 513 438 570 440; x_wconf 89' lang='eng'>—</span> <span class='ocrx_word' id='word_1_87' title='bbox 579 434 779 458; x_wconf 77' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 787 434 923 453; x_wconf 83' lang='eng' dir='ltr'><em>adhaesivum</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 930 432 1004 453; x_wconf 91' lang='eng' dir='ltr'><em>AR27T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1013 434 1151 458; x_wconf 86' lang='eng' dir='ltr'><em>(AM040156)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 474 7 476 42">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 474 7 476 42">
+     <span class='ocr_line' id='line_1_39' title="bbox 474 7 476 42; baseline 0 1082"><span class='ocrx_word' id='word_1_91' title='bbox 474 7 476 42; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 475 40 542 42">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 475 40 542 42">
+     <span class='ocr_line' id='line_1_40' title="bbox 475 40 542 42; baseline 0 1082"><span class='ocrx_word' id='word_1_92' title='bbox 475 40 542 42; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 465 24 475 274">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 465 24 475 274">
+     <span class='ocr_line' id='line_1_41' title="bbox 465 24 475 274; baseline 0 850"><span class='ocrx_word' id='word_1_93' title='bbox 465 24 475 274; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 462 49 467 274">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 462 49 467 274">
+     <span class='ocr_line' id='line_1_42' title="bbox 462 49 467 274; baseline 0 850"><span class='ocrx_word' id='word_1_94' title='bbox 462 49 467 274; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 465 49 467 274">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 465 49 467 274">
+     <span class='ocr_line' id='line_1_43' title="bbox 465 49 467 274; baseline 0 850"><span class='ocrx_word' id='word_1_95' title='bbox 465 49 467 274; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 401 455 513 457">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 401 455 513 457">
+     <span class='ocr_line' id='line_1_44' title="bbox 401 455 513 457; baseline 0 667"><span class='ocrx_word' id='word_1_96' title='bbox 401 455 513 457; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 382 339 384 498">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 382 339 384 498">
+     <span class='ocr_line' id='line_1_45' title="bbox 382 339 384 498; baseline 0 626"><span class='ocrx_word' id='word_1_97' title='bbox 382 339 384 498; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 382 496 402 498">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 382 496 402 498">
+     <span class='ocr_line' id='line_1_46' title="bbox 382 496 402 498; baseline 0 626"><span class='ocrx_word' id='word_1_98' title='bbox 382 496 402 498; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 401 455 402 539">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 401 455 402 539">
+     <span class='ocr_line' id='line_1_47' title="bbox 401 455 402 539; baseline 0 585"><span class='ocrx_word' id='word_1_99' title='bbox 401 455 402 539; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 511 438 513 473">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 511 438 513 473">
+     <span class='ocr_line' id='line_1_48' title="bbox 511 438 513 473; baseline 0 651"><span class='ocrx_word' id='word_1_100' title='bbox 511 438 513 473; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 513 471 596 473">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 513 471 596 473">
+     <span class='ocr_line' id='line_1_49' title="bbox 513 471 596 473; baseline 0 651"><span class='ocrx_word' id='word_1_101' title='bbox 513 471 596 473; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 605 465 1135 491">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 605 465 1135 491">
+     <span class='ocr_line' id='line_1_50' title="bbox 605 465 1135 491; baseline 0 -5"><span class='ocrx_word' id='word_1_102' title='bbox 605 467 804 491; x_wconf 81' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 813 467 867 486; x_wconf 82' lang='eng' dir='ltr'><em>iners</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 875 465 995 486; x_wconf 79' lang='eng' dir='ltr'><em>53173-33T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1003 467 1135 491; x_wconf 86' lang='eng' dir='ltr'>(EF174497)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 435 498 1119 524">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 435 498 1119 524">
+     <span class='ocr_line' id='line_1_51' title="bbox 435 498 1119 524; baseline 0 -5"><span class='ocrx_word' id='word_1_106' title='bbox 435 504 503 506; x_wconf 90' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_107' title='bbox 512 501 711 524; x_wconf 79' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 720 501 872 524; x_wconf 84' lang='eng' dir='ltr'><em>organophilum</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 880 500 931 519; x_wconf 84' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 940 498 1006 519; x_wconf 82' lang='eng' dir='ltr'><em>2833T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 1015 500 1119 524; x_wconf 86' lang='eng' dir='ltr'><em>(D32226)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 401 538 576 539">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 401 538 576 539">
+     <span class='ocr_line' id='line_1_52' title="bbox 401 538 576 539; baseline 0 585"><span class='ocrx_word' id='word_1_112' title='bbox 401 538 576 539; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 433 504 435 573">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 433 504 435 573">
+     <span class='ocr_line' id='line_1_53' title="bbox 433 504 435 573; baseline 0 551"><span class='ocrx_word' id='word_1_113' title='bbox 433 504 435 573; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 583 531 1134 558">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 583 531 1134 558">
+     <span class='ocr_line' id='line_1_54' title="bbox 583 531 1134 558; baseline 0 -6"><span class='ocrx_word' id='word_1_114' title='bbox 583 534 782 558; x_wconf 80' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 787 534 872 558; x_wconf 81' lang='eng' dir='ltr'><em>jeotgali</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 879 531 988 552; x_wconf 64' lang='eng' dir='ltr'><em>SZROGl-QT</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 997 533 1134 558; x_wconf 81' lang='eng' dir='ltr'><em>(DQ471331)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 433 571 684 573">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 433 571 684 573">
+     <span class='ocr_line' id='line_1_55' title="bbox 433 571 684 573; baseline 0 551"><span class='ocrx_word' id='word_1_118' title='bbox 433 571 684 573; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 413 579 440 598">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 413 579 440 598">
+     <span class='ocr_line' id='line_1_56' title="bbox 413 579 440 598; baseline 0 0"><span class='ocrx_word' id='word_1_119' title='bbox 413 579 440 598; x_wconf 87' lang='eng'>59</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 343 828 414 829">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 343 828 414 829">
+     <span class='ocr_line' id='line_1_57' title="bbox 343 828 414 829; baseline 0 295"><span class='ocrx_word' id='word_1_120' title='bbox 343 828 414 829; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 307 624 309 921">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 307 624 309 921">
+     <span class='ocr_line' id='line_1_58' title="bbox 307 624 309 921; baseline 0 203"><span class='ocrx_word' id='word_1_121' title='bbox 307 624 309 921; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 412 803 414 854">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 412 803 414 854">
+     <span class='ocr_line' id='line_1_59' title="bbox 412 803 414 854; baseline 0 270"><span class='ocrx_word' id='word_1_122' title='bbox 412 803 414 854; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 414 803 494 805">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 414 803 494 805">
+     <span class='ocr_line' id='line_1_60' title="bbox 414 803 494 805; baseline 0 319"><span class='ocrx_word' id='word_1_123' title='bbox 414 803 494 805; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 444 564 1299 856">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 444 564 1247 631">
+     <span class='ocr_line' id='line_1_61' title="bbox 692 564 1247 590; baseline 0 -5"><span class='ocrx_word' id='word_1_124' title='bbox 692 566 891 590; x_wconf 80' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 899 566 1026 590; x_wconf 76' lang='eng' dir='ltr'><em>h/spanicum</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 1035 564 1110 585; x_wconf 89' lang='eng' dir='ltr'><em>GP34T</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 1119 566 1247 590; x_wconf 83' lang='eng' dir='ltr'><em>(AJ635304)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 444 598 1227 631; baseline 0 -12"><span class='ocrx_word' id='word_1_128' title='bbox 444 613 470 631; x_wconf 77' lang='eng'><em>52</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 639 600 838 624; x_wconf 81' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 846 600 958 619; x_wconf 82' lang='eng' dir='ltr'><em>aero/atum</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 967 598 1087 619; x_wconf 82' lang='eng' dir='ltr'><em>54133-11T</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 1095 599 1227 624; x_wconf 84' lang='eng' dir='ltr'><em>(EF174498)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 475 631 1237 696">
+     <span class='ocr_line' id='line_1_63' title="bbox 475 631 1237 665; baseline 0 -13"><span class='ocrx_word' id='word_1_133' title='bbox 475 646 501 665; x_wconf 75' lang='eng'><em>64</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 629 633 828 657; x_wconf 81' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 836 633 991 657; x_wconf 85' lang='eng' dir='ltr'><em>mesophi/icum</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 999 633 1049 652; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 1058 631 1125 652; x_wconf 80' lang='eng' dir='ltr'><em>2829T</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 1134 633 1237 657; x_wconf 86' lang='eng' dir='ltr'><em>(D32225)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 505 664 1237 696; baseline 0 -11"><span class='ocrx_word' id='word_1_139' title='bbox 505 677 531 696; x_wconf 77' lang='eng'><strong>86</strong></span> <span class='ocrx_word' id='word_1_140' title='bbox 609 666 808 690; x_wconf 80' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 817 666 962 690; x_wconf 85' lang='eng' dir='ltr'><em>fujisawaense</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 971 666 1024 685; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 1034 664 1100 685; x_wconf 83' lang='eng' dir='ltr'><em>5686T</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 1109 666 1237 690; x_wconf 88' lang='eng' dir='ltr'><em>(AJ250801)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 551 697 1299 790">
+     <span class='ocr_line' id='line_1_65' title="bbox 551 697 1228 728; baseline 0 -10"><span class='ocrx_word' id='word_1_145' title='bbox 551 709 577 728; x_wconf 77' lang='eng'><em>85</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 629 700 828 723; x_wconf 81' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 836 700 982 718; x_wconf 80' lang='eng' dir='ltr'><em>radioto/erans</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 990 699 1040 718; x_wconf 92' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 1050 697 1116 718; x_wconf 81' lang='eng' dir='ltr'><em>2831T</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 1125 699 1228 723; x_wconf 86' lang='eng' dir='ltr'><em>(D32227)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_66' title="bbox 626 731 1299 757; baseline -0.001 -5"><span class='ocrx_word' id='word_1_151' title='bbox 626 733 843 757; x_wconf 83' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 850 733 1037 757; x_wconf 85' lang='eng' dir='ltr'><em>phyllosphaerae</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 1045 731 1160 752; x_wconf 88' lang='eng' dir='ltr'><em>CBMB27T</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 1168 732 1299 757; x_wconf 85' lang='eng' dir='ltr'><em>(EF126746)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 567 763 1156 790; baseline 0 -5"><span class='ocrx_word' id='word_1_155' title='bbox 567 763 593 782; x_wconf 90' lang='eng'><em>54</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 612 766 811 790; x_wconf 84' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 819 771 895 790; x_wconf 86' lang='eng' dir='ltr'><em>oryzae</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 903 764 1014 785; x_wconf 81' lang='eng' dir='ltr'><em>CBMBZOT</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 1023 766 1156 790; x_wconf 83' lang='eng' dir='ltr'><em>(AY683045)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 448 797 1067 856">
+     <span class='ocr_line' id='line_1_68' title="bbox 502 797 1011 823; baseline 0 -5"><span class='ocrx_word' id='word_1_160' title='bbox 502 799 701 823; x_wconf 74' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 711 799 803 818; x_wconf 84' lang='eng' dir='ltr'><em>variabi/e</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 811 797 874 818; x_wconf 84' lang='eng' dir='ltr'><em>GR3T</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 882 799 1011 823; x_wconf 85' lang='eng' dir='ltr'><em>(AJ851087)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_69' title="bbox 448 830 1067 856; baseline 0.002 -6"><span class='ocrx_word' id='word_1_164' title='bbox 448 836 513 837; x_wconf 41' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 522 832 721 856; x_wconf 81' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 730 832 845 855; x_wconf 81' lang='eng' dir='ltr'><em>aquat/cum</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 854 830 930 851; x_wconf 82' lang='eng' dir='ltr'><em>GR16T</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 939 832 1067 856; x_wconf 87' lang='eng' dir='ltr'><em>(AJ635303)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 460 538 462 606">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 460 538 462 606">
+     <span class='ocr_line' id='line_1_70' title="bbox 460 538 462 606; baseline 0 518"><span class='ocrx_word' id='word_1_169' title='bbox 460 538 462 606; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 460 604 630 606">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 460 604 630 606">
+     <span class='ocr_line' id='line_1_71' title="bbox 460 604 630 606; baseline 0 518"><span class='ocrx_word' id='word_1_170' title='bbox 460 604 630 606; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 481 571 483 639">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 481 571 483 639">
+     <span class='ocr_line' id='line_1_72' title="bbox 481 571 483 639; baseline 0 485"><span class='ocrx_word' id='word_1_171' title='bbox 481 571 483 639; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 481 637 620 639">
+    <p class='ocr_par' dir='ltr' id='par_1_60' title="bbox 481 637 620 639">
+     <span class='ocr_line' id='line_1_73' title="bbox 481 637 620 639; baseline 0 485"><span class='ocrx_word' id='word_1_172' title='bbox 481 637 620 639; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 516 604 518 671">
+    <p class='ocr_par' dir='ltr' id='par_1_61' title="bbox 516 604 518 671">
+     <span class='ocr_line' id='line_1_74' title="bbox 516 604 518 671; baseline 0 453"><span class='ocrx_word' id='word_1_173' title='bbox 516 604 518 671; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 516 669 547 671">
+    <p class='ocr_par' dir='ltr' id='par_1_62' title="bbox 516 669 547 671">
+     <span class='ocr_line' id='line_1_75' title="bbox 516 669 547 671; baseline 0 453"><span class='ocrx_word' id='word_1_174' title='bbox 516 669 547 671; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 545 637 547 700">
+    <p class='ocr_par' dir='ltr' id='par_1_63' title="bbox 545 637 547 700">
+     <span class='ocr_line' id='line_1_76' title="bbox 545 637 547 700; baseline 0 424"><span class='ocrx_word' id='word_1_175' title='bbox 545 637 547 700; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 412 852 448 854">
+    <p class='ocr_par' dir='ltr' id='par_1_64' title="bbox 412 852 448 854">
+     <span class='ocr_line' id='line_1_77' title="bbox 412 852 448 854; baseline 0 270"><span class='ocrx_word' id='word_1_176' title='bbox 412 852 448 854; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 413 862 440 881">
+    <p class='ocr_par' dir='ltr' id='par_1_65' title="bbox 413 862 440 881">
+     <span class='ocr_line' id='line_1_78' title="bbox 413 862 440 881; baseline 0 0"><span class='ocrx_word' id='word_1_177' title='bbox 413 862 440 881; x_wconf 89' lang='eng'>88</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 307 919 419 921">
+    <p class='ocr_par' dir='ltr' id='par_1_66' title="bbox 307 919 419 921">
+     <span class='ocr_line' id='line_1_79' title="bbox 307 919 419 921; baseline 0 203"><span class='ocrx_word' id='word_1_178' title='bbox 307 919 419 921; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 291 1035 380 1037">
+    <p class='ocr_par' dir='ltr' id='par_1_67' title="bbox 291 1035 380 1037">
+     <span class='ocr_line' id='line_1_80' title="bbox 291 1035 380 1037; baseline 0 87"><span class='ocrx_word' id='word_1_179' title='bbox 291 1035 380 1037; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 369 929 407 948">
+    <p class='ocr_par' dir='ltr' id='par_1_68' title="bbox 369 929 407 948">
+     <span class='ocr_line' id='line_1_81' title="bbox 369 929 407 948; baseline 0.026 -1"><span class='ocrx_word' id='word_1_180' title='bbox 369 929 407 948; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 417 902 419 937">
+    <p class='ocr_par' dir='ltr' id='par_1_69' title="bbox 417 902 419 937">
+     <span class='ocr_line' id='line_1_82' title="bbox 417 902 419 937; baseline 0 187"><span class='ocrx_word' id='word_1_181' title='bbox 417 902 419 937; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 447 836 448 871">
+    <p class='ocr_par' dir='ltr' id='par_1_70' title="bbox 447 836 448 871">
+     <span class='ocr_line' id='line_1_83' title="bbox 447 836 448 871; baseline 0 253"><span class='ocrx_word' id='word_1_182' title='bbox 447 836 448 871; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_58' title="bbox 448 863 1021 889">
+    <p class='ocr_par' dir='ltr' id='par_1_71' title="bbox 448 863 1021 889">
+     <span class='ocr_line' id='line_1_84' title="bbox 448 863 1021 889; baseline -0.002 -5"><span class='ocrx_word' id='word_1_183' title='bbox 448 869 490 871; x_wconf 86' lang='eng'>—</span> <span class='ocrx_word' id='word_1_184' title='bbox 498 865 697 889; x_wconf 80' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 705 865 781 889; x_wconf 87' lang='eng' dir='ltr'><em>platani</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 788 863 881 884; x_wconf 80' lang='eng' dir='ltr'><em>PMBOZT</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 890 865 1021 889; x_wconf 83' lang='eng' dir='ltr'><em>(EF426729)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_59' title="bbox 419 896 1011 922">
+    <p class='ocr_par' dir='ltr' id='par_1_72' title="bbox 419 896 1011 922">
+     <span class='ocr_line' id='line_1_85' title="bbox 419 896 1011 922; baseline 0 -5"><span class='ocrx_word' id='word_1_188' title='bbox 419 902 473 904; x_wconf 88' lang='eng'>—</span> <span class='ocrx_word' id='word_1_189' title='bbox 481 898 681 922; x_wconf 80' lang='eng' dir='ltr'><em>Methy/obacterium</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 689 898 792 917; x_wconf 83' lang='eng' dir='ltr'><em>isbi/iense</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 800 896 874 917; x_wconf 87' lang='eng' dir='ltr'><em>AR24T</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 883 898 1011 922; x_wconf 85' lang='eng' dir='ltr'><em>(AJ888239)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_60' title="bbox 468 930 1130 1022">
+    <p class='ocr_par' dir='ltr' id='par_1_73' title="bbox 468 930 1130 1022">
+     <span class='ocr_line' id='line_1_86' title="bbox 544 930 1130 956; baseline 0 -6"><span class='ocrx_word' id='word_1_193' title='bbox 544 932 743 956; x_wconf 79' lang='eng' dir='ltr'><em>Methylobacterium</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 752 932 853 950; x_wconf 87' lang='eng' dir='ltr'><em>nodulans</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 861 931 915 950; x_wconf 87' lang='eng' dir='ltr'><em>ORS</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 924 930 990 950; x_wconf 76' lang='eng' dir='ltr'><em>2060T</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 998 931 1130 955; x_wconf 85' lang='eng' dir='ltr'><em>(AF220783)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_87' title="bbox 468 963 1010 989; baseline -0.002 -5"><span class='ocrx_word' id='word_1_198' title='bbox 468 965 647 989; x_wconf 84' lang='eng' dir='ltr'><em>Methylorhabdus</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 655 965 784 984; x_wconf 79' lang='eng' dir='ltr'><em>multlvorans</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 793 963 870 984; x_wconf 81' lang='eng' dir='ltr'><em>DM13T</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 879 965 1010 989; x_wconf 87' lang='eng' dir='ltr'><em>(AF004845)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_88' title="bbox 497 996 1008 1022; baseline 0 -5"><span class='ocrx_word' id='word_1_202' title='bbox 497 998 612 1017; x_wconf 78' lang='eng' dir='ltr'><em>Albibacter</em></span> <span class='ocrx_word' id='word_1_203' title='bbox 618 998 782 1022; x_wconf 81' lang='eng' dir='ltr'><em>methy/ovorans</em></span> <span class='ocrx_word' id='word_1_204' title='bbox 791 996 868 1017; x_wconf 91' lang='eng' dir='ltr'><em>DM10T</em></span> <span class='ocrx_word' id='word_1_205' title='bbox 877 998 1008 1022; x_wconf 83' lang='eng' dir='ltr'><em>(AF273213)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_61' title="bbox 390 1029 833 1055">
+    <p class='ocr_par' dir='ltr' id='par_1_74' title="bbox 390 1029 833 1055">
+     <span class='ocr_line' id='line_1_89' title="bbox 390 1029 833 1055; baseline 0 -5"><span class='ocrx_word' id='word_1_206' title='bbox 390 1031 516 1055; x_wconf 81' lang='eng' dir='ltr'><em>Methylopi/a</em></span> <span class='ocrx_word' id='word_1_207' title='bbox 525 1031 632 1055; x_wconf 77' lang='eng' dir='ltr'><em>capsu/ata</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 642 1029 693 1050; x_wconf 92' lang='eng' dir='ltr'><em>|M1T</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 702 1031 833 1055; x_wconf 91' lang='eng' dir='ltr'><em>(AF004844)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_62' title="bbox 478 1062 1132 1121">
+    <p class='ocr_par' dir='ltr' id='par_1_75' title="bbox 478 1062 1132 1121">
+     <span class='ocr_line' id='line_1_90' title="bbox 693 1062 1132 1088; baseline 0 -5"><span class='ocrx_word' id='word_1_210' title='bbox 693 1064 845 1088; x_wconf 83' lang='eng' dir='ltr'><em>Methy/ocystis</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 852 1069 928 1088; x_wconf 87' lang='eng' dir='ltr'><em>parvus</em></span> <span class='ocrx_word' id='word_1_212' title='bbox 936 1062 1017 1083; x_wconf 92' lang='eng' dir='ltr'><em>OBBPT</em></span> <span class='ocrx_word' id='word_1_213' title='bbox 1025 1064 1132 1088; x_wconf 84' lang='eng' dir='ltr'><em>(M29026)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_91' title="bbox 478 1095 983 1121; baseline 0 -5"><span class='ocrx_word' id='word_1_214' title='bbox 478 1097 625 1121; x_wconf 80' lang='eng' dir='ltr'><em>Methy/osinus</em></span> <span class='ocrx_word' id='word_1_215' title='bbox 633 1097 784 1121; x_wconf 83' lang='eng' dir='ltr'><em>trichosporium</em></span> <span class='ocrx_word' id='word_1_216' title='bbox 793 1095 867 1116; x_wconf 73' lang='eng' dir='ltr'><em>OBSbT</em></span> <span class='ocrx_word' id='word_1_217' title='bbox 877 1097 983 1121; x_wconf 84' lang='eng' dir='ltr'><em>(M29024)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001719-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001719-0-001.pbm.png
new file mode 100644
index 00000000..c2364202
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001719-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001719-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001719-0-001.pbm.png.hocr
new file mode 100644
index 00000000..ddb1f99f
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001719-0-001.pbm.png.hocr
@@ -0,0 +1,130 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001719-0-001.pbm.png"; bbox 0 0 994 831; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 156 395 182 409">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 156 395 182 409">
+     <span class='ocr_line' id='line_1_1' title="bbox 156 395 182 409; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 156 395 182 409; x_wconf 61' lang='eng' dir='ltr'><em>6m</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 188 207 190 618">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 188 207 190 618">
+     <span class='ocr_line' id='line_1_2' title="bbox 188 207 190 618; baseline 0 213"><span class='ocrx_word' id='word_1_2' title='bbox 188 207 190 618; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 206 597 243 611">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 206 597 243 611">
+     <span class='ocr_line' id='line_1_3' title="bbox 206 597 243 611; baseline 0.027 -1"><span class='ocrx_word' id='word_1_3' title='bbox 206 597 243 611; x_wconf 62' lang='eng'>1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 305 12 947 38">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 305 12 947 38">
+     <span class='ocr_line' id='line_1_4' title="bbox 305 12 947 38; baseline 0 -5"><span class='ocrx_word' id='word_1_4' title='bbox 305 13 496 33; x_wconf 81' lang='eng' dir='ltr'><em>—Clostridium</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 506 13 610 38; x_wconf 83' lang='eng' dir='ltr'><em>hungatei</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 616 13 686 33; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 696 12 796 33; x_wconf 77' lang='eng' dir='ltr'><em>700212T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 805 13 947 38; x_wconf 86' lang='eng' dir='ltr'><em>(AF020429)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 338 91 860 117">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 338 91 860 117">
+     <span class='ocr_line' id='line_1_5' title="bbox 338 91 860 117; baseline 0 -5"><span class='ocrx_word' id='word_1_9' title='bbox 338 91 487 112; x_wconf 85' lang='eng' dir='ltr'><em>-Clostridium</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 497 92 605 112; x_wconf 82' lang='eng' dir='ltr'><em>termitidis</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 614 91 671 112; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 682 92 740 112; x_wconf 81' lang='eng'><em>5396</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 751 91 860 117; x_wconf 87' lang='eng' dir='ltr'>(X71854)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 303 24 305 144">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 303 24 305 144">
+     <span class='ocr_line' id='line_1_6' title="bbox 303 24 305 144; baseline 0 687"><span class='ocrx_word' id='word_1_14' title='bbox 303 24 305 144; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 303 142 339 144">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 303 142 339 144">
+     <span class='ocr_line' id='line_1_7' title="bbox 303 142 339 144; baseline 0 687"><span class='ocrx_word' id='word_1_15' title='bbox 303 142 339 144; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 308 148 942 195">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 308 148 942 195">
+     <span class='ocr_line' id='line_1_8' title="bbox 308 148 339 162; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 308 148 339 162; x_wconf 83' lang='eng' dir='ltr'><em>ooo</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 339 169 942 195; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 339 182 359 184; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_18' title='bbox 365 170 499 190; x_wconf 78' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 508 170 676 195; x_wconf 79' lang='eng' dir='ltr'><em>cellobioparum</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 686 170 743 190; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 756 169 823 190; x_wconf 79' lang='eng' dir='ltr'><em>1351T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 832 170 942 195; x_wconf 85' lang='eng' dir='ltr'>(X71856)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 337 104 339 184">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 337 104 339 184">
+     <span class='ocr_line' id='line_1_10' title="bbox 337 104 339 184; baseline 0 647"><span class='ocrx_word' id='word_1_23' title='bbox 337 104 339 184; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 253 189 291 202">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 253 189 291 202">
+     <span class='ocr_line' id='line_1_11' title="bbox 253 189 291 202; baseline 0 0"><span class='ocrx_word' id='word_1_24' title='bbox 253 189 291 202; x_wconf 83' lang='eng'>1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 372 249 955 275">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 372 249 955 275">
+     <span class='ocr_line' id='line_1_12' title="bbox 372 249 955 275; baseline -0.002 -5"><span class='ocrx_word' id='word_1_25' title='bbox 372 249 505 270; x_wconf 84' lang='eng' dir='ltr'><em>Clostn&#39;dium</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 513 250 690 275; x_wconf 86' lang='eng' dir='ltr'><em>papyroso/vens</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 699 249 756 270; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 767 249 836 270; x_wconf 73' lang='eng' dir='ltr'><em>2782T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 846 249 955 275; x_wconf 86' lang='eng' dir='ltr'>(X71852)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 405 324 688 355">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 405 324 688 355">
+     <span class='ocr_line' id='line_1_13' title="bbox 405 324 688 355; baseline 0.004 -7"><span class='ocrx_word' id='word_1_30' title='bbox 405 324 506 349; x_wconf 78' lang='eng' dir='ltr'><em>CDT-1T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 517 325 688 355; x_wconf 82' lang='eng' dir='ltr'><em>(A3267266)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 292 406 923 432">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 292 406 923 432">
+     <span class='ocr_line' id='line_1_14' title="bbox 292 406 923 432; baseline 0 -5"><span class='ocrx_word' id='word_1_32' title='bbox 292 406 321 419; x_wconf 67' lang='eng'><em>726</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 384 407 518 427; x_wconf 84' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 523 407 583 432; x_wconf 87' lang='eng' dir='ltr'><em>josui</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 592 407 665 427; x_wconf 83' lang='eng' dir='ltr'>FERM</span> <span class='ocrx_word' id='word_1_36' title='bbox 677 406 772 427; x_wconf 82' lang='eng' dir='ltr'><em>P-9684T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 782 407 923 432; x_wconf 82' lang='eng' dir='ltr'><em>(ABO11OS7)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 321 468 993 512">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 321 468 993 512">
+     <span class='ocr_line' id='line_1_15' title="bbox 321 468 359 482; baseline 0.026 -1"><span class='ocrx_word' id='word_1_38' title='bbox 321 468 359 482; x_wconf 83' lang='eng'>1000</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 398 486 993 512; baseline -0.002 -5"><span class='ocrx_word' id='word_1_39' title='bbox 398 486 531 507; x_wconf 80' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 541 487 702 512; x_wconf 78' lang='eng' dir='ltr'><em>cellu/o/yﬂcum</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 708 486 779 507; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 790 486 874 507; x_wconf 77' lang='eng' dir='ltr'><em>35319T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 883 486 993 512; x_wconf 86' lang='eng' dir='ltr'>(X71847)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 252 564 846 591">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 252 564 846 591">
+     <span class='ocr_line' id='line_1_17' title="bbox 252 564 846 591; baseline 0 -6"><span class='ocrx_word' id='word_1_44' title='bbox 252 565 397 585; x_wconf 81' lang='eng' dir='ltr'><em>—Acetivibrio</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 406 565 558 591; x_wconf 79' lang='eng' dir='ltr'><em>cellu/o/yticus</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 565 565 635 585; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 646 564 730 585; x_wconf 81' lang='eng' dir='ltr'><em>33288T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 739 565 846 591; x_wconf 84' lang='eng' dir='ltr'><em>(L35516)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 250 577 252 658">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 250 577 252 658">
+     <span class='ocr_line' id='line_1_18' title="bbox 250 577 252 658; baseline 0 173"><span class='ocrx_word' id='word_1_49' title='bbox 250 577 252 658; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 252 643 855 749">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 252 643 855 749">
+     <span class='ocr_line' id='line_1_19' title="bbox 252 643 784 669; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 252 644 417 664; x_wconf 84' lang='eng' dir='ltr'><em>—C/ostridium</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 427 644 520 664; x_wconf 83' lang='eng' dir='ltr'><em>aldrichii</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 528 644 585 664; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 595 643 664 664; x_wconf 82' lang='eng' dir='ltr'><em>6159T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 674 644 784 669; x_wconf 83' lang='eng' dir='ltr'>(X71846)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 286 723 855 749; baseline -0.002 -5"><span class='ocrx_word' id='word_1_55' title='bbox 286 724 420 744; x_wconf 87' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 429 724 592 744; x_wconf 83' lang='eng' dir='ltr'><em>thermoce/lum</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 602 724 658 744; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 671 723 738 744; x_wconf 76' lang='eng' dir='ltr'><em>1237T</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 748 724 855 749; x_wconf 85' lang='eng' dir='ltr'>(L09173)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 306 801 775 828">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 306 801 775 828">
+     <span class='ocr_line' id='line_1_21' title="bbox 306 801 775 828; baseline 0 -6"><span class='ocrx_word' id='word_1_60' title='bbox 306 802 398 822; x_wconf 80' lang='eng' dir='ltr'><em>Bacillus</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 407 802 489 822; x_wconf 83' lang='eng' dir='ltr'><em>subtilis</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 499 802 576 822; x_wconf 91' lang='eng' dir='ltr'><em>NCDO</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 588 801 655 822; x_wconf 73' lang='eng' dir='ltr'><em>1769T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 665 802 775 828; x_wconf 83' lang='eng' dir='ltr'><em>(X60646)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001743-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001743-0-000.pbm.png
new file mode 100644
index 00000000..181e643e
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001743-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001743-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001743-0-000.pbm.png.hocr
new file mode 100644
index 00000000..e4769f4b
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001743-0-000.pbm.png.hocr
@@ -0,0 +1,670 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001743-0-000.pbm.png"; bbox 0 0 1479 1660; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 173 8 206 24">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 173 8 206 24">
+     <span class='ocr_line' id='line_1_1' title="bbox 173 8 206 24; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 173 8 206 24; x_wconf 86' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 21 32 213 34">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 21 32 213 34">
+     <span class='ocr_line' id='line_1_2' title="bbox 21 32 213 34; baseline 0 1626"><span class='ocrx_word' id='word_1_2' title='bbox 21 32 213 34; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 21 32 23 618">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 21 32 23 618">
+     <span class='ocr_line' id='line_1_3' title="bbox 21 32 23 618; baseline 0 1042"><span class='ocrx_word' id='word_1_3' title='bbox 21 32 23 618; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 211 11 213 56">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 211 11 213 56">
+     <span class='ocr_line' id='line_1_4' title="bbox 211 11 213 56; baseline 0 1604"><span class='ocrx_word' id='word_1_4' title='bbox 211 11 213 56; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 223 174 245 190">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 223 174 245 190">
+     <span class='ocr_line' id='line_1_5' title="bbox 223 174 245 190; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 223 174 245 190; x_wconf 81' lang='eng'><em>78</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 357 126 390 142">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 357 126 390 142">
+     <span class='ocr_line' id='line_1_6' title="bbox 357 126 390 142; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 357 126 390 142; x_wconf 88' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 346 0 1018 69">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 346 0 1018 69">
+     <span class='ocr_line' id='line_1_7' title="bbox 438 0 1018 26; baseline 0 -5"><span class='ocrx_word' id='word_1_7' title='bbox 438 1 601 21; x_wconf 84' lang='eng' dir='ltr'><em>Cel/u/omonas</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 610 1 717 26; x_wconf 83' lang='eng' dir='ltr'><em>flavigena</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 728 1 812 21; x_wconf 91' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 822 0 892 21; x_wconf 79' lang='eng' dir='ltr'><em>8073T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 909 1 1018 26; x_wconf 82' lang='eng' dir='ltr'><strong>(X79463)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 346 43 896 69; baseline 0 -5"><span class='ocrx_word' id='word_1_12' title='bbox 346 44 509 64; x_wconf 84' lang='eng' dir='ltr'><em>Ce/lu/omonas</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 517 44 615 64; x_wconf 84' lang='eng' dir='ltr'><em>ce/Iasea</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 627 44 683 64; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 693 43 778 64; x_wconf 74' lang='eng' dir='ltr'><em>20118T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 787 44 896 69; x_wconf 88' lang='eng' dir='ltr'><em>(X83804)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 426 94 459 110">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 426 94 459 110">
+     <span class='ocr_line' id='line_1_9' title="bbox 426 94 459 110; baseline 0 0"><span class='ocrx_word' id='word_1_17' title='bbox 426 94 459 110; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 395 118 466 120">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 395 118 466 120">
+     <span class='ocr_line' id='line_1_10' title="bbox 395 118 466 120; baseline 0 1540"><span class='ocrx_word' id='word_1_18' title='bbox 395 118 466 120; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 251 150 397 152">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 251 150 397 152">
+     <span class='ocr_line' id='line_1_11' title="bbox 251 150 397 152; baseline 0 1508"><span class='ocrx_word' id='word_1_19' title='bbox 251 150 397 152; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 217 199 253 201">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 217 199 253 201">
+     <span class='ocr_line' id='line_1_12' title="bbox 217 199 253 201; baseline 0 1459"><span class='ocrx_word' id='word_1_20' title='bbox 217 199 253 201; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 217 199 219 314">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 217 199 219 314">
+     <span class='ocr_line' id='line_1_13' title="bbox 217 199 219 314; baseline 0 1346"><span class='ocrx_word' id='word_1_21' title='bbox 217 199 219 314; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 119 406 186 408">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 119 406 186 408">
+     <span class='ocr_line' id='line_1_14' title="bbox 119 406 186 408; baseline 0 1252"><span class='ocrx_word' id='word_1_22' title='bbox 119 406 186 408; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 21 616 121 618">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 21 616 121 618">
+     <span class='ocr_line' id='line_1_15' title="bbox 21 616 121 618; baseline 0 1042"><span class='ocrx_word' id='word_1_23' title='bbox 21 616 121 618; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 91 628 113 644">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 91 628 113 644">
+     <span class='ocr_line' id='line_1_16' title="bbox 91 628 113 644; baseline 0 0"><span class='ocrx_word' id='word_1_24' title='bbox 91 628 113 644; x_wconf 68' lang='eng' dir='ltr'><em>SB</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 119 406 121 829">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 119 406 121 829">
+     <span class='ocr_line' id='line_1_17' title="bbox 119 406 121 829; baseline 0 831"><span class='ocrx_word' id='word_1_25' title='bbox 119 406 121 829; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 184 316 186 499">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 184 316 186 499">
+     <span class='ocr_line' id='line_1_18' title="bbox 184 316 186 499; baseline 0 1161"><span class='ocrx_word' id='word_1_26' title='bbox 184 316 186 499; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 251 150 253 249">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 251 150 253 249">
+     <span class='ocr_line' id='line_1_19' title="bbox 251 150 253 249; baseline 0 1411"><span class='ocrx_word' id='word_1_27' title='bbox 251 150 253 249; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 251 247 282 249">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 251 247 282 249">
+     <span class='ocr_line' id='line_1_20' title="bbox 251 247 282 249; baseline 0 1411"><span class='ocrx_word' id='word_1_28' title='bbox 251 247 282 249; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 280 225 282 270">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 280 225 282 270">
+     <span class='ocr_line' id='line_1_21' title="bbox 280 225 282 270; baseline 0 1390"><span class='ocrx_word' id='word_1_29' title='bbox 280 225 282 270; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 252 258 273 274">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 252 258 273 274">
+     <span class='ocr_line' id='line_1_22' title="bbox 252 258 273 274; baseline 0 0"><span class='ocrx_word' id='word_1_30' title='bbox 252 258 273 274; x_wconf 83' lang='eng'><strong>79</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 318 354 319 399">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 318 354 319 399">
+     <span class='ocr_line' id='line_1_23' title="bbox 318 354 319 399; baseline 0 1261"><span class='ocrx_word' id='word_1_31' title='bbox 318 354 319 399; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 289 387 311 403">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 289 387 311 403">
+     <span class='ocr_line' id='line_1_24' title="bbox 289 387 311 403; baseline 0 0"><span class='ocrx_word' id='word_1_32' title='bbox 289 387 311 403; x_wconf 82' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 253 480 275 497">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 253 480 275 497">
+     <span class='ocr_line' id='line_1_25' title="bbox 253 480 275 497; baseline 0 0"><span class='ocrx_word' id='word_1_33' title='bbox 253 480 275 497; x_wconf 86' lang='eng'><em>96</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 221 505 283 507">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 221 505 283 507">
+     <span class='ocr_line' id='line_1_26' title="bbox 221 505 283 507; baseline 0 1153"><span class='ocrx_word' id='word_1_34' title='bbox 221 505 283 507; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 197 440 199 555">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 197 440 199 555">
+     <span class='ocr_line' id='line_1_27' title="bbox 197 440 199 555; baseline 0 1105"><span class='ocrx_word' id='word_1_35' title='bbox 197 440 199 555; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 197 553 223 555">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 197 553 223 555">
+     <span class='ocr_line' id='line_1_28' title="bbox 197 553 223 555; baseline 0 1105"><span class='ocrx_word' id='word_1_36' title='bbox 197 553 223 555; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 221 505 223 604">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 221 505 223 604">
+     <span class='ocr_line' id='line_1_29' title="bbox 221 505 223 604; baseline 0 1056"><span class='ocrx_word' id='word_1_37' title='bbox 221 505 223 604; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 226 771 248 787">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 226 771 248 787">
+     <span class='ocr_line' id='line_1_30' title="bbox 226 771 248 787; baseline 0 0"><span class='ocrx_word' id='word_1_38' title='bbox 226 771 248 787; x_wconf 81' lang='eng'><em>99</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 281 483 283 528">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 281 483 283 528">
+     <span class='ocr_line' id='line_1_31' title="bbox 281 483 283 528; baseline 0 1132"><span class='ocrx_word' id='word_1_39' title='bbox 281 483 283 528; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 344 613 374 629">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 344 613 374 629">
+     <span class='ocr_line' id='line_1_32' title="bbox 344 613 374 629; baseline 0 0"><span class='ocrx_word' id='word_1_40' title='bbox 344 613 374 629; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 275 739 297 755">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 275 739 297 755">
+     <span class='ocr_line' id='line_1_33' title="bbox 275 739 297 755; baseline 0 0"><span class='ocrx_word' id='word_1_41' title='bbox 275 739 297 755; x_wconf 82' lang='eng'><strong>98</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 255 763 305 765">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 255 763 305 765">
+     <span class='ocr_line' id='line_1_34' title="bbox 255 763 305 765; baseline 0 895"><span class='ocrx_word' id='word_1_42' title='bbox 255 763 305 765; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 303 741 305 786">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 303 741 305 786">
+     <span class='ocr_line' id='line_1_35' title="bbox 303 741 305 786; baseline 0 874"><span class='ocrx_word' id='word_1_43' title='bbox 303 741 305 786; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 159 795 257 797">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 159 795 257 797">
+     <span class='ocr_line' id='line_1_36' title="bbox 159 795 257 797; baseline 0 863"><span class='ocrx_word' id='word_1_44' title='bbox 159 795 257 797; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 255 763 257 829">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 255 763 257 829">
+     <span class='ocr_line' id='line_1_37' title="bbox 255 763 257 829; baseline 0 831"><span class='ocrx_word' id='word_1_45' title='bbox 255 763 257 829; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 319 354 390 356">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 319 354 390 356">
+     <span class='ocr_line' id='line_1_38' title="bbox 319 354 390 356; baseline 0 1304"><span class='ocrx_word' id='word_1_46' title='bbox 319 354 390 356; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 395 118 397 185">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 395 118 397 185">
+     <span class='ocr_line' id='line_1_39' title="bbox 395 118 397 185; baseline 0 1475"><span class='ocrx_word' id='word_1_47' title='bbox 395 118 397 185; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 397 183 499 185">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 397 183 499 185">
+     <span class='ocr_line' id='line_1_40' title="bbox 397 183 499 185; baseline 0 1475"><span class='ocrx_word' id='word_1_48' title='bbox 397 183 499 185; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 464 96 466 141">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 464 96 466 141">
+     <span class='ocr_line' id='line_1_41' title="bbox 464 96 466 141; baseline 0 1519"><span class='ocrx_word' id='word_1_49' title='bbox 464 96 466 141; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 466 86 1125 198">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 466 86 1125 198">
+     <span class='ocr_line' id='line_1_42' title="bbox 466 86 1086 112; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 466 96 497 98; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_51' title='bbox 506 87 690 107; x_wconf 74' lang='eng' dir='ltr'><em>Microbacterium</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 699 87 807 107; x_wconf 82' lang='eng' dir='ltr'><em>sch/eiferi</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 816 87 872 107; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 883 86 967 107; x_wconf 83' lang='eng' dir='ltr'><em>20489T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 977 87 1086 112; x_wconf 85' lang='eng' dir='ltr'><strong>(Y17237)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 466 129 1107 155; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 466 139 525 141; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_57' title='bbox 534 130 718 150; x_wconf 82' lang='eng' dir='ltr'><em>Microbacterium</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 727 130 826 150; x_wconf 76' lang='eng' dir='ltr'><em>lacticum</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 836 130 893 150; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 903 129 988 150; x_wconf 83' lang='eng' dir='ltr'><em>20427T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 998 130 1107 155; x_wconf 89' lang='eng' dir='ltr'><strong>(X77441)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 508 172 1125 198; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 508 173 693 193; x_wconf 75' lang='eng' dir='ltr'><em>Microbacterium</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 702 173 845 198; x_wconf 84' lang='eng' dir='ltr'><em>quuefaciens</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 855 173 911 193; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 922 172 1006 193; x_wconf 87' lang='eng' dir='ltr'><em>20638T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 1016 173 1125 198; x_wconf 97' lang='eng' dir='ltr'><strong>(X77444)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 405 215 1017 328">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 405 215 1017 328">
+     <span class='ocr_line' id='line_1_45' title="bbox 445 215 976 241; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 445 216 590 236; x_wconf 81' lang='eng' dir='ltr'><em>Plantibacter</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 597 216 667 236; x_wconf 85' lang='eng' dir='ltr'><em>flavus</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 677 216 733 236; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 745 215 828 236; x_wconf 79' lang='eng' dir='ltr'><em>14012T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 837 216 976 241; x_wconf 86' lang='eng' dir='ltr'><em>(AJ310417)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 405 258 1017 284; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 405 258 562 279; x_wconf 75' lang='eng' dir='ltr'><em>Okibacterium</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 572 258 679 279; x_wconf 80' lang='eng' dir='ltr'><em>friti/Iariae</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 687 259 744 278; x_wconf 93' lang='eng' dir='ltr'><em>VKM</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 754 258 865 279; x_wconf 74' lang='eng' dir='ltr'><em>Ac—ZOSQT</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 874 259 1017 284; x_wconf 85' lang='eng' dir='ltr'><em>(ABO42094)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 497 301 1012 328; baseline 0 -6"><span class='ocrx_word' id='word_1_77' title='bbox 497 302 639 328; x_wconf 86' lang='eng' dir='ltr'><em>Agrococcus</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 644 302 747 328; x_wconf 86' lang='eng' dir='ltr'><em>jenensis</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 757 302 813 322; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 824 301 894 322; x_wconf 70' lang='eng' dir='ltr'><em>9580T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 903 302 1012 328; x_wconf 84' lang='eng' dir='ltr'><strong>(X92492)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 399 344 911 371">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 399 344 911 371">
+     <span class='ocr_line' id='line_1_48' title="bbox 399 344 911 371; baseline 0 -6"><span class='ocrx_word' id='word_1_82' title='bbox 399 345 505 365; x_wconf 70' lang='eng' dir='ltr'><em>Leffson/a</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 514 350 574 371; x_wconf 87' lang='eng' dir='ltr'><em>poae</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 583 345 640 365; x_wconf 92' lang='eng' dir='ltr'><em>VKM</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 650 344 911 371; x_wconf 65' lang='eng' dir='ltr'><em>Ac—1401T(AF116342)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 455 387 953 413">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 455 387 953 413">
+     <span class='ocr_line' id='line_1_49' title="bbox 455 387 953 413; baseline 0 -5"><span class='ocrx_word' id='word_1_86' title='bbox 455 388 561 408; x_wconf 85' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 571 388 672 413; x_wconf 82' lang='eng' dir='ltr'><em>aquatica</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 683 388 739 408; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 750 387 834 408; x_wconf 76' lang='eng' dir='ltr'><em>20146T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 844 388 953 413; x_wconf 89' lang='eng' dir='ltr'><em>(X77450)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 384 569 452 571">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 384 569 452 571">
+     <span class='ocr_line' id='line_1_50' title="bbox 384 569 452 571; baseline 0 1089"><span class='ocrx_word' id='word_1_91' title='bbox 384 569 452 571; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 382 569 384 636">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 382 569 384 636">
+     <span class='ocr_line' id='line_1_51' title="bbox 382 569 384 636; baseline 0 1024"><span class='ocrx_word' id='word_1_92' title='bbox 382 569 384 636; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 532 430 1117 456">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 532 430 1117 456">
+     <span class='ocr_line' id='line_1_52' title="bbox 532 430 1117 456; baseline 0 -5"><span class='ocrx_word' id='word_1_93' title='bbox 532 431 683 451; x_wconf 82' lang='eng' dir='ltr'><em>Leucobacter</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 689 431 822 456; x_wconf 80' lang='eng' dir='ltr'><em>komagatae</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 833 431 875 451; x_wconf 90' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 887 430 969 451; x_wconf 88' lang='eng' dir='ltr'><em>15245T</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 979 431 1117 456; x_wconf 83' lang='eng' dir='ltr'><strong>(AJ746337)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 463 473 914 499">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 463 473 914 499">
+     <span class='ocr_line' id='line_1_53' title="bbox 463 473 914 499; baseline 0 -5"><span class='ocrx_word' id='word_1_98' title='bbox 463 474 590 494; x_wconf 83' lang='eng' dir='ltr'><em>Subtercola</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 600 474 682 494; x_wconf 82' lang='eng' dir='ltr'><em>boreus</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 692 473 763 494; x_wconf 83' lang='eng' dir='ltr'><em>K300T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 773 474 914 499; x_wconf 87' lang='eng' dir='ltr'><em>(AF224722)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 384 613 504 657">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 384 613 504 657">
+     <span class='ocr_line' id='line_1_54' title="bbox 384 613 504 657; baseline 0 0"><span class='ocrx_word' id='word_1_102' title='bbox 384 613 504 657; x_wconf 70' lang='eng'><em>—1_</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 416 645 1081 715">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 416 645 1081 715">
+     <span class='ocr_line' id='line_1_55' title="bbox 416 645 928 671; baseline 0 -5"><span class='ocrx_word' id='word_1_103' title='bbox 416 645 446 661; x_wconf 80' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 476 646 582 666; x_wconf 84' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 592 646 654 666; x_wconf 84' lang='eng' dir='ltr'><em>rubra</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 664 646 722 666; x_wconf 87' lang='eng' dir='ltr'><em>CMS</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 732 646 779 666; x_wconf 88' lang='eng' dir='ltr'><em>76rT</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 789 646 928 671; x_wconf 84' lang='eng' dir='ltr'><strong>(AJ438585)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 471 688 1081 715; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 471 689 696 709; x_wconf 79' lang='eng' dir='ltr'><em>Pseudoc/avibacter</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 702 689 801 709; x_wconf 86' lang='eng' dir='ltr'><em>he/volus</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 811 689 867 709; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_112' title='bbox 877 688 962 709; x_wconf 81' lang='eng' dir='ltr'><em>20419T</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 972 689 1081 715; x_wconf 90' lang='eng' dir='ltr'><em>(X77440)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 119 826 426 828">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 119 826 426 828">
+     <span class='ocr_line' id='line_1_57' title="bbox 119 826 426 828; baseline 0 832"><span class='ocrx_word' id='word_1_114' title='bbox 119 826 426 828; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 134 698 136 957">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 134 698 136 957">
+     <span class='ocr_line' id='line_1_58' title="bbox 134 698 136 957; baseline 0 703"><span class='ocrx_word' id='word_1_115' title='bbox 134 698 136 957; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 105 1511 142 1527">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 105 1511 142 1527">
+     <span class='ocr_line' id='line_1_59' title="bbox 105 1511 142 1527; baseline -0.027 0"><span class='ocrx_word' id='word_1_116' title='bbox 105 1511 142 1527; x_wconf 91' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 159 795 161 872">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 159 795 161 872">
+     <span class='ocr_line' id='line_1_60' title="bbox 159 795 161 872; baseline 0 788"><span class='ocrx_word' id='word_1_117' title='bbox 159 795 161 872; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 163 967 165 1191">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 163 967 165 1191">
+     <span class='ocr_line' id='line_1_61' title="bbox 163 967 165 1191; baseline 0 469"><span class='ocrx_word' id='word_1_118' title='bbox 163 967 165 1191; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 193 1063 222 1065">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 193 1063 222 1065">
+     <span class='ocr_line' id='line_1_62' title="bbox 193 1063 222 1065; baseline 0 595"><span class='ocrx_word' id='word_1_119' title='bbox 193 1063 222 1065; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 220 1042 222 1087">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 220 1042 222 1087">
+     <span class='ocr_line' id='line_1_63' title="bbox 220 1042 222 1087; baseline 0 573"><span class='ocrx_word' id='word_1_120' title='bbox 220 1042 222 1087; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_58' title="bbox 193 1063 195 1130">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 193 1063 195 1130">
+     <span class='ocr_line' id='line_1_64' title="bbox 193 1063 195 1130; baseline 0 530"><span class='ocrx_word' id='word_1_121' title='bbox 193 1063 195 1130; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_59' title="bbox 163 1189 186 1191">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 163 1189 186 1191">
+     <span class='ocr_line' id='line_1_65' title="bbox 163 1189 186 1191; baseline 0 469"><span class='ocrx_word' id='word_1_122' title='bbox 163 1189 186 1191; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_60' title="bbox 184 1096 186 1286">
+    <p class='ocr_par' dir='ltr' id='par_1_60' title="bbox 184 1096 186 1286">
+     <span class='ocr_line' id='line_1_66' title="bbox 184 1096 186 1286; baseline 0 374"><span class='ocrx_word' id='word_1_123' title='bbox 184 1096 186 1286; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_61' title="bbox 184 1284 205 1286">
+    <p class='ocr_par' dir='ltr' id='par_1_61' title="bbox 184 1284 205 1286">
+     <span class='ocr_line' id='line_1_67' title="bbox 184 1284 205 1286; baseline 0 374"><span class='ocrx_word' id='word_1_124' title='bbox 184 1284 205 1286; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_62' title="bbox 203 1225 205 1346">
+    <p class='ocr_par' dir='ltr' id='par_1_62' title="bbox 203 1225 205 1346">
+     <span class='ocr_line' id='line_1_68' title="bbox 203 1225 205 1346; baseline 0 314"><span class='ocrx_word' id='word_1_125' title='bbox 203 1225 205 1346; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_63' title="bbox 216 1301 218 1391">
+    <p class='ocr_par' dir='ltr' id='par_1_63' title="bbox 216 1301 218 1391">
+     <span class='ocr_line' id='line_1_69' title="bbox 216 1301 218 1391; baseline 0 269"><span class='ocrx_word' id='word_1_126' title='bbox 216 1301 218 1391; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_64' title="bbox 312 910 334 927">
+    <p class='ocr_par' dir='ltr' id='par_1_64' title="bbox 312 910 334 927">
+     <span class='ocr_line' id='line_1_70' title="bbox 312 910 334 927; baseline -0.045 0"><span class='ocrx_word' id='word_1_127' title='bbox 312 910 334 927; x_wconf 81' lang='eng'><strong>97</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_65' title="bbox 314 935 342 937">
+    <p class='ocr_par' dir='ltr' id='par_1_65' title="bbox 314 935 342 937">
+     <span class='ocr_line' id='line_1_71' title="bbox 314 935 342 937; baseline 0 723"><span class='ocrx_word' id='word_1_128' title='bbox 314 935 342 937; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_66' title="bbox 340 913 342 958">
+    <p class='ocr_par' dir='ltr' id='par_1_66' title="bbox 340 913 342 958">
+     <span class='ocr_line' id='line_1_72' title="bbox 340 913 342 958; baseline 0 702"><span class='ocrx_word' id='word_1_129' title='bbox 340 913 342 958; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_67' title="bbox 275 943 309 959">
+    <p class='ocr_par' dir='ltr' id='par_1_67' title="bbox 275 943 309 959">
+     <span class='ocr_line' id='line_1_73' title="bbox 275 943 309 959; baseline 0.029 -1"><span class='ocrx_word' id='word_1_130' title='bbox 275 943 309 959; x_wconf 82' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_68' title="bbox 314 935 316 1000">
+    <p class='ocr_par' dir='ltr' id='par_1_68' title="bbox 314 935 316 1000">
+     <span class='ocr_line' id='line_1_74' title="bbox 314 935 316 1000; baseline 0 660"><span class='ocrx_word' id='word_1_131' title='bbox 314 935 316 1000; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_69' title="bbox 305 1201 337 1217">
+    <p class='ocr_par' dir='ltr' id='par_1_69' title="bbox 305 1201 337 1217">
+     <span class='ocr_line' id='line_1_75' title="bbox 305 1201 337 1217; baseline 0.031 -1"><span class='ocrx_word' id='word_1_132' title='bbox 305 1201 337 1217; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_70' title="bbox 343 1192 345 1259">
+    <p class='ocr_par' dir='ltr' id='par_1_70' title="bbox 343 1192 345 1259">
+     <span class='ocr_line' id='line_1_76' title="bbox 343 1192 345 1259; baseline 0 401"><span class='ocrx_word' id='word_1_133' title='bbox 343 1192 345 1259; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_71' title="bbox 216 1389 263 1391">
+    <p class='ocr_par' dir='ltr' id='par_1_71' title="bbox 216 1389 263 1391">
+     <span class='ocr_line' id='line_1_77' title="bbox 216 1389 263 1391; baseline 0 269"><span class='ocrx_word' id='word_1_134' title='bbox 216 1389 263 1391; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_72' title="bbox 261 1343 263 1437">
+    <p class='ocr_par' dir='ltr' id='par_1_72' title="bbox 261 1343 263 1437">
+     <span class='ocr_line' id='line_1_78' title="bbox 261 1343 263 1437; baseline 0 223"><span class='ocrx_word' id='word_1_135' title='bbox 261 1343 263 1437; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_73' title="bbox 283 516 1116 629">
+    <p class='ocr_par' dir='ltr' id='par_1_73' title="bbox 283 516 1116 629">
+     <span class='ocr_line' id='line_1_79' title="bbox 283 516 936 542; baseline 0 -5"><span class='ocrx_word' id='word_1_136' title='bbox 283 526 388 528; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_137' title='bbox 395 517 473 542; x_wconf 86' lang='eng' dir='ltr'><em>Agreia</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 483 517 599 537; x_wconf 82' lang='eng' dir='ltr'><em>bico/orata</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 608 517 665 537; x_wconf 93' lang='eng' dir='ltr'><em>VKM</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 674 516 785 537; x_wconf 72' lang='eng' dir='ltr'><em>Ac—1804T</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 795 517 936 542; x_wconf 84' lang='eng' dir='ltr'><em>(AF159363)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_80' title="bbox 461 559 1116 585; baseline 0 -5"><span class='ocrx_word' id='word_1_142' title='bbox 461 560 646 580; x_wconf 71' lang='eng' dir='ltr'><em>Salinibacterium</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 655 560 816 585; x_wconf 82' lang='eng' dir='ltr'><em>amurskyense</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 826 560 885 580; x_wconf 92' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 897 559 965 580; x_wconf 71' lang='eng' dir='ltr'><em>3673T</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 975 560 1116 585; x_wconf 83' lang='eng' dir='ltr'><em>(AF539697)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_81' title="bbox 513 602 977 629; baseline 0 -6"><span class='ocrx_word' id='word_1_147' title='bbox 513 603 672 629; x_wconf 82' lang='eng' dir='ltr'><em>Rhodoglobus</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 682 603 764 623; x_wconf 81' lang='eng' dir='ltr'><em>vesta/ii</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 773 602 829 623; x_wconf 75' lang='eng' dir='ltr'><em>LV3T</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 838 603 977 629; x_wconf 81' lang='eng' dir='ltr'><em>(AJ459101)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_74' title="bbox 305 731 867 800">
+    <p class='ocr_par' dir='ltr' id='par_1_74' title="bbox 305 731 867 800">
+     <span class='ocr_line' id='line_1_82' title="bbox 305 731 830 758; baseline 0 -6"><span class='ocrx_word' id='word_1_151' title='bbox 305 741 326 743; x_wconf 97' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_152' title='bbox 334 732 503 758; x_wconf 76' lang='eng' dir='ltr'><em>Rathayibacter</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 510 732 566 752; x_wconf 78' lang='eng' dir='ltr'><em>tritici</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 574 732 631 752; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 642 731 711 752; x_wconf 83' lang='eng' dir='ltr'><em>7486T</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 721 732 830 758; x_wconf 84' lang='eng' dir='ltr'><strong>(X77438)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_83' title="bbox 305 774 867 800; baseline 0 -5"><span class='ocrx_word' id='word_1_157' title='bbox 305 784 338 786; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_158' title='bbox 346 775 516 800; x_wconf 80' lang='eng' dir='ltr'><em>Rathayibacter</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 522 775 604 800; x_wconf 83' lang='eng' dir='ltr'><em>rathayi</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 613 775 669 795; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 680 774 749 795; x_wconf 83' lang='eng' dir='ltr'><em>7485T</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 758 775 867 800; x_wconf 80' lang='eng' dir='ltr'><strong>(X77439)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_75' title="bbox 374 817 956 886">
+    <p class='ocr_par' dir='ltr' id='par_1_75' title="bbox 374 817 956 886">
+     <span class='ocr_line' id='line_1_84' title="bbox 435 817 956 843; baseline 0 -5"><span class='ocrx_word' id='word_1_163' title='bbox 435 818 604 843; x_wconf 81' lang='eng' dir='ltr'><em>Rathayibacter</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 611 818 694 838; x_wconf 79' lang='eng' dir='ltr'><em>toxicus</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 703 818 756 838; x_wconf 83' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 767 817 836 838; x_wconf 79' lang='eng' dir='ltr'><em>9669T</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 845 818 956 843; x_wconf 91' lang='eng' dir='ltr'><strong>(D84127)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_85' title="bbox 374 860 935 886; baseline 0 -5"><span class='ocrx_word' id='word_1_168' title='bbox 374 861 557 881; x_wconf 74' lang='eng' dir='ltr'><em>Curtobacterium</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 567 861 655 881; x_wconf 76' lang='eng' dir='ltr'><em>citreum</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 665 861 722 881; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 732 860 816 881; x_wconf 80' lang='eng' dir='ltr'><em>20528T</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 826 861 935 886; x_wconf 87' lang='eng' dir='ltr'><strong>(X77436)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_76' title="bbox 316 904 946 1016">
+    <p class='ocr_par' dir='ltr' id='par_1_76' title="bbox 316 904 946 1016">
+     <span class='ocr_line' id='line_1_86' title="bbox 342 904 946 930; baseline -0.002 -5"><span class='ocrx_word' id='word_1_173' title='bbox 342 913 359 915; x_wconf 93' lang='eng'>-</span> <span class='ocrx_word' id='word_1_174' title='bbox 368 905 503 930; x_wconf 80' lang='eng' dir='ltr'><em>Mycetoco/a</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 514 905 694 925; x_wconf 78' lang='eng' dir='ltr'><em>tolaasinivorans</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 703 904 793 925; x_wconf 79' lang='eng' dir='ltr'><em>CM—05T</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 803 905 946 930; x_wconf 85' lang='eng' dir='ltr'><em>(ABO12646)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_87' title="bbox 342 946 846 973; baseline 0 -6"><span class='ocrx_word' id='word_1_178' title='bbox 342 956 355 958; x_wconf 96' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_179' title='bbox 364 947 499 973; x_wconf 81' lang='eng' dir='ltr'><em>Mycetoco/a</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 509 947 595 967; x_wconf 83' lang='eng' dir='ltr'><em>lacteus</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 604 946 693 967; x_wconf 83' lang='eng' dir='ltr'><em>CM-10T</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 703 947 846 973; x_wconf 87' lang='eng' dir='ltr'><em>(AB012648)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_88' title="bbox 316 989 885 1016; baseline 0 -6"><span class='ocrx_word' id='word_1_183' title='bbox 316 999 342 1001; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_184' title='bbox 351 990 486 1016; x_wconf 84' lang='eng' dir='ltr'><em>Mycetocola</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 496 990 635 1016; x_wconf 86' lang='eng' dir='ltr'><em>saprophi/us</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 644 989 734 1010; x_wconf 77' lang='eng' dir='ltr'><em>CM-01T</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 743 990 885 1016; x_wconf 85' lang='eng' dir='ltr'><em>(ABO12647)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_77' title="bbox 348 1033 995 1145">
+    <p class='ocr_par' dir='ltr' id='par_1_77' title="bbox 348 1033 995 1145">
+     <span class='ocr_line' id='line_1_89' title="bbox 416 1033 995 1058; baseline 0 -5"><span class='ocrx_word' id='word_1_188' title='bbox 416 1033 552 1053; x_wconf 77' lang='eng' dir='ltr'><em>Clavibacter</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 558 1033 730 1058; x_wconf 85' lang='eng' dir='ltr'><em>michiganensis</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 740 1033 755 1053; x_wconf 91' lang='eng' dir='ltr'>P</span> <span class='ocrx_word' id='word_1_191' title='bbox 764 1033 842 1053; x_wconf 90' lang='eng'>250/01</span> <span class='ocrx_word' id='word_1_192' title='bbox 856 1033 995 1058; x_wconf 86' lang='eng' dir='ltr'><em>(AJ310416)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_90' title="bbox 402 1075 913 1101; baseline 0 -5"><span class='ocrx_word' id='word_1_193' title='bbox 402 1076 529 1096; x_wconf 83' lang='eng' dir='ltr'><em>Subterco/a</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 539 1076 682 1101; x_wconf 82' lang='eng' dir='ltr'><em>frigoramans</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 692 1075 763 1096; x_wconf 89' lang='eng' dir='ltr'><em>K265T</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 772 1076 913 1101; x_wconf 87' lang='eng' dir='ltr'><em>(AF224723)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_91' title="bbox 348 1118 793 1145; baseline 0 -6"><span class='ocrx_word' id='word_1_197' title='bbox 348 1119 544 1144; x_wconf 80' lang='eng' dir='ltr'><em>Frigoribacterium</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 553 1119 612 1139; x_wconf 81' lang='eng' dir='ltr'><em>faeni</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 620 1119 659 1139; x_wconf 88' lang='eng'><em>801</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 665 1118 674 1130; x_wconf 65' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_201' title='bbox 684 1119 793 1145; x_wconf 88' lang='eng' dir='ltr'><strong>(Y18807)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_78' title="bbox 388 1168 418 1184">
+    <p class='ocr_par' dir='ltr' id='par_1_78' title="bbox 388 1168 418 1184">
+     <span class='ocr_line' id='line_1_92' title="bbox 388 1168 418 1184; baseline 0 0"><span class='ocrx_word' id='word_1_202' title='bbox 388 1168 418 1184; x_wconf 86' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_79' title="bbox 345 1192 425 1194">
+    <p class='ocr_par' dir='ltr' id='par_1_79' title="bbox 345 1192 425 1194">
+     <span class='ocr_line' id='line_1_93' title="bbox 345 1192 425 1194; baseline 0 466"><span class='ocrx_word' id='word_1_203' title='bbox 345 1192 425 1194; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_80' title="bbox 345 1257 428 1259">
+    <p class='ocr_par' dir='ltr' id='par_1_80' title="bbox 345 1257 428 1259">
+     <span class='ocr_line' id='line_1_94' title="bbox 345 1257 428 1259; baseline 0 401"><span class='ocrx_word' id='word_1_204' title='bbox 345 1257 428 1259; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_81' title="bbox 426 1171 428 1216">
+    <p class='ocr_par' dir='ltr' id='par_1_81' title="bbox 426 1171 428 1216">
+     <span class='ocr_line' id='line_1_95' title="bbox 426 1171 428 1216; baseline 0 444"><span class='ocrx_word' id='word_1_205' title='bbox 426 1171 428 1216; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_82' title="bbox 428 1161 1012 1274">
+    <p class='ocr_par' dir='ltr' id='par_1_82' title="bbox 428 1161 1012 1274">
+     <span class='ocr_line' id='line_1_96' title="bbox 428 1161 916 1187; baseline 0 -5"><span class='ocrx_word' id='word_1_206' title='bbox 428 1171 466 1173; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_207' title='bbox 475 1162 596 1182; x_wconf 72' lang='eng' dir='ltr'><em>Mlcroce/la</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 604 1162 698 1187; x_wconf 77' lang='eng' dir='ltr'><em>putealis</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 707 1161 768 1182; x_wconf 73' lang='eng' dir='ltr'><em>CV2T</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 778 1162 916 1187; x_wconf 81' lang='eng' dir='ltr'><strong>(AJ717388)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_97' title="bbox 428 1205 949 1231; baseline 0 -6"><span class='ocrx_word' id='word_1_211' title='bbox 428 1214 464 1216; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_212' title='bbox 474 1205 594 1225; x_wconf 84' lang='eng' dir='ltr'><em>Microcella</em></span> <span class='ocrx_word' id='word_1_213' title='bbox 604 1206 721 1231; x_wconf 81' lang='eng' dir='ltr'><em>alkaliphila</em></span> <span class='ocrx_word' id='word_1_214' title='bbox 730 1205 801 1225; x_wconf 89' lang='eng' dir='ltr'><em>AC4rT</em></span> <span class='ocrx_word' id='word_1_215' title='bbox 811 1205 949 1231; x_wconf 85' lang='eng' dir='ltr'><strong>(AJ717385)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_98' title="bbox 439 1248 1012 1274; baseline 0 -6"><span class='ocrx_word' id='word_1_216' title='bbox 439 1248 603 1274; x_wconf 85' lang='eng' dir='ltr'><em>Yonghaparkia</em></span> <span class='ocrx_word' id='word_1_217' title='bbox 613 1248 730 1274; x_wconf 82' lang='eng' dir='ltr'><em>alkaliphi/a</em></span> <span class='ocrx_word' id='word_1_218' title='bbox 741 1248 855 1268; x_wconf 83' lang='eng' dir='ltr'><em>KSL-113T</em></span> <span class='ocrx_word' id='word_1_219' title='bbox 864 1248 1012 1274; x_wconf 81' lang='eng' dir='ltr'><em>(D0256087)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_83' title="bbox 387 1291 1127 1360">
+    <p class='ocr_par' dir='ltr' id='par_1_83' title="bbox 387 1291 1127 1360">
+     <span class='ocr_line' id='line_1_99' title="bbox 387 1291 942 1317; baseline 0 -5"><span class='ocrx_word' id='word_1_220' title='bbox 387 1292 502 1312; x_wconf 84' lang='eng' dir='ltr'><em>Labede/Ia</em></span> <span class='ocrx_word' id='word_1_221' title='bbox 512 1292 651 1317; x_wconf 82' lang='eng' dir='ltr'><em>gwakjiensis</em></span> <span class='ocrx_word' id='word_1_222' title='bbox 661 1291 785 1312; x_wconf 88' lang='eng' dir='ltr'><em>KSW2-17T</em></span> <span class='ocrx_word' id='word_1_223' title='bbox 794 1291 942 1317; x_wconf 81' lang='eng' dir='ltr'><em>(D0533552)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_100' title="bbox 475 1333 1127 1360; baseline 0 -6"><span class='ocrx_word' id='word_1_224' title='bbox 475 1334 649 1360; x_wconf 84' lang='eng' dir='ltr'><em>Cryobacterium</em></span> <span class='ocrx_word' id='word_1_225' title='bbox 657 1334 832 1360; x_wconf 80' lang='eng' dir='ltr'><em>psyohrophi/um</em></span> <span class='ocrx_word' id='word_1_226' title='bbox 843 1334 900 1354; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_227' title='bbox 909 1333 979 1354; x_wconf 80' lang='eng' dir='ltr'><em>4854T</em></span> <span class='ocrx_word' id='word_1_228' title='bbox 989 1334 1127 1360; x_wconf 85' lang='eng' dir='ltr'><em>(AJ544063)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_84' title="bbox 261 1435 428 1437">
+    <p class='ocr_par' dir='ltr' id='par_1_84' title="bbox 261 1435 428 1437">
+     <span class='ocr_line' id='line_1_101' title="bbox 261 1435 428 1437; baseline 0 223"><span class='ocrx_word' id='word_1_229' title='bbox 261 1435 428 1437; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_85' title="bbox 388 1446 421 1462">
+    <p class='ocr_par' dir='ltr' id='par_1_85' title="bbox 388 1446 421 1462">
+     <span class='ocr_line' id='line_1_102' title="bbox 388 1446 421 1462; baseline 0 0"><span class='ocrx_word' id='word_1_230' title='bbox 388 1446 421 1462; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_86' title="bbox 426 1386 428 1487">
+    <p class='ocr_par' dir='ltr' id='par_1_86' title="bbox 426 1386 428 1487">
+     <span class='ocr_line' id='line_1_103' title="bbox 426 1386 428 1487; baseline 0 173"><span class='ocrx_word' id='word_1_231' title='bbox 426 1386 428 1487; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_87' title="bbox 489 1469 511 1485">
+    <p class='ocr_par' dir='ltr' id='par_1_87' title="bbox 489 1469 511 1485">
+     <span class='ocr_line' id='line_1_104' title="bbox 489 1469 511 1485; baseline 0 0"><span class='ocrx_word' id='word_1_232' title='bbox 489 1469 511 1485; x_wconf 82' lang='eng'><em>69</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_88' title="bbox 426 1485 464 1487">
+    <p class='ocr_par' dir='ltr' id='par_1_88' title="bbox 426 1485 464 1487">
+     <span class='ocr_line' id='line_1_105' title="bbox 426 1485 464 1487; baseline 0 173"><span class='ocrx_word' id='word_1_233' title='bbox 426 1485 464 1487; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_89' title="bbox 434 1496 456 1513">
+    <p class='ocr_par' dir='ltr' id='par_1_89' title="bbox 434 1496 456 1513">
+     <span class='ocr_line' id='line_1_106' title="bbox 434 1496 456 1513; baseline 0 0"><span class='ocrx_word' id='word_1_234' title='bbox 434 1496 456 1513; x_wconf 78' lang='eng'><strong>89</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_90' title="bbox 520 1472 614 1474">
+    <p class='ocr_par' dir='ltr' id='par_1_90' title="bbox 520 1472 614 1474">
+     <span class='ocr_line' id='line_1_107' title="bbox 520 1472 614 1474; baseline 0 186"><span class='ocrx_word' id='word_1_235' title='bbox 520 1472 614 1474; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_91' title="bbox 501 1493 520 1495">
+    <p class='ocr_par' dir='ltr' id='par_1_91' title="bbox 501 1493 520 1495">
+     <span class='ocr_line' id='line_1_108' title="bbox 501 1493 520 1495; baseline 0 165"><span class='ocrx_word' id='word_1_236' title='bbox 501 1493 520 1495; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_92' title="bbox 462 1429 464 1544">
+    <p class='ocr_par' dir='ltr' id='par_1_92' title="bbox 462 1429 464 1544">
+     <span class='ocr_line' id='line_1_109' title="bbox 462 1429 464 1544; baseline 0 116"><span class='ocrx_word' id='word_1_237' title='bbox 462 1429 464 1544; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_93' title="bbox 501 1493 503 1592">
+    <p class='ocr_par' dir='ltr' id='par_1_93' title="bbox 501 1493 503 1592">
+     <span class='ocr_line' id='line_1_110' title="bbox 501 1493 503 1592; baseline 0 68"><span class='ocrx_word' id='word_1_238' title='bbox 501 1493 503 1592; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_94' title="bbox 518 1472 520 1517">
+    <p class='ocr_par' dir='ltr' id='par_1_94' title="bbox 518 1472 520 1517">
+     <span class='ocr_line' id='line_1_111' title="bbox 518 1472 520 1517; baseline 0 143"><span class='ocrx_word' id='word_1_239' title='bbox 518 1472 520 1517; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_95' title="bbox 428 1376 1307 1401">
+    <p class='ocr_par' dir='ltr' id='par_1_95' title="bbox 428 1376 1307 1401">
+     <span class='ocr_line' id='line_1_112' title="bbox 428 1376 1307 1401; baseline 0 -5"><span class='ocrx_word' id='word_1_240' title='bbox 428 1386 534 1388; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_241' title='bbox 542 1376 696 1396; x_wconf 86' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_242' title='bbox 706 1376 858 1396; x_wconf 86' lang='eng' dir='ltr'><em>Planktoluna</em></span> <span class='ocrx_word' id='word_1_243' title='bbox 867 1376 976 1396; x_wconf 88' lang='eng' dir='ltr'><em>difficilis’</em></span> <span class='ocrx_word' id='word_1_244' title='bbox 987 1376 1147 1396; x_wconf 88' lang='eng' dir='ltr'><em>MWH-7Well8</em></span> <span class='ocrx_word' id='word_1_245' title='bbox 1158 1376 1307 1401; x_wconf 84' lang='eng' dir='ltr'><em>(AM939566)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_96' title="bbox 622 1419 1479 1574">
+    <p class='ocr_par' dir='ltr' id='par_1_96' title="bbox 622 1419 1479 1574">
+     <span class='ocr_line' id='line_1_113' title="bbox 654 1419 1314 1444; baseline 0 -5"><span class='ocrx_word' id='word_1_246' title='bbox 654 1419 808 1439; x_wconf 83' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_247' title='bbox 816 1419 931 1444; x_wconf 89' lang='eng' dir='ltr'><em>Aquiluna</em></span> <span class='ocrx_word' id='word_1_248' title='bbox 942 1419 1016 1439; x_wconf 90' lang='eng' dir='ltr'><em>rubra’</em></span> <span class='ocrx_word' id='word_1_249' title='bbox 1027 1419 1162 1439; x_wconf 88' lang='eng' dir='ltr'><em>MWH-Dar4</em></span> <span class='ocrx_word' id='word_1_250' title='bbox 1172 1419 1314 1444; x_wconf 86' lang='eng' dir='ltr'><em>(AJ565416)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_114' title="bbox 622 1461 1370 1487; baseline -0.001 -5"><span class='ocrx_word' id='word_1_251' title='bbox 622 1461 776 1482; x_wconf 83' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_252' title='bbox 786 1462 921 1482; x_wconf 91' lang='eng' dir='ltr'><em>Limnoluna</em></span> <span class='ocrx_word' id='word_1_253' title='bbox 932 1462 1005 1482; x_wconf 89' lang='eng' dir='ltr'><em>rubra’</em></span> <span class='ocrx_word' id='word_1_254' title='bbox 1017 1462 1211 1487; x_wconf 84' lang='eng' dir='ltr'><em>MWH-EgelM2-3</em></span> <span class='ocrx_word' id='word_1_255' title='bbox 1221 1462 1370 1487; x_wconf 84' lang='eng' dir='ltr'><em>(AM943659)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_115' title="bbox 741 1505 1479 1530; baseline 0 -5"><span class='ocrx_word' id='word_1_256' title='bbox 741 1505 895 1525; x_wconf 80' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_257' title='bbox 906 1505 1020 1525; x_wconf 90' lang='eng' dir='ltr'><em>Flaviluna</em></span> <span class='ocrx_word' id='word_1_258' title='bbox 1031 1505 1105 1525; x_wconf 87' lang='eng' dir='ltr'><em>lacus’</em></span> <span class='ocrx_word' id='word_1_259' title='bbox 1116 1505 1319 1525; x_wconf 87' lang='eng' dir='ltr'><em>MWH-Creno3D3</em></span> <span class='ocrx_word' id='word_1_260' title='bbox 1330 1505 1479 1530; x_wconf 82' lang='eng' dir='ltr'><em>(AM939567)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_116' title="bbox 674 1548 1384 1574; baseline 0 -6"><span class='ocrx_word' id='word_1_261' title='bbox 674 1548 828 1568; x_wconf 81' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_262' title='bbox 838 1548 977 1568; x_wconf 85' lang='eng' dir='ltr'><em>Rhodoluna</em></span> <span class='ocrx_word' id='word_1_263' title='bbox 988 1548 1092 1568; x_wconf 75' lang='eng' dir='ltr'><em>lacicola‘</em></span> <span class='ocrx_word' id='word_1_264' title='bbox 1104 1548 1225 1568; x_wconf 91' lang='eng' dir='ltr'><em>MWH-Ta8</em></span> <span class='ocrx_word' id='word_1_265' title='bbox 1235 1548 1384 1574; x_wconf 87' lang='eng' dir='ltr'><strong>(AM182889)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_97' title="bbox 501 1590 551 1592">
+    <p class='ocr_par' dir='ltr' id='par_1_97' title="bbox 501 1590 551 1592">
+     <span class='ocr_line' id='line_1_117' title="bbox 501 1590 551 1592; baseline 0 68"><span class='ocrx_word' id='word_1_266' title='bbox 501 1590 551 1592; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_98' title="bbox 521 1601 543 1617">
+    <p class='ocr_par' dir='ltr' id='par_1_98' title="bbox 521 1601 543 1617">
+     <span class='ocr_line' id='line_1_118' title="bbox 521 1601 543 1617; baseline 0 0"><span class='ocrx_word' id='word_1_267' title='bbox 521 1601 543 1617; x_wconf 87' lang='eng'><em>87</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_99' title="bbox 549 1558 551 1624">
+    <p class='ocr_par' dir='ltr' id='par_1_99' title="bbox 549 1558 551 1624">
+     <span class='ocr_line' id='line_1_119' title="bbox 549 1558 551 1624; baseline 0 36"><span class='ocrx_word' id='word_1_268' title='bbox 549 1558 551 1624; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_100' title="bbox 562 1591 1449 1660">
+    <p class='ocr_par' dir='ltr' id='par_1_100' title="bbox 562 1591 1449 1660">
+     <span class='ocr_line' id='line_1_120' title="bbox 562 1591 1449 1616; baseline 0 -5"><span class='ocrx_word' id='word_1_269' title='bbox 562 1601 630 1603; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_270' title='bbox 646 1591 800 1611; x_wconf 82' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_271' title='bbox 810 1591 949 1611; x_wconf 87' lang='eng' dir='ltr'><em>Rhodoluna</em></span> <span class='ocrx_word' id='word_1_272' title='bbox 960 1591 1101 1616; x_wconf 88' lang='eng' dir='ltr'><em>limnophila’</em></span> <span class='ocrx_word' id='word_1_273' title='bbox 1112 1591 1294 1611; x_wconf 88' lang='eng' dir='ltr'><em>MWH-VicMua1</em></span> <span class='ocrx_word' id='word_1_274' title='bbox 1307 1591 1449 1616; x_wconf 89' lang='eng' dir='ltr'><em>(AJ565417)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_121' title="bbox 670 1634 1438 1660; baseline 0 -6"><span class='ocrx_word' id='word_1_275' title='bbox 670 1634 824 1654; x_wconf 85' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_276' title='bbox 834 1634 973 1654; x_wconf 89' lang='eng' dir='ltr'><em>Rhodoluna</em></span> <span class='ocrx_word' id='word_1_277' title='bbox 984 1634 1140 1660; x_wconf 88' lang='eng' dir='ltr'><em>planktonica’</em></span> <span class='ocrx_word' id='word_1_278' title='bbox 1151 1634 1283 1654; x_wconf 90' lang='eng' dir='ltr'><em>MWH-Dar1</em></span> <span class='ocrx_word' id='word_1_279' title='bbox 1296 1634 1438 1660; x_wconf 88' lang='eng' dir='ltr'><em>(AJ565415)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_101' title="bbox 560 1601 562 1646">
+    <p class='ocr_par' dir='ltr' id='par_1_101' title="bbox 560 1601 562 1646">
+     <span class='ocr_line' id='line_1_122' title="bbox 560 1601 562 1646; baseline 0 14"><span class='ocrx_word' id='word_1_280' title='bbox 560 1601 562 1646; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_102' title="bbox 562 1644 662 1646">
+    <p class='ocr_par' dir='ltr' id='par_1_102' title="bbox 562 1644 662 1646">
+     <span class='ocr_line' id='line_1_123' title="bbox 562 1644 662 1646; baseline 0 14"><span class='ocrx_word' id='word_1_281' title='bbox 562 1644 662 1646; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001768-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001768-0-001.pbm.png
new file mode 100644
index 00000000..34e45e05
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001768-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001768-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001768-0-001.pbm.png.hocr
new file mode 100644
index 00000000..99994029
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001768-0-001.pbm.png.hocr
@@ -0,0 +1,298 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001768-0-001.pbm.png"; bbox 0 0 1657 1045; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 38 3 85 23">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 38 3 85 23">
+     <span class='ocr_line' id='line_1_1' title="bbox 38 3 85 23; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 38 3 85 23; x_wconf 89' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 60 622 85 640">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 60 622 85 640">
+     <span class='ocr_line' id='line_1_2' title="bbox 60 622 85 640; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 60 622 85 640; x_wconf 78' lang='eng'>88</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 296 366 321 383">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 296 366 321 383">
+     <span class='ocr_line' id='line_1_3' title="bbox 296 366 321 383; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 296 366 321 383; x_wconf 81' lang='eng'><em>99</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 614 7 1274 386">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 660 7 1253 81">
+     <span class='ocr_line' id='line_1_4' title="bbox 673 7 1253 37; baseline -0.002 -5"><span class='ocrx_word' id='word_1_4' title='bbox 673 9 747 32; x_wconf 88' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 755 9 925 37; x_wconf 85' lang='eng' dir='ltr'><em>proteolyticus</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 933 9 1015 32; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1028 7 1121 32; x_wconf 88' lang='eng' dir='ltr'><em>15338T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 1131 9 1253 37; x_wconf 88' lang='eng' dir='ltr'><em>(X74723)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 660 51 1149 81; baseline 0 -6"><span class='ocrx_word' id='word_1_9' title='bbox 660 53 733 75; x_wconf 88' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 743 53 824 75; x_wconf 76' lang='eng' dir='ltr'><em>nere/s</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 833 53 914 75; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 925 51 1020 75; x_wconf 77' lang='eng' dir='ltr'><em>25917T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1028 53 1149 81; x_wconf 82' lang='eng' dir='ltr'>(X74716)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 668 94 1134 125">
+     <span class='ocr_line' id='line_1_6' title="bbox 668 94 1134 125; baseline 0.002 -7"><span class='ocrx_word' id='word_1_14' title='bbox 668 96 742 119; x_wconf 89' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 752 96 886 119; x_wconf 86' lang='eng' dir='ltr'><em>diabolicus</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 900 94 1003 119; x_wconf 91' lang='eng' dir='ltr'><em>HE8OOT</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1014 96 1134 125; x_wconf 85' lang='eng' dir='ltr'>(X99762)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 614 138 1211 209">
+     <span class='ocr_line' id='line_1_7' title="bbox 639 138 1211 168; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 639 140 712 162; x_wconf 83' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 721 140 870 162; x_wconf 86' lang='eng' dir='ltr'><em>brasiliensis</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 881 140 943 162; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 954 138 1049 162; x_wconf 89' lang='eng' dir='ltr'><em>20546T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 1057 140 1211 168; x_wconf 84' lang='eng' dir='ltr'>(AJ316172)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 614 181 1143 209; baseline -0.006 -4"><span class='ocrx_word' id='word_1_23' title='bbox 614 184 688 206; x_wconf 86' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 698 184 810 206; x_wconf 79' lang='eng' dir='ltr'><em>tubiashii</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 823 183 905 206; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 917 181 1011 206; x_wconf 82' lang='eng' dir='ltr'>19109T</span> <span class='ocrx_word' id='word_1_27' title='bbox 1022 181 1143 209; x_wconf 92' lang='eng' dir='ltr'>(X74725)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 649 224 1274 343">
+     <span class='ocr_line' id='line_1_9' title="bbox 680 224 1274 255; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 680 227 753 249; x_wconf 89' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 763 227 932 255; x_wconf 80' lang='eng' dir='ltr'><em>coral/iilyticus</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 943 227 1005 249; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1015 224 1111 249; x_wconf 81' lang='eng' dir='ltr'><em>20984T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1122 227 1274 255; x_wconf 90' lang='eng' dir='ltr'>(AJ440005)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 664 268 1217 298; baseline 0.002 -6"><span class='ocrx_word' id='word_1_33' title='bbox 664 270 738 293; x_wconf 83' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 747 270 877 298; x_wconf 81' lang='eng' dir='ltr'><em>neptun/us</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 888 270 950 293; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 961 268 1056 293; x_wconf 88' lang='eng' dir='ltr'><em>20536T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1064 270 1217 298; x_wconf 82' lang='eng' dir='ltr'><em>(AJ316171)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 649 312 1178 343; baseline 0 -7"><span class='ocrx_word' id='word_1_38' title='bbox 649 315 723 337; x_wconf 84' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 733 315 853 337; x_wconf 78' lang='eng' dir='ltr'><em>oriental/&#39;3</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 861 314 943 337; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 954 312 1049 337; x_wconf 78' lang='eng' dir='ltr'><em>33934T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1057 315 1178 343; x_wconf 86' lang='eng' dir='ltr'>(X74719)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 703 355 1193 386">
+     <span class='ocr_line' id='line_1_12' title="bbox 703 355 1193 386; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 703 358 777 380; x_wconf 80' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 787 358 901 380; x_wconf 84' lang='eng' dir='ltr'><em>cholerae</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 911 358 993 380; x_wconf 92' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1003 355 1064 380; x_wconf 86' lang='eng' dir='ltr'><em>514T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1072 358 1193 386; x_wconf 84' lang='eng' dir='ltr'>(X76337)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 399 14 679 321">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 399 14 679 321">
+     <span class='ocr_line' id='line_1_13' title="bbox 586 14 669 96; baseline 0 -44"><span class='ocrx_word' id='word_1_48' title='bbox 586 14 669 96; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 560 96 664 140; baseline 0 0"><span class='ocrx_word' id='word_1_49' title='bbox 560 96 664 140; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 560 140 638 167; baseline 0 878"><span class='ocrx_word' id='word_1_50' title='bbox 560 140 638 167; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 560 167 614 183; baseline 0 862"><span class='ocrx_word' id='word_1_51' title='bbox 560 167 614 183; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 399 183 614 223; baseline 0 822"><span class='ocrx_word' id='word_1_52' title='bbox 399 183 614 223; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 399 223 679 253; baseline 0 792"><span class='ocrx_word' id='word_1_53' title='bbox 399 223 679 253; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 399 253 664 297; baseline 0 748"><span class='ocrx_word' id='word_1_54' title='bbox 399 253 664 297; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 555 297 645 321; baseline 0 0"><span class='ocrx_word' id='word_1_55' title='bbox 555 297 645 321; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 559 85 584 103">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 559 85 584 103">
+     <span class='ocr_line' id='line_1_21' title="bbox 559 85 584 103; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 559 85 584 103; x_wconf 83' lang='eng'>56</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 370 278 395 295">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 370 278 395 295">
+     <span class='ocr_line' id='line_1_22' title="bbox 370 278 395 295; baseline 0 0"><span class='ocrx_word' id='word_1_57' title='bbox 370 278 395 295; x_wconf 86' lang='eng'><em>85</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 330 307 403 309">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 330 307 403 309">
+     <span class='ocr_line' id='line_1_23' title="bbox 330 307 403 309; baseline 0 736"><span class='ocrx_word' id='word_1_58' title='bbox 330 307 403 309; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 401 252 403 364">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 401 252 403 364">
+     <span class='ocr_line' id='line_1_24' title="bbox 401 252 403 364; baseline 0 681"><span class='ocrx_word' id='word_1_59' title='bbox 401 252 403 364; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 137 397 332 399">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 137 397 332 399">
+     <span class='ocr_line' id='line_1_25' title="bbox 137 397 332 399; baseline 0 646"><span class='ocrx_word' id='word_1_60' title='bbox 137 397 332 399; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 137 397 139 713">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 137 397 139 713">
+     <span class='ocr_line' id='line_1_26' title="bbox 137 397 139 713; baseline 0 332"><span class='ocrx_word' id='word_1_61' title='bbox 137 397 139 713; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 636 401 1153 429">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 636 401 1153 429">
+     <span class='ocr_line' id='line_1_27' title="bbox 636 401 1153 429; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 636 401 709 423; x_wconf 83' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 719 401 819 423; x_wconf 84' lang='eng' dir='ltr'><em>hollisae</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 831 401 892 423; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 903 401 985 423; x_wconf 84' lang='eng'>21416</span> <span class='ocrx_word' id='word_1_66' title='bbox 1001 401 1153 429; x_wconf 82' lang='eng' dir='ltr'><em>(AJ514910)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 637 442 1188 511">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 637 442 1188 511">
+     <span class='ocr_line' id='line_1_28' title="bbox 637 442 1188 473; baseline 0 -7"><span class='ocrx_word' id='word_1_67' title='bbox 637 445 760 467; x_wconf 79' lang='eng' dir='ltr'><em>terovibrio</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 770 445 849 467; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 858 444 920 467; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 931 442 1027 467; x_wconf 92' lang='eng' dir='ltr'><em>22228T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 1035 445 1188 473; x_wconf 84' lang='eng' dir='ltr'>(AJ842343)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 757 480 1032 511; baseline 0.004 -7"><span class='ocrx_word' id='word_1_72' title='bbox 757 480 855 504; x_wconf 96' lang='eng' dir='ltr'><em>ND1-1T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 870 483 1032 511; x_wconf 82' lang='eng' dir='ltr'><em>(A3285018)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 775 523 1652 604">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 775 523 1652 604">
+     <span class='ocr_line' id='line_1_30' title="bbox 781 523 1652 554; baseline 0 -6"><span class='ocrx_word' id='word_1_74' title='bbox 781 526 924 548; x_wconf 85' lang='eng' dir='ltr'><em>Salinivibrio</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 934 526 1051 548; x_wconf 78' lang='eng' dir='ltr'><em>costicola</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1063 526 1147 554; x_wconf 86' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1157 526 1305 554; x_wconf 86' lang='eng' dir='ltr'><em>alca/iphi/us</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 1315 526 1378 548; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1392 523 1486 548; x_wconf 82' lang='eng' dir='ltr'><em>16359T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1500 526 1652 554; x_wconf 88' lang='eng' dir='ltr'>(AJ640132)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 775 573 1606 604; baseline -0.001 -6"><span class='ocrx_word' id='word_1_81' title='bbox 775 575 919 598; x_wconf 78' lang='eng' dir='ltr'><em>Sal/nivibrio</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 929 575 1045 598; x_wconf 83' lang='eng' dir='ltr'><em>costico/a</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1062 575 1146 604; x_wconf 81' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_84' title='bbox 1164 575 1280 598; x_wconf 77' lang='eng' dir='ltr'><em>cost/cola</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1303 575 1397 597; x_wconf 90' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1408 573 1470 597; x_wconf 88' lang='eng' dir='ltr'><em>701T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 1485 575 1606 604; x_wconf 86' lang='eng' dir='ltr'>(X95527)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 685 614 1640 685">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 685 614 1640 685">
+     <span class='ocr_line' id='line_1_32' title="bbox 760 614 1640 644; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 760 615 904 638; x_wconf 83' lang='eng' dir='ltr'><em>Salinivibrio</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 914 616 1030 638; x_wconf 72' lang='eng' dir='ltr'><em>cost/bola</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1049 616 1134 644; x_wconf 86' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1152 616 1300 638; x_wconf 77' lang='eng' dir='ltr'><em>val/ismon‘is</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1320 616 1382 639; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 1394 614 1473 639; x_wconf 89' lang='eng' dir='ltr'><em>8285T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1484 616 1640 644; x_wconf 86' lang='eng' dir='ltr'><em>(AF057016)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 685 654 1381 685; baseline 0.001 -8"><span class='ocrx_word' id='word_1_95' title='bbox 685 658 710 676; x_wconf 84' lang='eng'><em>97</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 745 656 888 678; x_wconf 76' lang='eng' dir='ltr'><em>Salin/vibrio</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 896 656 1067 684; x_wconf 83' lang='eng' dir='ltr'><em>proteolyticus</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1076 654 1204 678; x_wconf 90' lang='eng' dir='ltr'><em>AF—2004T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1218 656 1381 685; x_wconf 80' lang='eng' dir='ltr'>(D0092443)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 639 697 1178 728">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 639 697 1178 728">
+     <span class='ocr_line' id='line_1_34' title="bbox 639 697 1178 728; baseline 0 -6"><span class='ocrx_word' id='word_1_100' title='bbox 639 700 794 722; x_wconf 85' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 804 700 849 722; x_wconf 88' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 861 699 942 722; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 955 700 963 721; x_wconf 95' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 972 697 1048 722; x_wconf 91' lang='eng' dir='ltr'><em>1775T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1058 700 1178 728; x_wconf 89' lang='eng' dir='ltr'>(X80725)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 356 396 631 452">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 356 396 631 452">
+     <span class='ocr_line' id='line_1_35' title="bbox 356 396 631 452; baseline 0 0"><span class='ocrx_word' id='word_1_106' title='bbox 356 396 631 452; x_wconf 50' lang='eng' dir='ltr'><em>ﬂ:</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 600 445 634 466">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 600 445 634 466">
+     <span class='ocr_line' id='line_1_36' title="bbox 600 445 634 466; baseline 0 0"><span class='ocrx_word' id='word_1_107' title='bbox 600 445 634 466; x_wconf 92' lang='eng' dir='ltr'><em>En</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 330 307 332 489">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 330 307 332 489">
+     <span class='ocr_line' id='line_1_37' title="bbox 330 307 332 489; baseline 0 556"><span class='ocrx_word' id='word_1_108' title='bbox 330 307 332 489; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 330 487 356 489">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 330 487 356 489">
+     <span class='ocr_line' id='line_1_38' title="bbox 330 487 356 489; baseline 0 556"><span class='ocrx_word' id='word_1_109' title='bbox 330 487 356 489; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 350 489 778 674">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 350 489 778 674">
+     <span class='ocr_line' id='line_1_39' title="bbox 350 489 757 526; baseline 0 0"><span class='ocrx_word' id='word_1_110' title='bbox 350 489 757 526; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 350 526 778 599; baseline 0 -46"><span class='ocrx_word' id='word_1_111' title='bbox 350 526 778 599; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 667 599 757 649; baseline 0 -10"><span class='ocrx_word' id='word_1_112' title='bbox 667 599 757 649; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 681 649 743 674; baseline 0 0"><span class='ocrx_word' id='word_1_113' title='bbox 681 649 685 674; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> <span class='ocrx_word' id='word_1_114' title='bbox 710 649 743 674; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 319 503 344 521">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 319 503 344 521">
+     <span class='ocr_line' id='line_1_43' title="bbox 319 503 344 521; baseline 0 0"><span class='ocrx_word' id='word_1_115' title='bbox 319 503 344 521; x_wconf 83' lang='eng'>56</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 354 427 356 547">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 354 427 356 547">
+     <span class='ocr_line' id='line_1_44' title="bbox 354 427 356 547; baseline 0 498"><span class='ocrx_word' id='word_1_116' title='bbox 354 427 356 547; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 624 526 745 575">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 624 526 745 575">
+     <span class='ocr_line' id='line_1_45' title="bbox 708 526 745 544; baseline 0 0"><span class='ocrx_word' id='word_1_117' title='bbox 708 526 745 544; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 624 558 661 575; baseline 0 0"><span class='ocrx_word' id='word_1_118' title='bbox 624 558 661 575; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 650 612 675 630">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 650 612 675 630">
+     <span class='ocr_line' id='line_1_47' title="bbox 650 612 675 630; baseline 0 0"><span class='ocrx_word' id='word_1_119' title='bbox 650 612 675 630; x_wconf 87' lang='eng'><em>66</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 91 754 619 756">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 91 754 619 756">
+     <span class='ocr_line' id='line_1_48' title="bbox 91 754 619 756; baseline 0 289"><span class='ocrx_word' id='word_1_120' title='bbox 91 754 619 756; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 622 743 1182 773">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 622 743 1182 773">
+     <span class='ocr_line' id='line_1_49' title="bbox 622 743 1182 773; baseline 0 -6"><span class='ocrx_word' id='word_1_121' title='bbox 622 745 777 767; x_wconf 90' lang='eng' dir='ltr'><em>Aeromonas</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 786 745 911 767; x_wconf 83' lang='eng' dir='ltr'><em>biva/v/um</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 921 743 1003 767; x_wconf 88' lang='eng' dir='ltr'><em>868ET</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 1019 745 1182 773; x_wconf 86' lang='eng' dir='ltr'>(DQ504429)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 59 798 582 800">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 59 798 582 800">
+     <span class='ocr_line' id='line_1_50' title="bbox 59 798 582 800; baseline 0 245"><span class='ocrx_word' id='word_1_125' title='bbox 59 798 582 800; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 59 898 84 916">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 59 898 84 916">
+     <span class='ocr_line' id='line_1_51' title="bbox 59 898 84 916; baseline 0 0"><span class='ocrx_word' id='word_1_126' title='bbox 59 898 84 916; x_wconf 82' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 583 790 1237 821">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 583 790 1237 821">
+     <span class='ocr_line' id='line_1_52' title="bbox 583 790 1237 821; baseline 0 -6"><span class='ocrx_word' id='word_1_127' title='bbox 583 793 782 821; x_wconf 85' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 792 793 921 815; x_wconf 78' lang='eng' dir='ltr'><em>antarct/ca</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 937 792 1000 815; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 1014 790 1107 815; x_wconf 92' lang='eng' dir='ltr'><em>10704T</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 1116 793 1237 821; x_wconf 85' lang='eng' dir='ltr'>(Y14697)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 90 841 774 843">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 90 841 774 843">
+     <span class='ocr_line' id='line_1_53' title="bbox 90 841 774 843; baseline 0 202"><span class='ocrx_word' id='word_1_132' title='bbox 90 841 774 843; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 90 557 93 925">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 90 557 93 925">
+     <span class='ocr_line' id='line_1_54' title="bbox 90 557 93 925; baseline 0 120"><span class='ocrx_word' id='word_1_133' title='bbox 90 557 93 925; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 277 975 314 993">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 277 975 314 993">
+     <span class='ocr_line' id='line_1_55' title="bbox 277 975 314 993; baseline 0.027 -1"><span class='ocrx_word' id='word_1_134' title='bbox 277 975 314 993; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 773 834 1419 865">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 773 834 1419 865">
+     <span class='ocr_line' id='line_1_56' title="bbox 773 834 1419 865; baseline 0 -6"><span class='ocrx_word' id='word_1_135' title='bbox 773 837 978 859; x_wconf 83' lang='eng' dir='ltr'><em>Aestuariibacter</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 985 837 1120 865; x_wconf 81' lang='eng' dir='ltr'><em>halophi/us</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 1138 834 1255 859; x_wconf 76' lang='eng' dir='ltr'><em>JCZO43T</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 1262 837 1419 865; x_wconf 89' lang='eng' dir='ltr'><em>(AY207503)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 92 877 1375 963">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 97 877 1375 958">
+     <span class='ocr_line' id='line_1_57' title="bbox 618 877 1375 909; baseline 0 -6"><span class='ocrx_word' id='word_1_139' title='bbox 618 880 885 903; x_wconf 85' lang='eng' dir='ltr'><em>Pseudoa/teromonas</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 894 880 1069 909; x_wconf 79' lang='eng' dir='ltr'><em>bacteriolytica</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 1090 880 1139 902; x_wconf 89' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 1153 877 1375 909; x_wconf 78' lang='eng' dir='ltr'><em>14595T(D89929)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 97 922 1315 958; baseline 0 -12"><span class='ocrx_word' id='word_1_143' title='bbox 97 940 122 958; x_wconf 71' lang='eng'><em>62</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 326 924 801 946; x_wconf 82' lang='eng' dir='ltr'><em>—Pseudoalteromonas</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 815 924 973 952; x_wconf 82' lang='eng' dir='ltr'><em>halop/anktis</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 986 924 1067 946; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 1080 922 1173 946; x_wconf 83' lang='eng' dir='ltr'><em>14393T</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 1195 924 1315 952; x_wconf 90' lang='eng' dir='ltr'>(X67024)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 324 928 326 996">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 324 928 326 996">
+     <span class='ocr_line' id='line_1_59' title="bbox 324 928 326 996; baseline 0 49"><span class='ocrx_word' id='word_1_149' title='bbox 324 928 326 996; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 326 965 1283 1039">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 447 965 1283 1039">
+     <span class='ocr_line' id='line_1_60' title="bbox 506 965 1241 996; baseline 0 -6"><span class='ocrx_word' id='word_1_150' title='bbox 506 968 774 990; x_wconf 81' lang='eng' dir='ltr'><em>Pseudoalteromonas</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 782 968 897 996; x_wconf 81' lang='eng' dir='ltr'><em>piscicida</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 920 968 970 990; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 983 965 1077 990; x_wconf 81' lang='eng' dir='ltr'><em>12932T</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 1085 968 1241 996; x_wconf 86' lang='eng' dir='ltr'><em>(AF297959)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 447 1004 1283 1039; baseline 0 -6"><span class='ocrx_word' id='word_1_155' title='bbox 447 1004 485 1022; x_wconf 66' lang='eng'><em>10°</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 507 1011 775 1033; x_wconf 81' lang='eng' dir='ltr'><em>Pseudoalteromonas</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 784 1011 930 1033; x_wconf 83' lang='eng' dir='ltr'><em>mar/caloris</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 949 1009 1283 1039; x_wconf 72' lang='eng' dir='ltr'>LMG19692T(AF144036)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001784-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001784-0-000.pbm.png
new file mode 100644
index 00000000..21793490
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001784-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001784-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001784-0-000.pbm.png.hocr
new file mode 100644
index 00000000..bcb44b53
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001784-0-000.pbm.png.hocr
@@ -0,0 +1,126 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001784-0-000.pbm.png"; bbox 0 0 1183 772; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 239 0 1183 772">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 239 0 868 30">
+     <span class='ocr_line' id='line_1_1' title="bbox 239 0 868 30; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 239 4 266 23; x_wconf 90' lang='eng'><em>55</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 307 3 486 24; x_wconf 83' lang='eng' dir='ltr'><em>Xanthomonas</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 496 3 604 24; x_wconf 85' lang='eng' dir='ltr'><em>sacchan&#39;</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 613 2 672 24; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 683 0 742 24; x_wconf 91' lang='eng' dir='ltr'><em>471T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 753 3 868 30; x_wconf 89' lang='eng' dir='ltr'>(Y10766)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 303 37 1076 178">
+     <span class='ocr_line' id='line_1_2' title="bbox 323 37 892 66; baseline 0.002 -6"><span class='ocrx_word' id='word_1_7' title='bbox 323 40 502 61; x_wconf 81' lang='eng' dir='ltr'><em>Xanthomonas</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 511 40 610 61; x_wconf 88' lang='eng' dir='ltr'><em>melonis</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 621 39 680 61; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 691 37 766 61; x_wconf 83' lang='eng' dir='ltr'><em>8670T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 777 40 892 66; x_wconf 87' lang='eng' dir='ltr'>(Y10756)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 303 74 898 104; baseline 0 -6"><span class='ocrx_word' id='word_1_12' title='bbox 303 77 483 98; x_wconf 83' lang='eng' dir='ltr'><em>Xanthomonas</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 493 77 632 104; x_wconf 82' lang='eng' dir='ltr'><em>campestris</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 642 77 701 98; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 713 74 771 98; x_wconf 89' lang='eng' dir='ltr'><em>568T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 782 77 898 104; x_wconf 86' lang='eng' dir='ltr'><em>(X95917)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 311 111 1076 140; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 311 114 583 135; x_wconf 83' lang='eng' dir='ltr'><em>Pseudoxanthomonas</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 592 114 791 140; x_wconf 87' lang='eng' dir='ltr'><em>broegbemensis</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 802 111 920 135; x_wconf 89' lang='eng' dir='ltr'><em>B1616/1T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 930 114 1076 140; x_wconf 84' lang='eng' dir='ltr'><em>(AJO12231)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 324 148 981 178; baseline 0 -6"><span class='ocrx_word' id='word_1_21' title='bbox 324 151 567 178; x_wconf 82' lang='eng' dir='ltr'><em>Stenotrophomonas</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 577 151 714 178; x_wconf 82' lang='eng' dir='ltr'><em>maltophi/ia</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 725 151 784 172; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 796 148 854 172; x_wconf 84' lang='eng' dir='ltr'><em>958T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 865 151 981 178; x_wconf 83' lang='eng' dir='ltr'><em>(X95923)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 325 185 890 215">
+     <span class='ocr_line' id='line_1_6' title="bbox 325 185 890 215; baseline 0 -5"><span class='ocrx_word' id='word_1_26' title='bbox 325 188 346 209; x_wconf 91' lang='eng' dir='ltr'><em>X</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 344 188 409 215; x_wconf 88' lang='eng' dir='ltr'><em>ylel/a</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 420 188 540 210; x_wconf 81' lang='eng' dir='ltr'><em>fastidiosa</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 550 188 628 210; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 639 185 730 210; x_wconf 88' lang='eng' dir='ltr'><em>35879T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 740 188 890 215; x_wconf 88' lang='eng' dir='ltr'><em>(AF192343)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 326 223 917 252">
+     <span class='ocr_line' id='line_1_7' title="bbox 326 223 917 252; baseline -0.002 -5"><span class='ocrx_word' id='word_1_32' title='bbox 326 225 475 247; x_wconf 81' lang='eng' dir='ltr'><em>Luteimonas</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 485 225 592 252; x_wconf 84' lang='eng' dir='ltr'><em>mephitis</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 602 223 761 247; x_wconf 81' lang='eng' dir='ltr'><em>B1953/27.1T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 771 225 917 252; x_wconf 82' lang='eng' dir='ltr'><em>(AJ012228)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 310 260 970 363">
+     <span class='ocr_line' id='line_1_8' title="bbox 326 260 970 289; baseline -0.002 -5"><span class='ocrx_word' id='word_1_36' title='bbox 326 262 469 289; x_wconf 81' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 476 268 656 289; x_wconf 88' lang='eng' dir='ltr'><em>enzymogenes</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 666 262 726 284; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 738 260 813 284; x_wconf 88' lang='eng' dir='ltr'><em>2043T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 824 262 970 289; x_wconf 85' lang='eng' dir='ltr'><em>(AJ298291)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 310 297 924 326; baseline -0.002 -5"><span class='ocrx_word' id='word_1_41' title='bbox 310 299 454 326; x_wconf 83' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 461 299 605 321; x_wconf 80' lang='eng' dir='ltr'><em>antibioticus</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 616 299 675 321; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 687 297 762 321; x_wconf 77' lang='eng' dir='ltr'><em>2044T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 773 299 924 326; x_wconf 84' lang='eng' dir='ltr'><em>(ABO19582)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 314 334 842 363; baseline 0 -5"><span class='ocrx_word' id='word_1_46' title='bbox 314 337 462 358; x_wconf 82' lang='eng' dir='ltr'><em>Fulvimonas</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 471 337 515 358; x_wconf 90' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 524 336 583 358; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 596 334 685 358; x_wconf 78' lang='eng' dir='ltr'><em>19981T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 696 337 842 363; x_wconf 85' lang='eng' dir='ltr'><em>(AJ311653)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 347 371 798 401">
+     <span class='ocr_line' id='line_1_11' title="bbox 347 371 798 401; baseline 0 -6"><span class='ocrx_word' id='word_1_51' title='bbox 347 374 426 401; x_wconf 86' lang='eng' dir='ltr'><em>Dye/Ia</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 432 374 543 401; x_wconf 84' lang='eng' dir='ltr'><em>japonioa</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 552 371 636 395; x_wconf 84' lang='eng' dir='ltr'><em>XD53T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 647 374 798 401; x_wconf 86' lang='eng' dir='ltr'><em>(AB110498)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 349 408 797 438">
+     <span class='ocr_line' id='line_1_12' title="bbox 349 408 797 438; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 349 411 427 438; x_wconf 85' lang='eng' dir='ltr'><em>Dye/Ia</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 437 411 561 432; x_wconf 88' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 572 408 635 432; x_wconf 91' lang='eng' dir='ltr'><em>BB4T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 646 411 797 438; x_wconf 88' lang='eng' dir='ltr'><em>(AY884571)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 344 445 1075 698">
+     <span class='ocr_line' id='line_1_13' title="bbox 351 445 882 475; baseline 0 -6"><span class='ocrx_word' id='word_1_59' title='bbox 351 448 465 469; x_wconf 80' lang='eng' dir='ltr'><em>Frateuria</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 476 448 579 469; x_wconf 84' lang='eng' dir='ltr'><em>aurantia</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 590 448 635 469; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 646 445 721 469; x_wconf 81' lang='eng' dir='ltr'><em>3245T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 731 448 882 475; x_wconf 78' lang='eng' dir='ltr'><em>(ABOQ1194)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 352 483 991 512; baseline 0 -5"><span class='ocrx_word' id='word_1_64' title='bbox 352 485 552 507; x_wconf 82' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 558 485 710 512; x_wconf 76' lang='eng' dir='ltr'><em>ginseng/soli</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 719 483 831 507; x_wconf 91' lang='eng' dir='ltr'><em>GR17—7T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 842 485 991 512; x_wconf 93' lang='eng' dir='ltr'>(EF166075)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 344 520 932 549; baseline -0.002 -5"><span class='ocrx_word' id='word_1_68' title='bbox 344 522 545 544; x_wconf 84' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 551 522 695 549; x_wconf 83' lang='eng' dir='ltr'><em>spathiphylli</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 705 520 765 544; x_wconf 79' lang='eng' dir='ltr'><em>B39T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 776 522 932 549; x_wconf 88' lang='eng' dir='ltr'><em>(AM087226)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 353 557 914 586; baseline -0.002 -5"><span class='ocrx_word' id='word_1_72' title='bbox 353 559 552 581; x_wconf 83' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 560 560 633 581; x_wconf 88' lang='eng' dir='ltr'><em>terrae</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 644 557 754 581; x_wconf 82' lang='eng' dir='ltr'><em>GP18—1T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 764 559 914 586; x_wconf 92' lang='eng' dir='ltr'>(EF166076)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 389 594 1075 623; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 389 597 589 618; x_wconf 82' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 595 596 790 618; x_wconf 81' lang='eng' dir='ltr'><em>lindaniclasticus</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 801 594 915 618; x_wconf 81' lang='eng' dir='ltr'><em>RP5557T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 926 596 1075 623; x_wconf 88' lang='eng' dir='ltr'><em>(AFO39167)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 383 631 999 660; baseline 0 -5"><span class='ocrx_word' id='word_1_80' title='bbox 383 634 584 655; x_wconf 81' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 590 634 744 660; x_wconf 80' lang='eng' dir='ltr'><em>thiooxydans</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 754 631 837 655; x_wconf 78' lang='eng' dir='ltr'><em>LCSZT</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 847 634 999 660; x_wconf 76' lang='eng' dir='ltr'><em>(A8286179)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 373 668 889 698; baseline 0 -6"><span class='ocrx_word' id='word_1_84' title='bbox 373 671 573 692; x_wconf 81' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 580 671 655 692; x_wconf 87' lang='eng' dir='ltr'><em>fu/vus</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 663 668 727 698; x_wconf 88' lang='eng' dir='ltr'><em>Jip2T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 738 671 889 698; x_wconf 88' lang='eng' dir='ltr'><em>(AB100608)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 303 705 1183 772">
+     <span class='ocr_line' id='line_1_20' title="bbox 303 705 1183 736; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 303 705 330 724; x_wconf 76' lang='eng'>64</span> <span class='ocrx_word' id='word_1_89' title='bbox 368 708 583 730; x_wconf 86' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 589 708 854 736; x_wconf 88' lang='eng' dir='ltr'><em>ginsenosidimutans</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 863 708 933 730; x_wconf 91' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 944 706 1019 730; x_wconf 88' lang='eng' dir='ltr'><em>3054T</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 1029 708 1183 735; x_wconf 87' lang='eng' dir='ltr'><em>(EU332826)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 397 742 911 772; baseline 0 -6"><span class='ocrx_word' id='word_1_94' title='bbox 397 745 545 767; x_wconf 83' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 555 745 598 767; x_wconf 86' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 606 745 684 767; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 697 742 786 767; x_wconf 90' lang='eng' dir='ltr'><em>11775T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 796 745 911 772; x_wconf 89' lang='eng' dir='ltr'><em>(X80725)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 6 389 760">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 0 6 389 760">
+     <span class='ocr_line' id='line_1_22' title="bbox 231 6 317 59; baseline 0 0"><span class='ocrx_word' id='word_1_99' title='bbox 231 6 317 59; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 231 59 303 80; baseline 0 692"><span class='ocrx_word' id='word_1_100' title='bbox 231 59 303 80; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 184 80 311 154; baseline 0 -35"><span class='ocrx_word' id='word_1_101' title='bbox 184 80 311 154; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 119 154 319 230; baseline 0 -37"><span class='ocrx_word' id='word_1_102' title='bbox 119 154 319 230; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 119 230 319 283; baseline 0 0"><span class='ocrx_word' id='word_1_103' title='bbox 119 230 319 283; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 0 283 310 303; baseline 0 469"><span class='ocrx_word' id='word_1_104' title='bbox 0 283 310 303; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 0 303 310 340; baseline 0 432"><span class='ocrx_word' id='word_1_105' title='bbox 0 303 310 340; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 0 340 314 377; baseline 0 395"><span class='ocrx_word' id='word_1_106' title='bbox 0 340 314 377; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 0 377 343 416; baseline 0 356"><span class='ocrx_word' id='word_1_107' title='bbox 0 377 343 416; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 0 416 347 453; baseline 0 319"><span class='ocrx_word' id='word_1_108' title='bbox 0 416 347 453; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 0 453 347 506; baseline 0 0"><span class='ocrx_word' id='word_1_109' title='bbox 0 453 347 506; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 0 506 341 526; baseline 0 246"><span class='ocrx_word' id='word_1_110' title='bbox 0 506 341 526; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 0 526 344 563; baseline 0 209"><span class='ocrx_word' id='word_1_111' title='bbox 0 526 344 563; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 0 563 388 617; baseline 0 0"><span class='ocrx_word' id='word_1_112' title='bbox 0 563 388 617; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 0 617 383 653; baseline 0 0"><span class='ocrx_word' id='word_1_113' title='bbox 0 617 383 653; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 0 653 373 690; baseline 0 0"><span class='ocrx_word' id='word_1_114' title='bbox 0 653 373 690; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 0 690 303 713; baseline 0 59"><span class='ocrx_word' id='word_1_115' title='bbox 0 690 303 713; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 0 713 389 760; baseline 0 0"><span class='ocrx_word' id='word_1_116' title='bbox 0 713 389 760; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001792-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001792-0-000.pbm.png
new file mode 100644
index 00000000..ae4b1d36
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001792-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001792-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001792-0-000.pbm.png.hocr
new file mode 100644
index 00000000..c73ee9aa
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001792-0-000.pbm.png.hocr
@@ -0,0 +1,146 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001792-0-000.pbm.png"; bbox 0 0 1539 1047; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 154 9 433 57">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 154 9 433 57">
+     <span class='ocr_line' id='line_1_1' title="bbox 154 9 433 30; baseline 0 -5"><span class='ocrx_word' id='word_1_1' title='bbox 154 9 246 25; x_wconf 85' lang='eng' dir='ltr'><em>onsen/ed</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 255 9 312 25; x_wconf 80' lang='eng' dir='ltr'><em>Indels</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 321 13 336 25; x_wconf 90' lang='eng' dir='ltr'><em>In</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 344 13 411 30; x_wconf 80' lang='eng' dir='ltr'><em>gyrase</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 418 9 433 25; x_wconf 88' lang='eng' dir='ltr'>A</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 170 36 405 57; baseline 0.004 -5"><span class='ocrx_word' id='word_1_6' title='bbox 170 36 213 52; x_wconf 87' lang='eng' dir='ltr'>ATP</span> <span class='ocrx_word' id='word_1_7' title='bbox 222 36 311 57; x_wconf 82' lang='eng' dir='ltr'><em>synthase</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 320 36 361 53; x_wconf 74' lang='eng' dir='ltr'><em>beta</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 369 36 405 53; x_wconf 84' lang='eng' dir='ltr'><em>and</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 164 63 1285 105">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 164 63 1285 105">
+     <span class='ocr_line' id='line_1_3' title="bbox 164 63 413 84; baseline 0 -5"><span class='ocrx_word' id='word_1_10' title='bbox 164 63 259 79; x_wconf 84' lang='eng' dir='ltr'><em>ribosomal</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 268 63 335 84; x_wconf 76' lang='eng' dir='ltr'><em>protein</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 344 63 369 79; x_wconf 80' lang='eng'><em>52</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 378 63 413 79; x_wconf 83' lang='eng' dir='ltr'><em>and</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 612 84 1285 105; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 612 85 723 102; x_wconf 83' lang='eng'><em>100/99/100</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 767 84 904 105; x_wconf 82' lang='eng' dir='ltr'><em>Clostrldium</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 912 85 1031 105; x_wconf 84' lang='eng' dir='ltr'><em>botulinum</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1039 85 1057 105; x_wconf 91' lang='eng' dir='ltr'>A</span> <span class='ocrx_word' id='word_1_18' title='bbox 1067 85 1132 105; x_wconf 83' lang='eng' dir='ltr'><em>strain</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1141 84 1216 105; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1226 85 1285 105; x_wconf 86' lang='eng'><em>3502</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 106 116 1539 877">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 106 116 1539 877">
+     <span class='ocr_line' id='line_1_5' title="bbox 765 116 1266 142; baseline 0 -5"><span class='ocrx_word' id='word_1_21' title='bbox 765 116 902 137; x_wconf 82' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 911 117 1030 137; x_wconf 79' lang='eng' dir='ltr'><em>botulinum</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 1040 117 1054 137; x_wconf 97' lang='eng' dir='ltr'>F</span> <span class='ocrx_word' id='word_1_24' title='bbox 1064 117 1129 137; x_wconf 79' lang='eng' dir='ltr'><em>strain</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1141 117 1266 142; x_wconf 82' lang='eng' dir='ltr'>Langeland</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 351 148 995 183; baseline 0 -14"><span class='ocrx_word' id='word_1_26' title='bbox 351 159 449 175; x_wconf 55' lang='eng'><em>“30/38/58</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 495 166 569 183; x_wconf 35' lang='eng'><em>71/78/7</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 782 148 919 183; x_wconf 53' lang='eng' dir='ltr'><em>Closfridium</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 928 149 995 183; x_wconf 71' lang='eng' dir='ltr'><em>tetani</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 738 180 977 206; baseline -0.004 -5"><span class='ocrx_word' id='word_1_30' title='bbox 738 180 874 201; x_wconf 74' lang='eng' dir='ltr'><em>ClostrId/um</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 883 180 977 206; x_wconf 86' lang='eng' dir='ltr'><em>kluyven</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 732 212 1061 238; baseline 0 -5"><span class='ocrx_word' id='word_1_32' title='bbox 732 212 868 233; x_wconf 84' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 877 213 1061 238; x_wconf 82' lang='eng' dir='ltr'><em>acetobutylicum</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 805 244 1081 270; baseline -0.004 -5"><span class='ocrx_word' id='word_1_34' title='bbox 805 244 942 265; x_wconf 84' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 951 244 1081 270; x_wconf 84' lang='eng' dir='ltr'><em>beijerinckii</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 159 276 1178 304; baseline -0.003 -5"><span class='ocrx_word' id='word_1_36' title='bbox 159 282 257 299; x_wconf 81' lang='eng'><em>100/94/99</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 384 287 495 304; x_wconf 70' lang='eng' dir='ltr'><em>100/9moo</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 715 276 851 296; x_wconf 85' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 859 276 999 302; x_wconf 84' lang='eng' dir='ltr'><em>perfringens</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 1006 276 1080 296; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 1092 276 1178 296; x_wconf 83' lang='eng' dir='ltr'><em>13124T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 565 308 1099 334; baseline -0.002 -4"><span class='ocrx_word' id='word_1_42' title='bbox 565 314 675 331; x_wconf 85' lang='eng'><em>100/100/94</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 725 308 861 329; x_wconf 81' lang='eng' dir='ltr'><em>Clostridlum</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 869 308 1008 334; x_wconf 78' lang='eng' dir='ltr'><em>perfringens</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1017 308 1099 329; x_wconf 83' lang='eng' dir='ltr'>SM101</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 727 340 1048 366; baseline 0 -5"><span class='ocrx_word' id='word_1_46' title='bbox 727 340 864 361; x_wconf 78' lang='eng' dir='ltr'><em>Clostrldiurn</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 872 340 1011 366; x_wconf 78' lang='eng' dir='ltr'><em>pelfringens</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 1021 341 1048 361; x_wconf 83' lang='eng'><em>13</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 881 372 1231 398; baseline -0.003 -5"><span class='ocrx_word' id='word_1_49' title='bbox 881 372 1017 393; x_wconf 82' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1024 372 1231 398; x_wconf 81' lang='eng' dir='ltr'><em>phytofermentans</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 710 404 939 424; baseline 0 0"><span class='ocrx_word' id='word_1_51' title='bbox 710 404 846 424; x_wconf 76' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 856 404 939 424; x_wconf 86' lang='eng' dir='ltr'><em>difﬁci/e</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 228 436 974 462; baseline -0.004 -3"><span class='ocrx_word' id='word_1_53' title='bbox 228 443 338 459; x_wconf 83' lang='eng'><em>100/59/100</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 689 436 833 462; x_wconf 72' lang='eng' dir='ltr'><em>‘AIka/iphi/us</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 843 436 974 457; x_wconf 82' lang='eng' dir='ltr'><em>oremlandii’</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 334 466 1055 494; baseline 0.001 -6"><span class='ocrx_word' id='word_1_56' title='bbox 334 466 415 483; x_wconf 66' lang='eng'><em>100/96“</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 421 466 444 483; x_wconf 84' lang='eng'>00</span> <span class='ocrx_word' id='word_1_58' title='bbox 712 468 856 494; x_wconf 79' lang='eng' dir='ltr'><em>‘A/kaliphilus</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 865 468 1055 494; x_wconf 78' lang='eng' dir='ltr'><em>metal/iredigens’</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 584 500 895 520; baseline 0 0"><span class='ocrx_word' id='word_1_60' title='bbox 584 500 721 520; x_wconf 85' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 730 500 895 520; x_wconf 77' lang='eng' dir='ltr'><em>thermocellum</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 115 531 1050 557; baseline -0.002 -3"><span class='ocrx_word' id='word_1_62' title='bbox 115 537 126 554; x_wconf 82' lang='eng'><em>9</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 131 539 137 544; x_wconf 66' lang='eng'><em>‘</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 146 537 201 554; x_wconf 85' lang='eng'>81/82</span> <span class='ocrx_word' id='word_1_65' title='bbox 619 531 855 557; x_wconf 81' lang='eng' dir='ltr'><em>Caldicelluloslruptor</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 861 532 1050 557; x_wconf 80' lang='eng' dir='ltr'><em>saccharolytlcus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 334 564 1172 589; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 334 564 444 580; x_wconf 84' lang='eng'><em>100/55/100</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 693 564 951 584; x_wconf 76' lang='eng' dir='ltr'><em>Thermoanaerobacter</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 956 564 1172 589; x_wconf 81' lang='eng' dir='ltr'><em>pseudethanollcus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 595 596 1038 622; baseline 0.002 -6"><span class='ocrx_word' id='word_1_70' title='bbox 595 596 853 617; x_wconf 80' lang='eng' dir='ltr'><em>Thermoanaerobacter</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 859 596 1038 622; x_wconf 82' lang='eng' dir='ltr'><em>tengcongensis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 656 628 1044 654; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 656 628 868 654; x_wconf 79' lang='eng' dir='ltr'><em>Symbiobacterium</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 878 628 1044 653; x_wconf 80' lang='eng' dir='ltr'><em>thermophilum</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 670 660 1026 680; baseline 0 0"><span class='ocrx_word' id='word_1_74' title='bbox 670 660 898 680; x_wconf 80' lang='eng' dir='ltr'><em>Desulﬁtobacterium</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 907 660 1026 680; x_wconf 88' lang='eng' dir='ltr'><em>hafniense</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 106 692 1058 744; baseline 0 -32"><span class='ocrx_word' id='word_1_76' title='bbox 106 718 192 735; x_wconf 51' lang='eng' dir='ltr'><em>“JO/51,—</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 248 705 345 722; x_wconf 56' lang='eng' dir='ltr'><em>womwg</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 601 724 623 744; x_wconf 82' lang='eng' dir='ltr'><em>M</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 770 692 978 726; x_wconf 71' lang='eng' dir='ltr'><em>Syntrophomonas</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 988 692 1058 712; x_wconf 88' lang='eng' dir='ltr'><em>wolfei</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 242 724 887 744; baseline 0 0"><span class='ocrx_word' id='word_1_81' title='bbox 242 728 594 732; x_wconf 81' lang='eng'><em>——</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 623 724 705 744; x_wconf 84' lang='eng' dir='ltr'><em>oorel/a</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 715 724 887 744; x_wconf 75' lang='eng' dir='ltr'><em>thermoacetlca</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 133 754 1072 781; baseline 0 -5"><span class='ocrx_word' id='word_1_84' title='bbox 133 754 195 771; x_wconf 76' lang='eng'><em>81/-/-</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 600 755 833 781; x_wconf 81' lang='eng' dir='ltr'><em>Carboxydothermus</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 842 756 855 776; x_wconf 88' lang='eng' dir='ltr'><em>h</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 856 755 1072 781; x_wconf 83' lang='eng' dir='ltr'><em>ydrogenoformans</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 150 787 955 808; baseline 0.001 -1"><span class='ocrx_word' id='word_1_88' title='bbox 150 790 237 807; x_wconf 83' lang='eng'><em>99/73/85</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 594 787 828 808; x_wconf 75' lang='eng' dir='ltr'><em>‘Desulfotomaculum</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 837 788 955 808; x_wconf 85' lang='eng' dir='ltr'><em>reducens’</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 321 819 1539 845; baseline 0.002 -8"><span class='ocrx_word' id='word_1_91' title='bbox 321 821 431 837; x_wconf 82' lang='eng'><em>100/99/100</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1292 819 1438 845; x_wconf 87' lang='eng' dir='ltr'><em>Ureap/asma</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 1447 825 1539 845; x_wconf 87' lang='eng' dir='ltr'><em>parvum</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 1140 851 1419 877; baseline 0.004 -6"><span class='ocrx_word' id='word_1_94' title='bbox 1140 851 1293 877; x_wconf 86' lang='eng' dir='ltr'><em>Mycop/asma</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 1303 851 1419 877; x_wconf 82' lang='eng' dir='ltr'><em>mycoides</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 122 0 457 117">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 122 0 457 117">
+     <span class='ocr_line' id='line_1_29' title="bbox 122 0 457 117; baseline 0 930"><span class='ocrx_word' id='word_1_96' title='bbox 122 0 457 117; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 53 174 235 191">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 53 174 235 191">
+     <span class='ocr_line' id='line_1_30' title="bbox 53 174 235 191; baseline 0 0"><span class='ocrx_word' id='word_1_97' title='bbox 53 179 76 191; x_wconf 83' lang='eng' dir='ltr'><em>aa</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 84 174 186 191; x_wconf 81' lang='eng' dir='ltr'><em>conserved</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 196 174 235 191; x_wconf 85' lang='eng' dir='ltr'>inse</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 28 201 424 250">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 28 201 424 250">
+     <span class='ocr_line' id='line_1_31' title="bbox 28 201 424 225; baseline 0 -7"><span class='ocrx_word' id='word_1_100' title='bbox 28 201 43 218; x_wconf 92' lang='eng' dir='ltr'>in</span> <span class='ocrx_word' id='word_1_101' title='bbox 52 201 229 223; x_wconf 79' lang='eng' dir='ltr'><em>phosphoglycerate</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 314 208 424 225; x_wconf 74' lang='eng'><em>100/97/100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 51 229 206 250; baseline 0 -5"><span class='ocrx_word' id='word_1_103' title='bbox 51 229 206 250; x_wconf 83' lang='eng' dir='ltr'><em>dehydrogenase</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 0 166 261 254">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 0 166 261 254">
+     <span class='ocr_line' id='line_1_33' title="bbox 0 166 261 254; baseline 0 793"><span class='ocrx_word' id='word_1_104' title='bbox 0 166 261 254; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 76 428 163 444">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 76 428 163 444">
+     <span class='ocr_line' id='line_1_34' title="bbox 76 428 163 444; baseline 0 0"><span class='ocrx_word' id='word_1_105' title='bbox 76 428 163 444; x_wconf 87' lang='eng'><strong>79/60/99</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 258 890 813 892">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 258 890 813 892">
+     <span class='ocr_line' id='line_1_35' title="bbox 258 890 813 892; baseline 0 155"><span class='ocrx_word' id='word_1_106' title='bbox 258 890 813 892; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 85 884 1101 968">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 85 884 1101 968">
+     <span class='ocr_line' id='line_1_36' title="bbox 85 884 1101 910; baseline -0.001 -5"><span class='ocrx_word' id='word_1_107' title='bbox 85 888 182 905; x_wconf 84' lang='eng'><em>100/93/93</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 822 884 982 904; x_wconf 77' lang='eng' dir='ltr'><em>Lactobacillus</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 987 884 1101 910; x_wconf 86' lang='eng' dir='ltr'><em>johnsonii</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 138 915 985 942; baseline -0.004 -3"><span class='ocrx_word' id='word_1_110' title='bbox 138 923 236 939; x_wconf 83' lang='eng' dir='ltr'><em>100/96l62</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 328 922 695 925; x_wconf 90' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_112' title='bbox 700 915 893 942; x_wconf 84' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 902 921 985 936; x_wconf 82' lang='eng' dir='ltr'><em>aureus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 201 948 804 968; baseline 0.007 -4"><span class='ocrx_word' id='word_1_114' title='bbox 201 948 311 965; x_wconf 83' lang='eng'><em>100/99/100</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 616 948 711 968; x_wconf 79' lang='eng' dir='ltr'><em>Bacillus</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 720 948 804 968; x_wconf 80' lang='eng' dir='ltr'><em>subti/is</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 76 990 880 992">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 76 990 880 992">
+     <span class='ocr_line' id='line_1_39' title="bbox 76 990 880 992; baseline 0 55"><span class='ocrx_word' id='word_1_117' title='bbox 76 990 880 992; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 841 980 1228 1047">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 841 980 1228 1047">
+     <span class='ocr_line' id='line_1_40' title="bbox 886 980 1228 1005; baseline 0 -5"><span class='ocrx_word' id='word_1_118' title='bbox 886 980 1071 1005; x_wconf 84' lang='eng' dir='ltr'><em>Mycobacterium</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 1081 980 1228 1000; x_wconf 85' lang='eng' dir='ltr'><em>tuberculosis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 841 1021 1136 1047; baseline 0 -6"><span class='ocrx_word' id='word_1_120' title='bbox 841 1021 1009 1047; x_wconf 78' lang='eng' dir='ltr'><em>Streptomyces</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 1018 1021 1136 1041; x_wconf 85' lang='eng' dir='ltr'><em>coelicolor</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-000.pbm.png
new file mode 100644
index 00000000..b86b1418
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-000.pbm.png.hocr
new file mode 100644
index 00000000..15d28447
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-000.pbm.png.hocr
@@ -0,0 +1,400 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001800-0-000.pbm.png"; bbox 0 0 1302 2035; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 463 1332 484 1348">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 463 1332 484 1348">
+     <span class='ocr_line' id='line_1_1' title="bbox 463 1332 484 1348; baseline -0.048 0"><span class='ocrx_word' id='word_1_1' title='bbox 463 1332 484 1348; x_wconf 87' lang='eng'><strong>54</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 457 1354 493 1356">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 457 1354 493 1356">
+     <span class='ocr_line' id='line_1_2' title="bbox 457 1354 493 1356; baseline 0 679"><span class='ocrx_word' id='word_1_2' title='bbox 457 1354 493 1356; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 491 1203 495 1508">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 491 1203 495 1508">
+     <span class='ocr_line' id='line_1_3' title="bbox 491 1203 495 1508; baseline 0 527"><span class='ocrx_word' id='word_1_3' title='bbox 491 1203 495 1508; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 617 17 671 752">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 617 17 671 752">
+     <span class='ocr_line' id='line_1_4' title="bbox 619 17 644 130; baseline 0.04 -44"><span class='ocrx_word' id='word_1_4' title='bbox 619 17 644 130; x_wconf 95' lang='eng' dir='ltr'>    </span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 617 130 644 259; baseline 0.037 -44"><span class='ocrx_word' id='word_1_5' title='bbox 617 130 644 259; x_wconf 95' lang='eng' dir='ltr'>    </span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 617 259 644 386; baseline 0 -86"><span class='ocrx_word' id='word_1_6' title='bbox 617 259 644 386; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 617 386 644 416; baseline 0 1619"><span class='ocrx_word' id='word_1_7' title='bbox 617 386 644 416; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 617 476 633 558; baseline 0 -44"><span class='ocrx_word' id='word_1_8' title='bbox 617 476 633 558; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 617 558 661 686; baseline 0 -86"><span class='ocrx_word' id='word_1_9' title='bbox 617 558 661 686; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 623 686 671 752; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 623 686 671 752; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 600 255 619 270">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 600 255 619 270">
+     <span class='ocr_line' id='line_1_11' title="bbox 600 255 619 270; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 600 255 619 270; x_wconf 74' lang='eng'><strong>41</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 564 610 585 626">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 564 610 585 626">
+     <span class='ocr_line' id='line_1_12' title="bbox 564 610 585 626; baseline -0.048 0"><span class='ocrx_word' id='word_1_12' title='bbox 564 610 585 626; x_wconf 81' lang='eng'>82</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 541 628 719 1219">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 541 628 675 1201">
+     <span class='ocr_line' id='line_1_13' title="bbox 572 628 596 686; baseline 0 -43"><span class='ocrx_word' id='word_1_13' title='bbox 572 628 596 686; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 541 686 583 771; baseline 0 -43"><span class='ocrx_word' id='word_1_14' title='bbox 541 686 583 771; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 541 771 586 814; baseline 0 1221"><span class='ocrx_word' id='word_1_15' title='bbox 541 771 586 814; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 541 814 619 899; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 541 814 619 899; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 572 899 661 985; baseline 0 -41"><span class='ocrx_word' id='word_1_17' title='bbox 572 899 661 985; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 572 985 661 1072; baseline 0 0"><span class='ocrx_word' id='word_1_18' title='bbox 572 985 661 1072; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 604 1072 675 1201; baseline 0 -88"><span class='ocrx_word' id='word_1_19' title='bbox 604 1072 675 1201; x_wconf 95' lang='eng' dir='ltr'>    </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 601 643 622 658">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 601 643 622 658">
+     <span class='ocr_line' id='line_1_20' title="bbox 601 643 622 658; baseline 0 0"><span class='ocrx_word' id='word_1_20' title='bbox 601 643 622 658; x_wconf 85' lang='eng'>55</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 594 453 596 833">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 594 453 596 833">
+     <span class='ocr_line' id='line_1_21' title="bbox 594 453 596 833; baseline 0 1202"><span class='ocrx_word' id='word_1_21' title='bbox 594 453 596 833; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 515 1018 536 1033">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 515 1018 536 1033">
+     <span class='ocr_line' id='line_1_22' title="bbox 515 1018 536 1033; baseline 0 0"><span class='ocrx_word' id='word_1_22' title='bbox 515 1018 536 1033; x_wconf 85' lang='eng'>59</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 635 1209 651 1224">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 635 1209 651 1224">
+     <span class='ocr_line' id='line_1_23' title="bbox 635 1209 651 1224; baseline 0 0"><span class='ocrx_word' id='word_1_23' title='bbox 635 1209 651 1224; x_wconf 94' lang='eng'><strong>11</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 543 799 545 1390">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 543 799 545 1390">
+     <span class='ocr_line' id='line_1_24' title="bbox 543 799 545 1390; baseline 0 645"><span class='ocrx_word' id='word_1_24' title='bbox 543 799 545 1390; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 492 1506 550 1508">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 492 1506 550 1508">
+     <span class='ocr_line' id='line_1_25' title="bbox 492 1506 550 1508; baseline 0 527"><span class='ocrx_word' id='word_1_25' title='bbox 492 1506 550 1508; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 428 1510 450 1525">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 428 1510 450 1525">
+     <span class='ocr_line' id='line_1_26' title="bbox 428 1510 450 1525; baseline 0 0"><span class='ocrx_word' id='word_1_26' title='bbox 428 1510 450 1525; x_wconf 84' lang='eng'>63</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 413 1532 459 1534">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 413 1532 459 1534">
+     <span class='ocr_line' id='line_1_27' title="bbox 413 1532 459 1534; baseline 0 501"><span class='ocrx_word' id='word_1_27' title='bbox 413 1532 459 1534; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 6 1684 415 1686">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 6 1684 415 1686">
+     <span class='ocr_line' id='line_1_28' title="bbox 6 1684 415 1686; baseline 0 349"><span class='ocrx_word' id='word_1_28' title='bbox 6 1684 415 1686; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 6 1684 8 1946">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 6 1684 8 1946">
+     <span class='ocr_line' id='line_1_29' title="bbox 6 1684 8 1946; baseline 0 89"><span class='ocrx_word' id='word_1_29' title='bbox 6 1684 8 1946; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 413 1532 415 1839">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 413 1532 415 1839">
+     <span class='ocr_line' id='line_1_30' title="bbox 413 1532 415 1839; baseline 0 196"><span class='ocrx_word' id='word_1_30' title='bbox 413 1532 415 1839; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 457 1354 459 1708">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 457 1354 459 1708">
+     <span class='ocr_line' id='line_1_31' title="bbox 457 1354 459 1708; baseline 0 327"><span class='ocrx_word' id='word_1_31' title='bbox 457 1354 459 1708; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 485 1772 507 1787">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 485 1772 507 1787">
+     <span class='ocr_line' id='line_1_32' title="bbox 485 1772 507 1787; baseline 0 0"><span class='ocrx_word' id='word_1_32' title='bbox 485 1772 507 1787; x_wconf 86' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 593 11 1161 675">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 593 11 1161 675">
+     <span class='ocr_line' id='line_1_33' title="bbox 633 11 1047 34; baseline 0 -5"><span class='ocrx_word' id='word_1_33' title='bbox 633 11 774 34; x_wconf 77' lang='eng' dir='ltr'>Clyplococcus</span> <span class='ocrx_word' id='word_1_34' title='bbox 782 16 810 33; x_wconf 88' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_35' title='bbox 818 12 916 29; x_wconf 79' lang='eng' dir='ltr'>AA-090.4</span> <span class='ocrx_word' id='word_1_36' title='bbox 925 11 1047 33; x_wconf 81' lang='eng' dir='ltr'>(AY188363)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 649 54 1096 76; baseline 0 -5"><span class='ocrx_word' id='word_1_37' title='bbox 649 54 790 76; x_wconf 82' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_38' title='bbox 797 54 907 71; x_wconf 82' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_39' title='bbox 916 54 966 71; x_wconf 85' lang='eng' dir='ltr'>L146</span> <span class='ocrx_word' id='word_1_40' title='bbox 975 54 1096 76; x_wconf 85' lang='eng' dir='ltr'>(EF116912)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 633 97 1112 119; baseline 0 -5"><span class='ocrx_word' id='word_1_41' title='bbox 633 97 774 119; x_wconf 77' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_42' title='bbox 782 97 892 114; x_wconf 86' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_43' title='bbox 901 97 983 114; x_wconf 85' lang='eng' dir='ltr'>HB1043</span> <span class='ocrx_word' id='word_1_44' title='bbox 992 97 1112 119; x_wconf 87' lang='eng' dir='ltr'>(AJ509857)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 634 135 1161 162; baseline 0 -4"><span class='ocrx_word' id='word_1_45' title='bbox 634 140 788 162; x_wconf 79' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_46' title='bbox 796 140 915 158; x_wconf 79' lang='eng' dir='ltr'>flavescens</span> <span class='ocrx_word' id='word_1_47' title='bbox 924 140 971 158; x_wconf 87' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_48' title='bbox 979 135 1027 158; x_wconf 67' lang='eng' dir='ltr'>942Y</span> <span class='ocrx_word' id='word_1_49' title='bbox 1035 140 1161 162; x_wconf 83' lang='eng' dir='ltr'>(A8085796)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 649 182 1076 205; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 649 183 790 205; x_wconf 83' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_51' title='bbox 798 187 826 204; x_wconf 88' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_52' title='bbox 836 183 940 200; x_wconf 88' lang='eng' dir='ltr'>HX-2006a</span> <span class='ocrx_word' id='word_1_53' title='bbox 948 182 1076 205; x_wconf 85' lang='eng' dir='ltr'>(DQ333277)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 633 226 1042 248; baseline 0 -4"><span class='ocrx_word' id='word_1_54' title='bbox 633 226 774 248; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_55' title='bbox 782 231 810 248; x_wconf 84' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_56' title='bbox 821 226 901 244; x_wconf 89' lang='eng' dir='ltr'>HB1122</span> <span class='ocrx_word' id='word_1_57' title='bbox 912 226 1042 248; x_wconf 83' lang='eng' dir='ltr'>(AM039434)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 649 267 1137 289; baseline 0 -4"><span class='ocrx_word' id='word_1_58' title='bbox 649 267 790 289; x_wconf 78' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_59' title='bbox 798 267 908 285; x_wconf 86' lang='eng' dir='ltr'>flavescens</span> <span class='ocrx_word' id='word_1_60' title='bbox 915 267 1003 285; x_wconf 87' lang='eng' dir='ltr'>TJY36-3</span> <span class='ocrx_word' id='word_1_61' title='bbox 1012 267 1137 289; x_wconf 84' lang='eng' dir='ltr'>(EU301625)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 633 311 1138 333; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 633 311 774 333; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_63' title='bbox 782 311 892 328; x_wconf 86' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_64' title='bbox 900 311 946 328; x_wconf 91' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_65' title='bbox 955 311 1005 328; x_wconf 88' lang='eng'>9909</span> <span class='ocrx_word' id='word_1_66' title='bbox 1014 311 1138 333; x_wconf 87' lang='eng' dir='ltr'>(AB085807)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 644 353 1086 375; baseline 0 -4"><span class='ocrx_word' id='word_1_67' title='bbox 644 353 785 375; x_wconf 74' lang='eng' dir='ltr'>Cryptacoccus</span> <span class='ocrx_word' id='word_1_68' title='bbox 793 353 903 371; x_wconf 85' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_69' title='bbox 911 353 954 371; x_wconf 77' lang='eng' dir='ltr'>GGO</span> <span class='ocrx_word' id='word_1_70' title='bbox 962 353 1086 375; x_wconf 86' lang='eng' dir='ltr'>(ABO16233)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 649 396 1135 419; baseline 0 -5"><span class='ocrx_word' id='word_1_71' title='bbox 649 396 790 419; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_72' title='bbox 798 396 908 414; x_wconf 86' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_73' title='bbox 917 397 945 414; x_wconf 91' lang='eng' dir='ltr'>RT</span> <span class='ocrx_word' id='word_1_74' title='bbox 953 397 1003 414; x_wconf 20' lang='eng'>3.513</span> <span class='ocrx_word' id='word_1_75' title='bbox 1013 396 1135 419; x_wconf 82' lang='eng' dir='ltr'>(AY731784)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 593 431 1137 461; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 593 431 614 446; x_wconf 69' lang='eng'>32</span> <span class='ocrx_word' id='word_1_77' title='bbox 633 439 774 461; x_wconf 76' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_78' title='bbox 782 439 892 456; x_wconf 83' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_79' title='bbox 901 439 947 456; x_wconf 89' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_80' title='bbox 955 439 1005 456; x_wconf 88' lang='eng'>6473</span> <span class='ocrx_word' id='word_1_81' title='bbox 1014 439 1137 461; x_wconf 86' lang='eng' dir='ltr'>(AF487885)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 633 481 1120 503; baseline -0.002 -4"><span class='ocrx_word' id='word_1_82' title='bbox 633 481 774 503; x_wconf 82' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_83' title='bbox 782 481 892 499; x_wconf 81' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_84' title='bbox 901 481 981 499; x_wconf 87' lang='eng' dir='ltr'>HB1178</span> <span class='ocrx_word' id='word_1_85' title='bbox 992 481 1120 503; x_wconf 84' lang='eng' dir='ltr'>(AM160631)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 633 524 1101 547; baseline 0 -5"><span class='ocrx_word' id='word_1_86' title='bbox 633 524 774 547; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_87' title='bbox 782 524 892 542; x_wconf 85' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_88' title='bbox 900 524 969 542; x_wconf 70' lang='eng' dir='ltr'>J075.4</span> <span class='ocrx_word' id='word_1_89' title='bbox 978 524 1088 547; x_wconf 83' lang='eng' dir='ltr'>(AY188361</span> <span class='ocrx_word' id='word_1_90' title='bbox 1096 524 1101 547; x_wconf 93' lang='eng'>)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 646 567 1149 589; baseline 0 -5"><span class='ocrx_word' id='word_1_91' title='bbox 646 567 786 589; x_wconf 79' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_92' title='bbox 795 567 905 584; x_wconf 78' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_93' title='bbox 913 567 1018 584; x_wconf 77' lang='eng'>8602-048</span> <span class='ocrx_word' id='word_1_94' title='bbox 1027 567 1149 589; x_wconf 83' lang='eng' dir='ltr'>(EF068213)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 661 610 1109 632; baseline 0 -5"><span class='ocrx_word' id='word_1_95' title='bbox 661 610 801 632; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_96' title='bbox 809 610 892 627; x_wconf 81' lang='eng' dir='ltr'>Iaurentii</span> <span class='ocrx_word' id='word_1_97' title='bbox 899 610 973 627; x_wconf 87' lang='eng' dir='ltr'>GS42A</span> <span class='ocrx_word' id='word_1_98' title='bbox 981 610 1109 632; x_wconf 85' lang='eng' dir='ltr'>(DQ862855)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 661 653 1089 675; baseline 0 -5"><span class='ocrx_word' id='word_1_99' title='bbox 661 653 801 675; x_wconf 79' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_100' title='bbox 809 653 892 670; x_wconf 85' lang='eng' dir='ltr'>Iaurentii</span> <span class='ocrx_word' id='word_1_101' title='bbox 899 653 958 670; x_wconf 85' lang='eng' dir='ltr'>KSNZ</span> <span class='ocrx_word' id='word_1_102' title='bbox 967 653 1089 675; x_wconf 87' lang='eng' dir='ltr'>(EF635635)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 604 738 1195 1017">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 604 738 1195 1017">
+     <span class='ocr_line' id='line_1_49' title="bbox 661 738 1118 760; baseline 0 -4"><span class='ocrx_word' id='word_1_103' title='bbox 661 738 801 760; x_wconf 76' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_104' title='bbox 809 738 920 756; x_wconf 83' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_105' title='bbox 928 739 984 756; x_wconf 91' lang='eng' dir='ltr'>M155</span> <span class='ocrx_word' id='word_1_106' title='bbox 993 738 1118 760; x_wconf 84' lang='eng' dir='ltr'>(EU386716)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 604 781 1027 803; baseline 0 -5"><span class='ocrx_word' id='word_1_107' title='bbox 604 781 745 803; x_wconf 82' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_108' title='bbox 753 785 781 803; x_wconf 82' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_109' title='bbox 791 781 837 798; x_wconf 87' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_110' title='bbox 846 781 896 798; x_wconf 82' lang='eng'>8372</span> <span class='ocrx_word' id='word_1_111' title='bbox 906 781 1027 803; x_wconf 88' lang='eng' dir='ltr'>(AF444707)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 604 823 1091 845; baseline 0 -4"><span class='ocrx_word' id='word_1_112' title='bbox 604 823 745 845; x_wconf 80' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_113' title='bbox 753 823 863 841; x_wconf 78' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_114' title='bbox 872 823 959 841; x_wconf 81' lang='eng' dir='ltr'>SM3$07</span> <span class='ocrx_word' id='word_1_115' title='bbox 968 823 1091 845; x_wconf 84' lang='eng' dir='ltr'>(EF460580)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 619 866 1095 888; baseline 0 -4"><span class='ocrx_word' id='word_1_116' title='bbox 619 866 760 888; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_117' title='bbox 767 866 849 884; x_wconf 80' lang='eng' dir='ltr'><em>laurentii</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 857 866 903 884; x_wconf 86' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_119' title='bbox 912 866 962 884; x_wconf 85' lang='eng'>8645</span> <span class='ocrx_word' id='word_1_120' title='bbox 971 866 1095 888; x_wconf 75' lang='eng' dir='ltr'>(ABOB7253)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 665 910 1195 933; baseline 0 -5"><span class='ocrx_word' id='word_1_121' title='bbox 665 911 805 933; x_wconf 80' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_122' title='bbox 813 911 904 928; x_wconf 77' lang='eng' dir='ltr'>terrestris</span> <span class='ocrx_word' id='word_1_123' title='bbox 912 911 1056 928; x_wconf 83' lang='eng' dir='ltr'>C107DX4-Y11</span> <span class='ocrx_word' id='word_1_124' title='bbox 1068 910 1195 933; x_wconf 85' lang='eng' dir='ltr'>(EF599104)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 665 952 1070 974; baseline 0 -5"><span class='ocrx_word' id='word_1_125' title='bbox 665 952 805 974; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_126' title='bbox 813 956 842 974; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_127' title='bbox 851 952 937 969; x_wconf 77' lang='eng' dir='ltr'>CABSSO</span> <span class='ocrx_word' id='word_1_128' title='bbox 946 952 1070 974; x_wconf 82' lang='eng' dir='ltr'>(EU427438)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 665 995 1110 1017; baseline 0 -5"><span class='ocrx_word' id='word_1_129' title='bbox 665 995 805 1017; x_wconf 83' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_130' title='bbox 813 995 904 1012; x_wconf 78' lang='eng' dir='ltr'>terrestris</span> <span class='ocrx_word' id='word_1_131' title='bbox 912 995 975 1017; x_wconf 85' lang='eng' dir='ltr'><strong>Ep11c</strong></span> <span class='ocrx_word' id='word_1_132' title='bbox 983 995 1110 1017; x_wconf 88' lang='eng' dir='ltr'>(EU200780)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 665 1038 1129 1102">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 665 1038 1129 1102">
+     <span class='ocr_line' id='line_1_56' title="bbox 665 1038 1080 1061; baseline -0.002 -4"><span class='ocrx_word' id='word_1_133' title='bbox 665 1039 805 1061; x_wconf 80' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_134' title='bbox 812 1039 895 1057; x_wconf 74' lang='eng' dir='ltr'>Iaurentif</span> <span class='ocrx_word' id='word_1_135' title='bbox 903 1039 946 1057; x_wconf 80' lang='eng' dir='ltr'>8H3</span> <span class='ocrx_word' id='word_1_136' title='bbox 955 1038 1080 1061; x_wconf 80' lang='eng' dir='ltr'>(EF644463)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 665 1080 1129 1102; baseline -0.002 -4"><span class='ocrx_word' id='word_1_137' title='bbox 665 1080 805 1102; x_wconf 82' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_138' title='bbox 813 1080 924 1098; x_wconf 83' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_139' title='bbox 932 1080 992 1098; x_wconf 88' lang='eng' dir='ltr'>DGR1</span> <span class='ocrx_word' id='word_1_140' title='bbox 1004 1080 1129 1102; x_wconf 85' lang='eng' dir='ltr'>(EU441902)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 665 1161 1199 1188">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 665 1161 1199 1188">
+     <span class='ocr_line' id='line_1_58' title="bbox 665 1161 1199 1188; baseline 0 -5"><span class='ocrx_word' id='word_1_141' title='bbox 665 1166 820 1188; x_wconf 80' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_142' title='bbox 828 1166 928 1183; x_wconf 69' lang='eng' dir='ltr'>terrestris</span> <span class='ocrx_word' id='word_1_143' title='bbox 937 1166 1011 1183; x_wconf 84' lang='eng' dir='ltr'>CJDX4</span> <span class='ocrx_word' id='word_1_144' title='bbox 1019 1161 1069 1183; x_wconf 85' lang='eng' dir='ltr'>Y23T</span> <span class='ocrx_word' id='word_1_145' title='bbox 1077 1166 1199 1188; x_wconf 85' lang='eng' dir='ltr'>(EF370393)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 514 1251 1073 1487">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 514 1251 1073 1487">
+     <span class='ocr_line' id='line_1_59' title="bbox 624 1251 1047 1273; baseline 0 -5"><span class='ocrx_word' id='word_1_146' title='bbox 624 1251 764 1273; x_wconf 79' lang='eng' dir='ltr'>Cryplococcus</span> <span class='ocrx_word' id='word_1_147' title='bbox 772 1256 801 1273; x_wconf 81' lang='eng' dir='ltr'>5p.</span> <span class='ocrx_word' id='word_1_148' title='bbox 811 1251 857 1269; x_wconf 88' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_149' title='bbox 865 1251 916 1269; x_wconf 82' lang='eng'>8366</span> <span class='ocrx_word' id='word_1_150' title='bbox 925 1251 1047 1273; x_wconf 89' lang='eng' dir='ltr'>(AF444702)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 546 1261 1047 1316; baseline -0.002 -4"><span class='ocrx_word' id='word_1_151' title='bbox 546 1261 616 1309; x_wconf 43' lang='eng' dir='ltr'>j.</span> <span class='ocrx_word' id='word_1_152' title='bbox 624 1294 765 1316; x_wconf 84' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_153' title='bbox 772 1299 801 1316; x_wconf 86' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_154' title='bbox 811 1294 857 1312; x_wconf 85' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_155' title='bbox 865 1294 916 1312; x_wconf 81' lang='eng'>8358</span> <span class='ocrx_word' id='word_1_156' title='bbox 925 1294 1047 1316; x_wconf 83' lang='eng' dir='ltr'>(AF444698)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 553 1335 1041 1362; baseline 0 -5"><span class='ocrx_word' id='word_1_157' title='bbox 553 1339 708 1362; x_wconf 75' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_158' title='bbox 716 1344 792 1357; x_wconf 87' lang='eng' dir='ltr'>aureus</span> <span class='ocrx_word' id='word_1_159' title='bbox 800 1339 847 1357; x_wconf 85' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_160' title='bbox 856 1335 904 1357; x_wconf 65' lang='eng'>3181</span> <span class='ocrx_word' id='word_1_161' title='bbox 912 1337 1041 1362; x_wconf 79' lang='eng' dir='ltr'>(A3085795)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 514 1379 1073 1401; baseline 0.004 -6"><span class='ocrx_word' id='word_1_162' title='bbox 514 1380 536 1395; x_wconf 84' lang='eng'><strong>86</strong></span> <span class='ocrx_word' id='word_1_163' title='bbox 545 1388 638 1390; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_164' title='bbox 647 1379 788 1401; x_wconf 79' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_165' title='bbox 796 1384 867 1397; x_wconf 82' lang='eng' dir='ltr'>aureus</span> <span class='ocrx_word' id='word_1_166' title='bbox 875 1379 939 1397; x_wconf 82' lang='eng' dir='ltr'>HN4.9</span> <span class='ocrx_word' id='word_1_167' title='bbox 948 1379 1073 1401; x_wconf 85' lang='eng' dir='ltr'>(EU304246)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 553 1417 1027 1445; baseline 0 -5"><span class='ocrx_word' id='word_1_168' title='bbox 553 1430 574 1445; x_wconf 74' lang='eng'>95</span> <span class='ocrx_word' id='word_1_169' title='bbox 591 1423 669 1440; x_wconf 86' lang='eng' dir='ltr'>Bullera</span> <span class='ocrx_word' id='word_1_170' title='bbox 674 1423 771 1445; x_wconf 83' lang='eng' dir='ltr'>japonica</span> <span class='ocrx_word' id='word_1_171' title='bbox 779 1423 827 1440; x_wconf 89' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_172' title='bbox 835 1417 896 1440; x_wconf 73' lang='eng' dir='ltr'>2013T</span> <span class='ocrx_word' id='word_1_173' title='bbox 904 1423 1027 1445; x_wconf 85' lang='eng' dir='ltr'>(AF444760)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 550 1431 1043 1487; baseline 0 -5"><span class='ocrx_word' id='word_1_174' title='bbox 550 1431 584 1474; x_wconf 65' lang='eng' dir='ltr'>—l</span> <span class='ocrx_word' id='word_1_175' title='bbox 591 1465 732 1487; x_wconf 80' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_176' title='bbox 740 1469 769 1487; x_wconf 90' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_177' title='bbox 778 1465 840 1482; x_wconf 91' lang='eng' dir='ltr'>KCTC</span> <span class='ocrx_word' id='word_1_178' title='bbox 850 1465 912 1482; x_wconf 86' lang='eng'>17079</span> <span class='ocrx_word' id='word_1_179' title='bbox 921 1465 1043 1487; x_wconf 85' lang='eng' dir='ltr'>(AF459695)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 1223 136 1257 618">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 1223 136 1257 618">
+     <span class='ocr_line' id='line_1_65' title="bbox 1223 136 1257 618; textangle 90"><span class='ocrx_word' id='word_1_180' title='bbox 1230 535 1256 618; x_wconf 79' lang='eng' dir='ltr'>epep</span> <span class='ocrx_word' id='word_1_181' title='bbox 1230 359 1257 524; x_wconf 58' lang='eng' dir='ltr'>SUGOSGAQIJ</span> <span class='ocrx_word' id='word_1_182' title='bbox 1223 136 1257 347; x_wconf 55' lang='eng' dir='ltr'>snooooold/Uo</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 677 695 1115 717">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 677 695 1115 717">
+     <span class='ocr_line' id='line_1_66' title="bbox 677 695 1115 717; baseline -0.002 -4"><span class='ocrx_word' id='word_1_183' title='bbox 677 695 817 717; x_wconf 83' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_184' title='bbox 825 695 935 713; x_wconf 81' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_185' title='bbox 944 695 984 712; x_wconf 89' lang='eng' dir='ltr'>FK2</span> <span class='ocrx_word' id='word_1_186' title='bbox 993 695 1115 717; x_wconf 85' lang='eng' dir='ltr'>(EF644446)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 1186 0 1187 768">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 1186 0 1187 768">
+     <span class='ocr_line' id='line_1_67' title="bbox 1186 0 1187 768; baseline 0 1267"><span class='ocrx_word' id='word_1_187' title='bbox 1186 0 1187 768; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 680 1124 1100 1147">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 680 1124 1100 1147">
+     <span class='ocr_line' id='line_1_68' title="bbox 680 1124 1100 1147; baseline 0 -5"><span class='ocrx_word' id='word_1_188' title='bbox 680 1125 820 1147; x_wconf 78' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_189' title='bbox 828 1125 918 1142; x_wconf 76' lang='eng' dir='ltr'>Ierrestris</span> <span class='ocrx_word' id='word_1_190' title='bbox 927 1125 964 1142; x_wconf 88' lang='eng' dir='ltr'>56e</span> <span class='ocrx_word' id='word_1_191' title='bbox 973 1125 1086 1147; x_wconf 83' lang='eng' dir='ltr'>(EU340251</span> <span class='ocrx_word' id='word_1_192' title='bbox 1095 1124 1100 1146; x_wconf 88' lang='eng'>)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 728 1209 1140 1231">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 728 1209 1140 1231">
+     <span class='ocr_line' id='line_1_69' title="bbox 728 1209 1140 1231; baseline 0 -5"><span class='ocrx_word' id='word_1_193' title='bbox 728 1209 869 1231; x_wconf 81' lang='eng' dir='ltr'>Cryptococous</span> <span class='ocrx_word' id='word_1_194' title='bbox 877 1213 905 1231; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_195' title='bbox 915 1209 961 1226; x_wconf 87' lang='eng' dir='ltr'>CAB</span> <span class='ocrx_word' id='word_1_196' title='bbox 969 1209 1007 1226; x_wconf 91' lang='eng'>579</span> <span class='ocrx_word' id='word_1_197' title='bbox 1016 1209 1140 1231; x_wconf 81' lang='eng' dir='ltr'>(EU427439)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 1261 829 1295 1282">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 1261 829 1295 1282">
+     <span class='ocr_line' id='line_1_70' title="bbox 1261 829 1295 1282; textangle 90"><span class='ocrx_word' id='word_1_198' title='bbox 1269 1199 1294 1282; x_wconf 76' lang='eng' dir='ltr'>apep</span> <span class='ocrx_word' id='word_1_199' title='bbox 1269 1053 1294 1188; x_wconf 67' lang='eng'>3111891191</span> <span class='ocrx_word' id='word_1_200' title='bbox 1261 829 1295 1041; x_wconf 64' lang='eng' dir='ltr'>snoooomd/ﬂo</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 1130 1255 1156 1498">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 1130 1255 1156 1498">
+     <span class='ocr_line' id='line_1_71' title="bbox 1130 1255 1156 1498; textangle 90"><span class='ocrx_word' id='word_1_201' title='bbox 1130 1416 1156 1498; x_wconf 79' lang='eng' dir='ltr'>epep</span> <span class='ocrx_word' id='word_1_202' title='bbox 1130 1298 1149 1405; x_wconf 64' lang='eng' dir='ltr'><em>meme</em></span> <span class='ocrx_word' id='word_1_203' title='bbox 1130 1255 1156 1283; x_wconf 78' lang='eng'>&#39;3</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 520 1507 989 1534">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 520 1507 989 1534">
+     <span class='ocr_line' id='line_1_72' title="bbox 520 1507 989 1534; baseline 0 -9"><span class='ocrx_word' id='word_1_204' title='bbox 520 1519 541 1534; x_wconf 69' lang='eng'>80</span> <span class='ocrx_word' id='word_1_205' title='bbox 615 1508 752 1525; x_wconf 82' lang='eng' dir='ltr'>AuriculibuI/er</span> <span class='ocrx_word' id='word_1_206' title='bbox 758 1512 786 1529; x_wconf 84' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_207' title='bbox 796 1508 849 1525; x_wconf 90' lang='eng' dir='ltr'>B|111</span> <span class='ocrx_word' id='word_1_208' title='bbox 864 1507 989 1530; x_wconf 76' lang='eng' dir='ltr'>(EU200788)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 548 1452 550 1561">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 548 1452 550 1561">
+     <span class='ocr_line' id='line_1_73' title="bbox 548 1452 550 1561; baseline 0 474"><span class='ocrx_word' id='word_1_209' title='bbox 548 1452 550 1561; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 533 1573 555 1588">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 533 1573 555 1588">
+     <span class='ocr_line' id='line_1_74' title="bbox 533 1573 555 1588; baseline 0 0"><span class='ocrx_word' id='word_1_210' title='bbox 533 1573 555 1588; x_wconf 85' lang='eng'>53</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 571 1546 1077 1573">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 571 1546 1077 1573">
+     <span class='ocr_line' id='line_1_75' title="bbox 571 1546 1077 1573; baseline 0 -4"><span class='ocrx_word' id='word_1_211' title='bbox 571 1551 725 1569; x_wconf 84' lang='eng' dir='ltr'>Auriculibuller</span> <span class='ocrx_word' id='word_1_212' title='bbox 731 1551 805 1569; x_wconf 87' lang='eng' dir='ltr'><strong><em>fuscus</em></strong></span> <span class='ocrx_word' id='word_1_213' title='bbox 813 1551 876 1569; x_wconf 90' lang='eng' dir='ltr'>PYCC</span> <span class='ocrx_word' id='word_1_214' title='bbox 885 1546 945 1569; x_wconf 76' lang='eng' dir='ltr'>5690T</span> <span class='ocrx_word' id='word_1_215' title='bbox 954 1551 1077 1573; x_wconf 84' lang='eng' dir='ltr'>(AF444762)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 571 1593 1042 1658">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 571 1593 1042 1658">
+     <span class='ocr_line' id='line_1_76' title="bbox 571 1593 1015 1615; baseline 0 -5"><span class='ocrx_word' id='word_1_216' title='bbox 571 1593 708 1610; x_wconf 79' lang='eng' dir='ltr'>Auriculibuller</span> <span class='ocrx_word' id='word_1_217' title='bbox 713 1593 780 1610; x_wconf 84' lang='eng' dir='ltr'>fuscus</span> <span class='ocrx_word' id='word_1_218' title='bbox 794 1593 833 1610; x_wconf 93' lang='eng' dir='ltr'>ZIM</span> <span class='ocrx_word' id='word_1_219' title='bbox 841 1593 879 1610; x_wconf 84' lang='eng'>609</span> <span class='ocrx_word' id='word_1_220' title='bbox 888 1593 1015 1615; x_wconf 84' lang='eng' dir='ltr'>(AM748525)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_77' title="bbox 571 1636 1042 1658; baseline -0.002 -4"><span class='ocrx_word' id='word_1_221' title='bbox 571 1636 708 1654; x_wconf 81' lang='eng' dir='ltr'>Auriculibuller</span> <span class='ocrx_word' id='word_1_222' title='bbox 713 1636 780 1654; x_wconf 83' lang='eng' dir='ltr'>fuscus</span> <span class='ocrx_word' id='word_1_223' title='bbox 789 1636 851 1654; x_wconf 86' lang='eng' dir='ltr'>PYCC</span> <span class='ocrx_word' id='word_1_224' title='bbox 860 1636 911 1654; x_wconf 82' lang='eng'>5740</span> <span class='ocrx_word' id='word_1_225' title='bbox 920 1636 1042 1658; x_wconf 89' lang='eng' dir='ltr'>(AF444761)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 541 1615 551 1630">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 541 1615 551 1630">
+     <span class='ocr_line' id='line_1_78' title="bbox 541 1615 551 1630; baseline 0 0"><span class='ocrx_word' id='word_1_226' title='bbox 541 1615 551 1630; x_wconf 88' lang='eng'>5</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 457 1674 1165 1731">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 693 1674 1165 1701">
+     <span class='ocr_line' id='line_1_79' title="bbox 693 1674 1165 1701; baseline -0.002 -4"><span class='ocrx_word' id='word_1_227' title='bbox 693 1679 771 1697; x_wconf 81' lang='eng' dir='ltr'>Bullera</span> <span class='ocrx_word' id='word_1_228' title='bbox 778 1679 909 1701; x_wconf 85' lang='eng' dir='ltr'>pseudoalba</span> <span class='ocrx_word' id='word_1_229' title='bbox 917 1679 965 1697; x_wconf 88' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_230' title='bbox 973 1674 1034 1696; x_wconf 66' lang='eng'>72271</span> <span class='ocrx_word' id='word_1_231' title='bbox 1042 1679 1165 1701; x_wconf 84' lang='eng' dir='ltr'>(AF075504)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 646 1717 1261 1745">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 646 1717 1261 1745">
+     <span class='ocr_line' id='line_1_80' title="bbox 646 1717 1261 1745; baseline 0 -5"><span class='ocrx_word' id='word_1_232' title='bbox 646 1722 678 1737; x_wconf 88' lang='eng'>100</span> <span class='ocrx_word' id='word_1_233' title='bbox 694 1722 849 1745; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_234' title='bbox 857 1723 1005 1745; x_wconf 75' lang='eng' dir='ltr'>cellulolyticus</span> <span class='ocrx_word' id='word_1_235' title='bbox 1013 1722 1060 1740; x_wconf 89' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_236' title='bbox 1069 1717 1129 1740; x_wconf 74' lang='eng'>82941</span> <span class='ocrx_word' id='word_1_237' title='bbox 1138 1722 1261 1745; x_wconf 89' lang='eng' dir='ltr'>(AF075525)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 449 1794 515 1796">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 449 1794 515 1796">
+     <span class='ocr_line' id='line_1_81' title="bbox 449 1794 515 1796; baseline 0 239"><span class='ocrx_word' id='word_1_238' title='bbox 449 1794 515 1796; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 413 1837 450 1839">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 413 1837 450 1839">
+     <span class='ocr_line' id='line_1_82' title="bbox 413 1837 450 1839; baseline 0 196"><span class='ocrx_word' id='word_1_239' title='bbox 413 1837 450 1839; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 449 1794 451 1881">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 449 1794 451 1881">
+     <span class='ocr_line' id='line_1_83' title="bbox 449 1794 451 1881; baseline 0 154"><span class='ocrx_word' id='word_1_240' title='bbox 449 1794 451 1881; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 514 1773 516 1817">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 514 1773 516 1817">
+     <span class='ocr_line' id='line_1_84' title="bbox 514 1773 516 1817; baseline 0 218"><span class='ocrx_word' id='word_1_241' title='bbox 514 1773 516 1817; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 516 1759 1036 1829">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 516 1759 1036 1829">
+     <span class='ocr_line' id='line_1_85' title="bbox 516 1759 1036 1787; baseline 0 -5"><span class='ocrx_word' id='word_1_242' title='bbox 516 1773 531 1775; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_243' title='bbox 540 1765 695 1787; x_wconf 72' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_244' title='bbox 703 1765 794 1782; x_wconf 86' lang='eng' dir='ltr'>Iaurentii</span> <span class='ocrx_word' id='word_1_245' title='bbox 801 1765 848 1782; x_wconf 87' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_246' title='bbox 858 1759 905 1782; x_wconf 71' lang='eng' dir='ltr'>139T</span> <span class='ocrx_word' id='word_1_247' title='bbox 913 1765 1036 1787; x_wconf 83' lang='eng' dir='ltr'>(AFO75469)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_86' title="bbox 524 1807 998 1829; baseline 0 -5"><span class='ocrx_word' id='word_1_248' title='bbox 524 1807 665 1829; x_wconf 78' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_249' title='bbox 672 1807 755 1824; x_wconf 80' lang='eng' dir='ltr'>Iaurentii</span> <span class='ocrx_word' id='word_1_250' title='bbox 762 1807 808 1824; x_wconf 86' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_251' title='bbox 816 1807 867 1824; x_wconf 88' lang='eng'>7140</span> <span class='ocrx_word' id='word_1_252' title='bbox 876 1807 998 1829; x_wconf 82' lang='eng' dir='ltr'>(AY315663)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 519 1845 1038 1873">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 519 1845 1038 1873">
+     <span class='ocr_line' id='line_1_87' title="bbox 519 1845 1038 1873; baseline 0 -5"><span class='ocrx_word' id='word_1_253' title='bbox 519 1851 673 1873; x_wconf 78' lang='eng' dir='ltr'>Cryplocaccus</span> <span class='ocrx_word' id='word_1_254' title='bbox 681 1851 844 1873; x_wconf 80' lang='eng' dir='ltr'>rajaslhanensis</span> <span class='ocrx_word' id='word_1_255' title='bbox 853 1845 901 1868; x_wconf 89' lang='eng' dir='ltr'>15LT</span> <span class='ocrx_word' id='word_1_256' title='bbox 909 1851 1038 1873; x_wconf 78' lang='eng' dir='ltr'>(AM262324)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 420 1851 1010 1915">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 420 1851 1010 1915">
+     <span class='ocr_line' id='line_1_88' title="bbox 420 1851 442 1866; baseline 0 0"><span class='ocrx_word' id='word_1_257' title='bbox 420 1851 442 1866; x_wconf 84' lang='eng'>58</span> 
+     </span>
+     <span class='ocr_line' id='line_1_89' title="bbox 479 1893 1010 1915; baseline 0 -5"><span class='ocrx_word' id='word_1_258' title='bbox 479 1893 501 1909; x_wconf 85' lang='eng'>99</span> <span class='ocrx_word' id='word_1_259' title='bbox 518 1893 659 1915; x_wconf 79' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_260' title='bbox 666 1893 817 1915; x_wconf 80' lang='eng' dir='ltr'>rajasthanensis</span> <span class='ocrx_word' id='word_1_261' title='bbox 825 1893 871 1910; x_wconf 81' lang='eng' dir='ltr'>3-C1</span> <span class='ocrx_word' id='word_1_262' title='bbox 883 1893 1010 1915; x_wconf 85' lang='eng' dir='ltr'>(AM262981)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 6 1944 720 1946">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 6 1944 720 1946">
+     <span class='ocr_line' id='line_1_90' title="bbox 6 1944 720 1946; baseline 0 89"><span class='ocrx_word' id='word_1_263' title='bbox 6 1944 720 1946; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 160 2018 199 2033">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 160 2018 199 2033">
+     <span class='ocr_line' id='line_1_91' title="bbox 160 2018 199 2033; baseline 0 0"><span class='ocrx_word' id='word_1_264' title='bbox 160 2018 199 2033; x_wconf 84' lang='eng'>0.02</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 729 1931 1265 1958">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 729 1931 1265 1958">
+     <span class='ocr_line' id='line_1_92' title="bbox 729 1931 1265 1958; baseline 0 -5"><span class='ocrx_word' id='word_1_265' title='bbox 729 1936 883 1958; x_wconf 82' lang='eng' dir='ltr'>Cryptacoccus</span> <span class='ocrx_word' id='word_1_266' title='bbox 892 1940 1020 1953; x_wconf 84' lang='eng' dir='ltr'>carnescens</span> <span class='ocrx_word' id='word_1_267' title='bbox 1028 1936 1075 1953; x_wconf 88' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_268' title='bbox 1084 1931 1131 1953; x_wconf 74' lang='eng' dir='ltr'>973T</span> <span class='ocrx_word' id='word_1_269' title='bbox 1139 1936 1265 1958; x_wconf 80' lang='eng' dir='ltr'>(A3085798)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-001.pbm.png
new file mode 100644
index 00000000..0fd8b6af
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-001.pbm.png.hocr
new file mode 100644
index 00000000..f880c517
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001800-0-001.pbm.png.hocr
@@ -0,0 +1,433 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001800-0-001.pbm.png"; bbox 0 0 1207 1937; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 190 1334 219 1348">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 190 1334 219 1348">
+     <span class='ocr_line' id='line_1_1' title="bbox 190 1334 219 1348; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 190 1334 219 1348; x_wconf 83' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 429 806 449 820">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 429 806 449 820">
+     <span class='ocr_line' id='line_1_2' title="bbox 429 806 449 820; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 429 806 449 820; x_wconf 86' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 566 5 1030 67">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 566 5 1030 67">
+     <span class='ocr_line' id='line_1_3' title="bbox 566 5 958 26; baseline 0 -5"><span class='ocrx_word' id='word_1_3' title='bbox 566 5 699 26; x_wconf 80' lang='eng' dir='ltr'>Cryplococcus</span> <span class='ocrx_word' id='word_1_4' title='bbox 707 9 734 26; x_wconf 89' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_5' title='bbox 741 5 834 21; x_wconf 67' lang='eng' dir='ltr'>AA-090,4</span> <span class='ocrx_word' id='word_1_6' title='bbox 843 5 958 26; x_wconf 82' lang='eng' dir='ltr'>(AY188363)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 610 46 1030 67; baseline 0 -5"><span class='ocrx_word' id='word_1_7' title='bbox 610 46 744 67; x_wconf 83' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_8' title='bbox 752 46 856 62; x_wconf 80' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_9' title='bbox 864 46 904 62; x_wconf 79' lang='eng'><strong>660</strong></span> <span class='ocrx_word' id='word_1_10' title='bbox 913 46 1030 67; x_wconf 82' lang='eng' dir='ltr'>(ABO16234)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 526 10 605 117">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 526 10 605 117">
+     <span class='ocr_line' id='line_1_5' title="bbox 551 10 566 36; baseline 0 1901"><span class='ocrx_word' id='word_1_11' title='bbox 551 10 566 36; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 551 36 605 76; baseline 0 1861"><span class='ocrx_word' id='word_1_12' title='bbox 551 36 605 76; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 526 76 566 117; baseline 0 -1"><span class='ocrx_word' id='word_1_13' title='bbox 526 76 566 117; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 566 126 1069 554">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 566 126 1069 554">
+     <span class='ocr_line' id='line_1_8' title="bbox 566 126 1009 147; baseline 0 -4"><span class='ocrx_word' id='word_1_14' title='bbox 566 126 699 147; x_wconf 74' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_15' title='bbox 707 126 812 143; x_wconf 84' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_16' title='bbox 819 127 884 143; x_wconf 89' lang='eng' dir='ltr'>J075.4</span> <span class='ocrx_word' id='word_1_17' title='bbox 893 126 1009 147; x_wconf 83' lang='eng' dir='ltr'>(AY188361)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 566 167 1044 188; baseline 0 -4"><span class='ocrx_word' id='word_1_18' title='bbox 566 167 699 188; x_wconf 67' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_19' title='bbox 707 167 812 184; x_wconf 83' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_20' title='bbox 819 167 863 184; x_wconf 87' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_21' title='bbox 871 168 919 184; x_wconf 84' lang='eng'><strong>6474</strong></span> <span class='ocrx_word' id='word_1_22' title='bbox 928 168 1044 188; x_wconf 89' lang='eng' dir='ltr'>(EF056305)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 566 208 1044 229; baseline 0 -5"><span class='ocrx_word' id='word_1_23' title='bbox 566 208 699 229; x_wconf 75' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_24' title='bbox 707 208 812 224; x_wconf 80' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_25' title='bbox 819 208 863 224; x_wconf 85' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_26' title='bbox 871 208 919 224; x_wconf 80' lang='eng'>8359</span> <span class='ocrx_word' id='word_1_27' title='bbox 928 208 1044 229; x_wconf 84' lang='eng' dir='ltr'>(EF056302)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 566 248 915 269; baseline 0 -4"><span class='ocrx_word' id='word_1_28' title='bbox 566 248 699 269; x_wconf 79' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_29' title='bbox 706 253 734 269; x_wconf 28' lang='eng' dir='ltr'>spA</span> <span class='ocrx_word' id='word_1_30' title='bbox 744 248 793 265; x_wconf 83' lang='eng' dir='ltr'>P225</span> <span class='ocrx_word' id='word_1_31' title='bbox 802 248 915 269; x_wconf 80' lang='eng' dir='ltr'>(AJ345008)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 566 285 1067 311; baseline -0.002 -4"><span class='ocrx_word' id='word_1_32' title='bbox 566 290 712 311; x_wconf 75' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_33' title='bbox 720 290 833 307; x_wconf 82' lang='eng' dir='ltr'>flavescens</span> <span class='ocrx_word' id='word_1_34' title='bbox 841 290 887 307; x_wconf 86' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_35' title='bbox 895 285 940 307; x_wconf 82' lang='eng' dir='ltr'>942r</span> <span class='ocrx_word' id='word_1_36' title='bbox 947 290 1067 311; x_wconf 84' lang='eng' dir='ltr'>(ABD35046)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 566 330 1034 351; baseline 0 -5"><span class='ocrx_word' id='word_1_37' title='bbox 566 330 699 351; x_wconf 73' lang='eng' dir='ltr'>Clyptococcus</span> <span class='ocrx_word' id='word_1_38' title='bbox 707 330 812 346; x_wconf 77' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_39' title='bbox 820 330 848 346; x_wconf 91' lang='eng' dir='ltr'>HB</span> <span class='ocrx_word' id='word_1_40' title='bbox 858 330 903 346; x_wconf 83' lang='eng'>1178</span> <span class='ocrx_word' id='word_1_41' title='bbox 913 330 1034 351; x_wconf 79' lang='eng' dir='ltr'>(AM160631)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 566 370 1045 391; baseline 0 -4"><span class='ocrx_word' id='word_1_42' title='bbox 566 370 699 391; x_wconf 76' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_43' title='bbox 707 370 812 387; x_wconf 80' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_44' title='bbox 819 370 862 387; x_wconf 91' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_45' title='bbox 871 370 919 387; x_wconf 83' lang='eng'>9910</span> <span class='ocrx_word' id='word_1_46' title='bbox 928 370 1045 391; x_wconf 79' lang='eng' dir='ltr'>(ABOB5804)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 566 411 1069 432; baseline 0 -4"><span class='ocrx_word' id='word_1_47' title='bbox 566 411 699 432; x_wconf 74' lang='eng' dir='ltr'>Clyptococcus</span> <span class='ocrx_word' id='word_1_48' title='bbox 707 411 812 428; x_wconf 80' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_49' title='bbox 819 411 863 428; x_wconf 88' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_50' title='bbox 873 411 944 428; x_wconf 83' lang='eng'>101036</span> <span class='ocrx_word' id='word_1_51' title='bbox 952 411 1069 432; x_wconf 84' lang='eng' dir='ltr'>(EF056308)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 566 452 1044 473; baseline 0 -5"><span class='ocrx_word' id='word_1_52' title='bbox 566 452 699 473; x_wconf 74' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_53' title='bbox 707 452 812 468; x_wconf 78' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_54' title='bbox 819 452 863 468; x_wconf 89' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_55' title='bbox 871 452 919 468; x_wconf 82' lang='eng'>4919</span> <span class='ocrx_word' id='word_1_56' title='bbox 928 452 1044 473; x_wconf 83' lang='eng' dir='ltr'>(EF056303)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 566 492 1045 513; baseline 0 -5"><span class='ocrx_word' id='word_1_57' title='bbox 566 492 699 513; x_wconf 78' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_58' title='bbox 707 492 812 508; x_wconf 80' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_59' title='bbox 819 492 862 508; x_wconf 88' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_60' title='bbox 871 492 914 508; x_wconf 80' lang='eng'>9911</span> <span class='ocrx_word' id='word_1_61' title='bbox 928 492 1045 513; x_wconf 81' lang='eng' dir='ltr'>(A8085805)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 566 533 1045 554; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 566 533 699 554; x_wconf 77' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_63' title='bbox 707 533 812 549; x_wconf 80' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_64' title='bbox 819 533 862 549; x_wconf 87' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_65' title='bbox 871 533 919 549; x_wconf 82' lang='eng'>9912</span> <span class='ocrx_word' id='word_1_66' title='bbox 928 533 1045 554; x_wconf 81' lang='eng' dir='ltr'>(A8085806)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 501 573 992 594">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 501 573 992 594">
+     <span class='ocr_line' id='line_1_19' title="bbox 501 573 992 594; baseline -0.002 -4"><span class='ocrx_word' id='word_1_67' title='bbox 501 576 521 590; x_wconf 81' lang='eng'>88</span> <span class='ocrx_word' id='word_1_68' title='bbox 566 573 699 594; x_wconf 78' lang='eng' dir='ltr'>Cryplococcus</span> <span class='ocrx_word' id='word_1_69' title='bbox 707 573 811 590; x_wconf 80' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_70' title='bbox 820 573 867 590; x_wconf 83' lang='eng' dir='ltr'><strong>L146</strong></span> <span class='ocrx_word' id='word_1_71' title='bbox 875 573 992 594; x_wconf 80' lang='eng' dir='ltr'>(EF126368)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 456 597 529 599">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 456 597 529 599">
+     <span class='ocr_line' id='line_1_20' title="bbox 456 597 529 599; baseline 0 1338"><span class='ocrx_word' id='word_1_72' title='bbox 456 597 529 599; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 555 614 1045 798">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 555 614 1045 798">
+     <span class='ocr_line' id='line_1_21' title="bbox 566 614 1044 635; baseline 0 -5"><span class='ocrx_word' id='word_1_73' title='bbox 566 614 699 635; x_wconf 78' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_74' title='bbox 707 614 812 630; x_wconf 80' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_75' title='bbox 819 614 863 630; x_wconf 88' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_76' title='bbox 871 614 919 630; x_wconf 84' lang='eng'><strong>6475</strong></span> <span class='ocrx_word' id='word_1_77' title='bbox 928 614 1044 635; x_wconf 83' lang='eng' dir='ltr'>(EF056308)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 565 655 1045 676; baseline 0 -5"><span class='ocrx_word' id='word_1_78' title='bbox 565 655 708 676; x_wconf 85' lang='eng' dir='ltr'>Basidiomycete</span> <span class='ocrx_word' id='word_1_79' title='bbox 716 656 769 676; x_wconf 75' lang='eng' dir='ltr'>yeast</span> <span class='ocrx_word' id='word_1_80' title='bbox 776 659 803 676; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_81' title='bbox 813 655 914 671; x_wconf 85' lang='eng' dir='ltr'>DX-2006N</span> <span class='ocrx_word' id='word_1_82' title='bbox 924 655 1045 676; x_wconf 86' lang='eng' dir='ltr'><strong>(DQ447764)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 566 695 1045 716; baseline 0 -4"><span class='ocrx_word' id='word_1_83' title='bbox 566 695 699 716; x_wconf 67' lang='eng' dir='ltr'>Cryptoooccus</span> <span class='ocrx_word' id='word_1_84' title='bbox 707 695 812 712; x_wconf 74' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_85' title='bbox 819 695 862 712; x_wconf 90' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_86' title='bbox 871 695 919 712; x_wconf 84' lang='eng'>9909</span> <span class='ocrx_word' id='word_1_87' title='bbox 928 695 1045 716; x_wconf 81' lang='eng' dir='ltr'>(A8085803)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 555 736 903 757; baseline 0 -4"><span class='ocrx_word' id='word_1_88' title='bbox 555 736 666 753; x_wconf 83' lang='eng' dir='ltr'>Tremella/es</span> <span class='ocrx_word' id='word_1_89' title='bbox 675 741 702 757; x_wconf 88' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_90' title='bbox 712 736 778 753; x_wconf 83' lang='eng' dir='ltr'>LM339</span> <span class='ocrx_word' id='word_1_91' title='bbox 786 736 903 757; x_wconf 74' lang='eng' dir='ltr'>(EF060658)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 555 777 903 798; baseline 0 -5"><span class='ocrx_word' id='word_1_92' title='bbox 555 777 666 793; x_wconf 83' lang='eng' dir='ltr'>Tremellales</span> <span class='ocrx_word' id='word_1_93' title='bbox 675 781 702 797; x_wconf 79' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_94' title='bbox 712 777 778 793; x_wconf 84' lang='eng' dir='ltr'>LM333</span> <span class='ocrx_word' id='word_1_95' title='bbox 786 777 903 798; x_wconf 88' lang='eng' dir='ltr'>(EF060652)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 526 117 562 709">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 526 117 562 709">
+     <span class='ocr_line' id='line_1_26' title="bbox 526 117 562 709; baseline 0 1228"><span class='ocrx_word' id='word_1_96' title='bbox 526 117 562 709; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 528 359 530 837">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 528 359 530 837">
+     <span class='ocr_line' id='line_1_27' title="bbox 528 359 530 837; baseline 0 1100"><span class='ocrx_word' id='word_1_97' title='bbox 528 359 530 837; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 252 825 568 828">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 252 825 568 828">
+     <span class='ocr_line' id='line_1_28' title="bbox 252 825 568 828; baseline 0 1109"><span class='ocrx_word' id='word_1_98' title='bbox 252 825 568 828; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 224 1072 245 1087">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 224 1072 245 1087">
+     <span class='ocr_line' id='line_1_29' title="bbox 224 1072 245 1087; baseline 0.048 -1"><span class='ocrx_word' id='word_1_99' title='bbox 224 1072 245 1087; x_wconf 82' lang='eng'>46</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 225 1093 253 1095">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 225 1093 253 1095">
+     <span class='ocr_line' id='line_1_30' title="bbox 225 1093 253 1095; baseline 0 842"><span class='ocrx_word' id='word_1_100' title='bbox 225 1093 253 1095; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 252 826 254 1361">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 252 826 254 1361">
+     <span class='ocr_line' id='line_1_31' title="bbox 252 826 254 1361; baseline 0 576"><span class='ocrx_word' id='word_1_101' title='bbox 252 826 254 1361; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 5 1355 227 1357">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 5 1355 227 1357">
+     <span class='ocr_line' id='line_1_32' title="bbox 5 1355 227 1357; baseline 0 580"><span class='ocrx_word' id='word_1_102' title='bbox 5 1355 227 1357; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 5 1355 7 1746">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 5 1355 7 1746">
+     <span class='ocr_line' id='line_1_33' title="bbox 5 1355 7 1746; baseline 0 191"><span class='ocrx_word' id='word_1_103' title='bbox 5 1355 7 1746; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 252 1360 299 1361">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 252 1360 299 1361">
+     <span class='ocr_line' id='line_1_34' title="bbox 252 1360 299 1361; baseline 0 576"><span class='ocrx_word' id='word_1_104' title='bbox 252 1360 299 1361; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 270 1372 290 1387">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 270 1372 290 1387">
+     <span class='ocr_line' id='line_1_35' title="bbox 270 1372 290 1387; baseline 0 0"><span class='ocrx_word' id='word_1_105' title='bbox 270 1372 290 1387; x_wconf 87' lang='eng'>70</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 298 1313 300 1408">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 298 1313 300 1408">
+     <span class='ocr_line' id='line_1_36' title="bbox 298 1313 300 1408; baseline 0 529"><span class='ocrx_word' id='word_1_106' title='bbox 298 1313 300 1408; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 345 1419 365 1434">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 345 1419 365 1434">
+     <span class='ocr_line' id='line_1_37' title="bbox 345 1419 365 1434; baseline 0 0"><span class='ocrx_word' id='word_1_107' title='bbox 345 1419 365 1434; x_wconf 85' lang='eng'>85</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 374 1473 395 1487">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 374 1473 395 1487">
+     <span class='ocr_line' id='line_1_38' title="bbox 374 1473 395 1487; baseline 0 0"><span class='ocrx_word' id='word_1_108' title='bbox 374 1473 395 1487; x_wconf 87' lang='eng'>67</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 225 1093 227 1619">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 225 1093 227 1619">
+     <span class='ocr_line' id='line_1_39' title="bbox 225 1093 227 1619; baseline 0 318"><span class='ocrx_word' id='word_1_109' title='bbox 225 1093 227 1619; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 401 1414 403 1508">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 401 1414 403 1508">
+     <span class='ocr_line' id='line_1_40' title="bbox 401 1414 403 1508; baseline 0 429"><span class='ocrx_word' id='word_1_110' title='bbox 401 1414 403 1508; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 399 1549 408 1563">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 399 1549 408 1563">
+     <span class='ocr_line' id='line_1_41' title="bbox 399 1549 408 1563; baseline 0 0"><span class='ocrx_word' id='word_1_111' title='bbox 399 1549 408 1563; x_wconf 90' lang='eng'><strong>2</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 409 1434 479 1436">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 409 1434 479 1436">
+     <span class='ocr_line' id='line_1_42' title="bbox 409 1434 479 1436; baseline 0 127"><span class='ocrx_word' id='word_1_112' title='bbox 409 1434 479 1436; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 391 1467 870 1533">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 391 1467 870 1533">
+     <span class='ocr_line' id='line_1_43' title="bbox 428 1467 870 1488; baseline 0 -4"><span class='ocrx_word' id='word_1_113' title='bbox 428 1467 562 1488; x_wconf 78' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_114' title='bbox 569 1471 637 1484; x_wconf 84' lang='eng' dir='ltr'><em>aureus</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 644 1467 687 1484; x_wconf 88' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_116' title='bbox 696 1467 744 1484; x_wconf 80' lang='eng'>5945</span> <span class='ocrx_word' id='word_1_117' title='bbox 753 1467 870 1488; x_wconf 86' lang='eng' dir='ltr'>(AB085802)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 391 1508 870 1533; baseline 0 -9"><span class='ocrx_word' id='word_1_118' title='bbox 391 1519 411 1533; x_wconf 64' lang='eng'>58</span> <span class='ocrx_word' id='word_1_119' title='bbox 426 1508 576 1524; x_wconf 82' lang='eng' dir='ltr'><em>Aureobasidium</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 582 1508 671 1529; x_wconf 84' lang='eng' dir='ltr'><em>pullulans</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 679 1508 740 1524; x_wconf 69' lang='eng' dir='ltr'>HN2,3</span> <span class='ocrx_word' id='word_1_122' title='bbox 749 1508 870 1529; x_wconf 79' lang='eng' dir='ltr'>(DQ680843)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 456 597 458 1058">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 456 597 458 1058">
+     <span class='ocr_line' id='line_1_45' title="bbox 456 597 458 1058; baseline 0 879"><span class='ocrx_word' id='word_1_123' title='bbox 456 597 458 1058; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 454 1053 674 1283">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 454 1053 674 1283">
+     <span class='ocr_line' id='line_1_46' title="bbox 454 1053 674 1091; baseline 0 846"><span class='ocrx_word' id='word_1_124' title='bbox 454 1053 674 1091; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 454 1091 582 1173; baseline 0 0"><span class='ocrx_word' id='word_1_125' title='bbox 454 1091 582 1173; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 494 1173 582 1217; baseline 0 720"><span class='ocrx_word' id='word_1_126' title='bbox 494 1173 582 1217; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 504 1217 604 1283; baseline 0 0"><span class='ocrx_word' id='word_1_127' title='bbox 504 1217 604 1283; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 555 817 912 878">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 555 817 912 878">
+     <span class='ocr_line' id='line_1_50' title="bbox 577 817 912 838; baseline 0.003 -5"><span class='ocrx_word' id='word_1_128' title='bbox 577 817 688 834; x_wconf 82' lang='eng' dir='ltr'>Tremel/a/es</span> <span class='ocrx_word' id='word_1_129' title='bbox 697 821 725 838; x_wconf 27' lang='eng' dir='ltr'>spA</span> <span class='ocrx_word' id='word_1_130' title='bbox 735 817 788 833; x_wconf 93' lang='eng' dir='ltr'><strong>LM47</strong></span> <span class='ocrx_word' id='word_1_131' title='bbox 796 817 912 838; x_wconf 84' lang='eng' dir='ltr'>(EF060429)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 555 857 890 878; baseline 0 -4"><span class='ocrx_word' id='word_1_132' title='bbox 555 857 667 874; x_wconf 84' lang='eng' dir='ltr'>TremelIa/es</span> <span class='ocrx_word' id='word_1_133' title='bbox 675 862 702 878; x_wconf 65' lang='eng' dir='ltr'>sp,</span> <span class='ocrx_word' id='word_1_134' title='bbox 712 857 766 874; x_wconf 86' lang='eng' dir='ltr'>LM48</span> <span class='ocrx_word' id='word_1_135' title='bbox 774 857 890 878; x_wconf 84' lang='eng' dir='ltr'>(EF060430)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 528 836 546 837">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 528 836 546 837">
+     <span class='ocr_line' id='line_1_52' title="bbox 528 836 546 837; baseline 0 1100"><span class='ocrx_word' id='word_1_136' title='bbox 528 836 546 837; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 517 848 537 862">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 517 848 537 862">
+     <span class='ocr_line' id='line_1_53' title="bbox 517 848 537 862; baseline 0 0"><span class='ocrx_word' id='word_1_137' title='bbox 517 848 537 862; x_wconf 80' lang='eng'>80</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 544 745 546 908">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 544 745 546 908">
+     <span class='ocr_line' id='line_1_54' title="bbox 544 745 546 908; baseline 0 1029"><span class='ocrx_word' id='word_1_138' title='bbox 544 745 546 908; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 525 898 1123 960">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 525 898 1123 960">
+     <span class='ocr_line' id='line_1_55' title="bbox 555 898 987 920; baseline 0 -5"><span class='ocrx_word' id='word_1_139' title='bbox 555 898 688 920; x_wconf 74' lang='eng' dir='ltr'>Cryptacoccus</span> <span class='ocrx_word' id='word_1_140' title='bbox 696 898 800 915; x_wconf 81' lang='eng' dir='ltr'>f/avescens</span> <span class='ocrx_word' id='word_1_141' title='bbox 808 899 862 915; x_wconf 88' lang='eng' dir='ltr'>m155</span> <span class='ocrx_word' id='word_1_142' title='bbox 871 898 987 920; x_wconf 82' lang='eng' dir='ltr'>(EF648006)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 525 908 1123 960; baseline 0.002 -6"><span class='ocrx_word' id='word_1_143' title='bbox 525 908 682 954; x_wconf 65' lang='eng'>20‘—</span> <span class='ocrx_word' id='word_1_144' title='bbox 691 939 825 960; x_wconf 79' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_145' title='bbox 833 939 937 956; x_wconf 84' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_146' title='bbox 945 939 999 956; x_wconf 83' lang='eng' dir='ltr'>m158</span> <span class='ocrx_word' id='word_1_147' title='bbox 1008 939 1123 960; x_wconf 84' lang='eng' dir='ltr'>(EF648007)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 488 979 1028 1122">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 518 979 865 1000">
+     <span class='ocr_line' id='line_1_57' title="bbox 518 979 865 1000; baseline 0 -4"><span class='ocrx_word' id='word_1_148' title='bbox 518 980 629 996; x_wconf 75' lang='eng' dir='ltr'>TremeIIa/es</span> <span class='ocrx_word' id='word_1_149' title='bbox 638 984 665 1000; x_wconf 84' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_150' title='bbox 674 980 741 996; x_wconf 88' lang='eng' dir='ltr'>LM629</span> <span class='ocrx_word' id='word_1_151' title='bbox 749 979 865 1000; x_wconf 84' lang='eng' dir='ltr'>(EF060913)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 488 1020 1028 1122">
+     <span class='ocr_line' id='line_1_58' title="bbox 488 1020 997 1042; baseline 0 -5"><span class='ocrx_word' id='word_1_152' title='bbox 488 1028 497 1042; x_wconf 78' lang='eng'><strong>2</strong></span> <span class='ocrx_word' id='word_1_153' title='bbox 518 1020 651 1041; x_wconf 80' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_154' title='bbox 659 1020 764 1037; x_wconf 81' lang='eng' dir='ltr'>flavescens</span> <span class='ocrx_word' id='word_1_155' title='bbox 772 1020 816 1037; x_wconf 86' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_156' title='bbox 823 1020 872 1037; x_wconf 88' lang='eng'>4926</span> <span class='ocrx_word' id='word_1_157' title='bbox 880 1020 997 1041; x_wconf 80' lang='eng' dir='ltr'>(EF056304)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 680 1061 1028 1082; baseline 0 -5"><span class='ocrx_word' id='word_1_158' title='bbox 680 1061 791 1077; x_wconf 74' lang='eng' dir='ltr'>Tremella/es</span> <span class='ocrx_word' id='word_1_159' title='bbox 800 1065 827 1081; x_wconf 84' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_160' title='bbox 837 1061 900 1077; x_wconf 84' lang='eng' dir='ltr'>LM651</span> <span class='ocrx_word' id='word_1_161' title='bbox 911 1061 1028 1082; x_wconf 80' lang='eng' dir='ltr'>(EF060935)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 517 1101 922 1122; baseline 0 -5"><span class='ocrx_word' id='word_1_162' title='bbox 517 1101 651 1122; x_wconf 77' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_163' title='bbox 658 1105 685 1122; x_wconf 82' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_164' title='bbox 694 1101 739 1117; x_wconf 87' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_165' title='bbox 747 1101 794 1118; x_wconf 81' lang='eng'>8372</span> <span class='ocrx_word' id='word_1_166' title='bbox 803 1101 922 1122; x_wconf 82' lang='eng' dir='ltr'>(EU340250)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 454 985 513 1053">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 454 985 513 1053">
+     <span class='ocr_line' id='line_1_61' title="bbox 503 985 513 1009; baseline 0 928"><span class='ocrx_word' id='word_1_167' title='bbox 503 985 513 1009; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 454 1010 488 1053; baseline 0 884"><span class='ocrx_word' id='word_1_168' title='bbox 454 1010 488 1053; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 586 1224 1012 1285">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 586 1224 1012 1285">
+     <span class='ocr_line' id='line_1_63' title="bbox 586 1224 1011 1246; baseline -0.002 -4"><span class='ocrx_word' id='word_1_169' title='bbox 586 1225 719 1246; x_wconf 71' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_170' title='bbox 727 1225 813 1242; x_wconf 78' lang='eng' dir='ltr'>terrestris</span> <span class='ocrx_word' id='word_1_171' title='bbox 821 1225 881 1246; x_wconf 79' lang='eng' dir='ltr'>Ep11c</span> <span class='ocrx_word' id='word_1_172' title='bbox 891 1225 998 1246; x_wconf 83' lang='eng' dir='ltr'>(EU200781</span> <span class='ocrx_word' id='word_1_173' title='bbox 1007 1224 1011 1245; x_wconf 89' lang='eng'>)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 609 1264 1012 1285; baseline 0 -4"><span class='ocrx_word' id='word_1_174' title='bbox 609 1264 742 1285; x_wconf 77' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_175' title='bbox 750 1264 835 1281; x_wconf 83' lang='eng' dir='ltr'>terrestris</span> <span class='ocrx_word' id='word_1_176' title='bbox 849 1264 885 1281; x_wconf 74' lang='eng' dir='ltr'>56s</span> <span class='ocrx_word' id='word_1_177' title='bbox 893 1264 1012 1285; x_wconf 84' lang='eng' dir='ltr'>(EU340250)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 382 1304 914 1408">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 382 1304 914 1408">
+     <span class='ocr_line' id='line_1_65' title="bbox 423 1304 914 1325; baseline 0 -4"><span class='ocrx_word' id='word_1_178' title='bbox 423 1304 557 1325; x_wconf 80' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_179' title='bbox 564 1309 632 1321; x_wconf 85' lang='eng' dir='ltr'>aureus</span> <span class='ocrx_word' id='word_1_180' title='bbox 640 1305 698 1321; x_wconf 85' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_181' title='bbox 705 1305 789 1321; x_wconf 87' lang='eng' dir='ltr'>Y-30215</span> <span class='ocrx_word' id='word_1_182' title='bbox 798 1304 914 1325; x_wconf 83' lang='eng' dir='ltr'>(EF056299)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_66' title="bbox 398 1341 859 1367; baseline 0 -4"><span class='ocrx_word' id='word_1_183' title='bbox 398 1346 545 1367; x_wconf 81' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_184' title='bbox 553 1350 625 1363; x_wconf 81' lang='eng' dir='ltr'><strong><em>aureus</em></strong></span> <span class='ocrx_word' id='word_1_185' title='bbox 632 1346 677 1363; x_wconf 83' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_186' title='bbox 686 1341 731 1363; x_wconf 79' lang='eng' dir='ltr'>318T</span> <span class='ocrx_word' id='word_1_187' title='bbox 739 1346 859 1367; x_wconf 86' lang='eng' dir='ltr'>(AB035045)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 382 1386 805 1408; baseline 0 -6"><span class='ocrx_word' id='word_1_188' title='bbox 382 1393 402 1408; x_wconf 75' lang='eng'>70</span> <span class='ocrx_word' id='word_1_189' title='bbox 417 1386 551 1407; x_wconf 76' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_190' title='bbox 558 1390 625 1402; x_wconf 85' lang='eng' dir='ltr'><em>aureus</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 633 1386 676 1402; x_wconf 84' lang='eng' dir='ltr'>G7A</span> <span class='ocrx_word' id='word_1_192' title='bbox 684 1386 805 1407; x_wconf 89' lang='eng' dir='ltr'><strong>(DQ640764)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 489 1426 837 1447">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 489 1426 837 1447">
+     <span class='ocr_line' id='line_1_68' title="bbox 489 1426 837 1447; baseline 0.003 -5"><span class='ocrx_word' id='word_1_193' title='bbox 489 1426 600 1443; x_wconf 80' lang='eng' dir='ltr'>Treme/lales</span> <span class='ocrx_word' id='word_1_194' title='bbox 610 1430 637 1447; x_wconf 28' lang='eng' dir='ltr'>spA</span> <span class='ocrx_word' id='word_1_195' title='bbox 646 1426 712 1443; x_wconf 82' lang='eng' dir='ltr'><strong>LM613</strong></span> <span class='ocrx_word' id='word_1_196' title='bbox 721 1426 837 1447; x_wconf 81' lang='eng' dir='ltr'>(EF060898)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 1013 1324 1038 1556">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 1013 1324 1038 1556">
+     <span class='ocr_line' id='line_1_69' title="bbox 1013 1324 1038 1556; textangle 90"><span class='ocrx_word' id='word_1_197' title='bbox 1013 1478 1038 1556; x_wconf 77' lang='eng' dir='ltr'>epep</span> <span class='ocrx_word' id='word_1_198' title='bbox 1013 1366 1032 1467; x_wconf 78' lang='eng' dir='ltr'>sneme</span> <span class='ocrx_word' id='word_1_199' title='bbox 1013 1324 1038 1351; x_wconf 76' lang='eng'>&#39;9</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 474 1548 965 1569">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 474 1548 965 1569">
+     <span class='ocr_line' id='line_1_70' title="bbox 474 1548 965 1569; baseline 0 -4"><span class='ocrx_word' id='word_1_200' title='bbox 474 1548 608 1569; x_wconf 77' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_201' title='bbox 616 1553 683 1565; x_wconf 83' lang='eng' dir='ltr'><em>aureus</em></span> <span class='ocrx_word' id='word_1_202' title='bbox 691 1548 750 1565; x_wconf 86' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_203' title='bbox 756 1548 840 1565; x_wconf 81' lang='eng' dir='ltr'>Y—30213</span> <span class='ocrx_word' id='word_1_204' title='bbox 849 1548 965 1569; x_wconf 85' lang='eng' dir='ltr'>(EF056298)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 397 1589 800 1609">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 397 1589 800 1609">
+     <span class='ocr_line' id='line_1_71' title="bbox 397 1589 800 1609; baseline 0 -4"><span class='ocrx_word' id='word_1_205' title='bbox 397 1589 531 1609; x_wconf 74' lang='eng' dir='ltr'>Cryplococcus</span> <span class='ocrx_word' id='word_1_206' title='bbox 539 1593 566 1609; x_wconf 84' lang='eng' dir='ltr'>5p.</span> <span class='ocrx_word' id='word_1_207' title='bbox 575 1589 619 1605; x_wconf 88' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_208' title='bbox 627 1589 675 1605; x_wconf 83' lang='eng'><strong>8366</strong></span> <span class='ocrx_word' id='word_1_209' title='bbox 683 1589 800 1609; x_wconf 83' lang='eng' dir='ltr'>(AF444393)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 227 1598 800 1650">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 351 1630 800 1650">
+     <span class='ocr_line' id='line_1_72' title="bbox 351 1630 800 1650; baseline 0.004 -6"><span class='ocrx_word' id='word_1_210' title='bbox 351 1630 381 1645; x_wconf 86' lang='eng'>100</span> <span class='ocrx_word' id='word_1_211' title='bbox 397 1630 531 1650; x_wconf 75' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_212' title='bbox 539 1634 566 1650; x_wconf 84' lang='eng' dir='ltr'>5p.</span> <span class='ocrx_word' id='word_1_213' title='bbox 575 1630 619 1646; x_wconf 88' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_214' title='bbox 627 1630 674 1646; x_wconf 82' lang='eng'>8358</span> <span class='ocrx_word' id='word_1_215' title='bbox 683 1630 800 1650; x_wconf 81' lang='eng' dir='ltr'>(AF444387)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 566 86 1093 107">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 566 86 1093 107">
+     <span class='ocr_line' id='line_1_73' title="bbox 566 86 1093 107; baseline 0.002 -5"><span class='ocrx_word' id='word_1_216' title='bbox 566 86 699 107; x_wconf 78' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_217' title='bbox 707 86 812 103; x_wconf 76' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_218' title='bbox 820 86 878 102; x_wconf 90' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_219' title='bbox 884 86 969 103; x_wconf 89' lang='eng' dir='ltr'>Y-30216</span> <span class='ocrx_word' id='word_1_220' title='bbox 978 86 1093 107; x_wconf 85' lang='eng' dir='ltr'>(EF056300)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 1140 0 1141 966">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 1140 0 1141 966">
+     <span class='ocr_line' id='line_1_74' title="bbox 1140 0 1141 966; baseline 0 971"><span class='ocrx_word' id='word_1_221' title='bbox 1140 0 1141 966; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 585 1142 1096 1204">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 585 1142 1096 1204">
+     <span class='ocr_line' id='line_1_75' title="bbox 585 1142 1086 1163; baseline 0 -5"><span class='ocrx_word' id='word_1_222' title='bbox 585 1142 719 1163; x_wconf 79' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_223' title='bbox 727 1142 812 1158; x_wconf 81' lang='eng' dir='ltr'>terrestris</span> <span class='ocrx_word' id='word_1_224' title='bbox 820 1142 915 1158; x_wconf 89' lang='eng' dir='ltr'>C107DX4</span> <span class='ocrx_word' id='word_1_225' title='bbox 922 1142 956 1158; x_wconf 90' lang='eng' dir='ltr'>Y11</span> <span class='ocrx_word' id='word_1_226' title='bbox 968 1142 1086 1163; x_wconf 84' lang='eng' dir='ltr'>(EU4991B7)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_76' title="bbox 586 1178 1096 1204; baseline -0.002 -4"><span class='ocrx_word' id='word_1_227' title='bbox 586 1183 732 1204; x_wconf 76' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_228' title='bbox 741 1183 836 1200; x_wconf 76' lang='eng' dir='ltr'>terrestris</span> <span class='ocrx_word' id='word_1_229' title='bbox 844 1183 914 1200; x_wconf 83' lang='eng' dir='ltr'>CJDX4</span> <span class='ocrx_word' id='word_1_230' title='bbox 921 1178 970 1200; x_wconf 67' lang='eng' dir='ltr'>Y23Y</span> <span class='ocrx_word' id='word_1_231' title='bbox 978 1183 1096 1204; x_wconf 80' lang='eng' dir='ltr'>(EU200782)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 1163 255 1195 713">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 1163 255 1195 713">
+     <span class='ocr_line' id='line_1_77' title="bbox 1163 255 1195 713; textangle 90"><span class='ocrx_word' id='word_1_232' title='bbox 1170 635 1195 713; x_wconf 76' lang='eng' dir='ltr'>epelo</span> <span class='ocrx_word' id='word_1_233' title='bbox 1170 467 1195 624; x_wconf 65' lang='eng' dir='ltr'>sueoseAey</span> <span class='ocrx_word' id='word_1_234' title='bbox 1163 255 1195 456; x_wconf 70' lang='eng' dir='ltr'>SHOOOOOJd/DO</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 1150 985 1181 1414">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 1150 985 1181 1414">
+     <span class='ocr_line' id='line_1_78' title="bbox 1150 985 1181 1414; textangle 90"><span class='ocrx_word' id='word_1_235' title='bbox 1156 1337 1181 1414; x_wconf 76' lang='eng' dir='ltr'>epep</span> <span class='ocrx_word' id='word_1_236' title='bbox 1156 1197 1181 1326; x_wconf 69' lang='eng' dir='ltr'>S/JJSGJJQJ</span> <span class='ocrx_word' id='word_1_237' title='bbox 1150 985 1181 1185; x_wconf 68' lang='eng' dir='ltr'>SHOOOOOJd/UQ</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 500 1665 1164 1692">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 500 1665 1164 1692">
+     <span class='ocr_line' id='line_1_79' title="bbox 500 1665 1164 1692; baseline 0 -5"><span class='ocrx_word' id='word_1_238' title='bbox 500 1678 520 1692; x_wconf 75' lang='eng'>99</span> <span class='ocrx_word' id='word_1_239' title='bbox 529 1678 683 1680; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_240' title='bbox 692 1671 839 1691; x_wconf 81' lang='eng' dir='ltr'>Cryptacoccus</span> <span class='ocrx_word' id='word_1_241' title='bbox 847 1671 934 1687; x_wconf 78' lang='eng' dir='ltr'>Iaurenlii</span> <span class='ocrx_word' id='word_1_242' title='bbox 940 1670 986 1687; x_wconf 87' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_243' title='bbox 995 1665 1039 1687; x_wconf 74' lang='eng' dir='ltr'>139T</span> <span class='ocrx_word' id='word_1_244' title='bbox 1046 1670 1164 1691; x_wconf 84' lang='eng' dir='ltr'>(AF410468)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 196 1698 528 1700">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 196 1698 528 1700">
+     <span class='ocr_line' id='line_1_80' title="bbox 196 1698 528 1700; baseline 0 237"><span class='ocrx_word' id='word_1_245' title='bbox 196 1698 528 1700; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 5 1744 198 1746">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 5 1744 198 1746">
+     <span class='ocr_line' id='line_1_81' title="bbox 5 1744 198 1746; baseline 0 191"><span class='ocrx_word' id='word_1_246' title='bbox 5 1744 198 1746; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 112 1915 146 1929">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 112 1915 146 1929">
+     <span class='ocr_line' id='line_1_82' title="bbox 112 1915 146 1929; baseline 0 0"><span class='ocrx_word' id='word_1_247' title='bbox 112 1915 146 1929; x_wconf 88' lang='eng'>0.01</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 196 1698 198 1791">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 196 1698 198 1791">
+     <span class='ocr_line' id='line_1_83' title="bbox 196 1698 198 1791; baseline 0 146"><span class='ocrx_word' id='word_1_248' title='bbox 196 1698 198 1791; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 196 1789 257 1791">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 196 1789 257 1791">
+     <span class='ocr_line' id='line_1_84' title="bbox 196 1789 257 1791; baseline 0 146"><span class='ocrx_word' id='word_1_249' title='bbox 196 1789 257 1791; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 256 1759 258 1822">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 256 1759 258 1822">
+     <span class='ocr_line' id='line_1_85' title="bbox 256 1759 258 1822; baseline 0 115"><span class='ocrx_word' id='word_1_250' title='bbox 256 1759 258 1822; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 527 1678 529 1720">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 527 1678 529 1720">
+     <span class='ocr_line' id='line_1_86' title="bbox 527 1678 529 1720; baseline 0 217"><span class='ocrx_word' id='word_1_251' title='bbox 527 1678 529 1720; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 529 1718 603 1720">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 529 1718 603 1720">
+     <span class='ocr_line' id='line_1_87' title="bbox 529 1718 603 1720; baseline 0 217"><span class='ocrx_word' id='word_1_252' title='bbox 529 1718 603 1720; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 380 1706 1112 1773">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 380 1706 1112 1773">
+     <span class='ocr_line' id='line_1_88' title="bbox 612 1706 1112 1733; baseline 0 -5"><span class='ocrx_word' id='word_1_253' title='bbox 612 1711 759 1733; x_wconf 62' lang='eng' dir='ltr'>Culptocaccus</span> <span class='ocrx_word' id='word_1_254' title='bbox 772 1712 928 1733; x_wconf 85' lang='eng' dir='ltr'>rajasthanensis</span> <span class='ocrx_word' id='word_1_255' title='bbox 936 1706 982 1728; x_wconf 89' lang='eng' dir='ltr'>15LT</span> <span class='ocrx_word' id='word_1_256' title='bbox 990 1711 1112 1733; x_wconf 84' lang='eng' dir='ltr'>(AM262325)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_89' title="bbox 380 1747 958 1773; baseline 0 -5"><span class='ocrx_word' id='word_1_257' title='bbox 380 1752 527 1773; x_wconf 84' lang='eng' dir='ltr'>Cryptococcus</span> <span class='ocrx_word' id='word_1_258' title='bbox 535 1752 699 1768; x_wconf 85' lang='eng' dir='ltr'>anemochoreius</span> <span class='ocrx_word' id='word_1_259' title='bbox 707 1752 752 1768; x_wconf 87' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_260' title='bbox 761 1747 830 1768; x_wconf 81' lang='eng' dir='ltr'>10258T</span> <span class='ocrx_word' id='word_1_261' title='bbox 838 1752 958 1773; x_wconf 80' lang='eng' dir='ltr'>(DQS30986)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_58' title="bbox 228 1787 1061 1854">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 228 1787 1061 1854">
+     <span class='ocr_line' id='line_1_90' title="bbox 228 1787 970 1817; baseline 0 -8"><span class='ocrx_word' id='word_1_262' title='bbox 228 1803 249 1817; x_wconf 67' lang='eng'>64</span> <span class='ocrx_word' id='word_1_263' title='bbox 521 1792 595 1809; x_wconf 85' lang='eng' dir='ltr'>Bullera</span> <span class='ocrx_word' id='word_1_264' title='bbox 602 1792 726 1813; x_wconf 83' lang='eng' dir='ltr'>pseudaalba</span> <span class='ocrx_word' id='word_1_265' title='bbox 734 1792 779 1809; x_wconf 89' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_266' title='bbox 787 1787 845 1809; x_wconf 62' lang='eng'><strong>7227&#39;</strong></span> <span class='ocrx_word' id='word_1_267' title='bbox 852 1792 970 1814; x_wconf 76' lang='eng' dir='ltr'>(AF444399)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_91' title="bbox 476 1828 1061 1854; baseline -0.002 -4"><span class='ocrx_word' id='word_1_268' title='bbox 476 1833 506 1847; x_wconf 86' lang='eng'>100</span> <span class='ocrx_word' id='word_1_269' title='bbox 522 1833 669 1854; x_wconf 79' lang='eng' dir='ltr'>Cryptoooccus</span> <span class='ocrx_word' id='word_1_270' title='bbox 677 1833 817 1854; x_wconf 80' lang='eng' dir='ltr'>cellulolyticus</span> <span class='ocrx_word' id='word_1_271' title='bbox 825 1833 870 1850; x_wconf 88' lang='eng' dir='ltr'>CBS</span> <span class='ocrx_word' id='word_1_272' title='bbox 878 1828 935 1850; x_wconf 66' lang='eng' dir='ltr'>8294Y</span> <span class='ocrx_word' id='word_1_273' title='bbox 943 1833 1061 1854; x_wconf 87' lang='eng' dir='ltr'><strong>(AF444442)</strong></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001826-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001826-0-000.pbm.png
new file mode 100644
index 00000000..cab94811
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001826-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001826-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001826-0-000.pbm.png.hocr
new file mode 100644
index 00000000..70ab8169
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001826-0-000.pbm.png.hocr
@@ -0,0 +1,124 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001826-0-000.pbm.png"; bbox 0 0 1243 644; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 43 60 90 101">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 43 60 90 101">
+     <span class='ocr_line' id='line_1_1' title="bbox 43 60 90 101; textangle 90"><span class='ocrx_word' id='word_1_1' title='bbox 59 99 61 101; x_wconf 82' lang='eng'>&#39;</span> <span class='ocrx_word' id='word_1_2' title='bbox 43 60 90 79; x_wconf 70' lang='eng' dir='ltr'>I</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 110 0 1243 400">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 110 0 1243 318">
+     <span class='ocr_line' id='line_1_2' title="bbox 339 0 1147 34; baseline 0 -7"><span class='ocrx_word' id='word_1_3' title='bbox 339 7 362 23; x_wconf 83' lang='eng'>95</span> <span class='ocrx_word' id='word_1_4' title='bbox 457 3 676 27; x_wconf 80' lang='eng' dir='ltr'><em>Aestuariibacter</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 684 3 836 34; x_wconf 85' lang='eng' dir='ltr'><em>saleXigens</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 846 0 969 27; x_wconf 80' lang='eng' dir='ltr'><em>J02042T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 977 3 1147 33; x_wconf 90' lang='eng' dir='ltr'>(AY207502)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 441 41 1123 74; baseline 0 -6"><span class='ocrx_word' id='word_1_8' title='bbox 441 44 660 68; x_wconf 78' lang='eng' dir='ltr'><em>Aestuariibacter</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 667 44 812 74; x_wconf 85' lang='eng' dir='ltr'><em>halophilus</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 822 41 946 68; x_wconf 78' lang='eng' dir='ltr'><em>JCZO43T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 954 44 1123 74; x_wconf 86' lang='eng' dir='ltr'>(AY207503)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 473 81 1090 115; baseline 0 -7"><span class='ocrx_word' id='word_1_12' title='bbox 473 84 621 108; x_wconf 86' lang='eng' dir='ltr'><em>Glaciecola</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 631 85 726 115; x_wconf 88' lang='eng' dir='ltr'><em>polaris</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 738 84 804 108; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 815 81 1090 115; x_wconf 77' lang='eng' dir='ltr'>21857T(AJ293820)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 512 122 1101 155; baseline 0 -6"><span class='ocrx_word' id='word_1_16' title='bbox 512 125 660 149; x_wconf 87' lang='eng' dir='ltr'><em>GIacieco/a</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 669 125 782 155; x_wconf 87' lang='eng' dir='ltr'><em>punicea</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 792 125 884 149; x_wconf 92' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 896 122 1101 155; x_wconf 75' lang='eng' dir='ltr'><em>611T(U85853)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 502 163 1243 196; baseline 0.001 -7"><span class='ocrx_word' id='word_1_20' title='bbox 502 166 676 190; x_wconf 87' lang='eng' dir='ltr'><em>Salinimonas</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 687 166 891 196; x_wconf 87' lang='eng' dir='ltr'><em>chungwhensis</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 903 163 1066 190; x_wconf 82' lang='eng' dir='ltr'><em>BHO30046T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 1074 166 1243 196; x_wconf 85' lang='eng' dir='ltr'>(AY553295)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 435 203 1062 236; baseline 0 -6"><span class='ocrx_word' id='word_1_24' title='bbox 435 206 617 230; x_wconf 83' lang='eng' dir='ltr'><em>Alteromonas</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 628 206 714 230; x_wconf 81' lang='eng' dir='ltr'><em>addita</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 726 206 759 230; x_wconf 90' lang='eng' dir='ltr'>R1</span> <span class='ocrx_word' id='word_1_27' title='bbox 766 206 848 230; x_wconf 86' lang='eng' dir='ltr'><em>OSW1</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 855 203 884 230; x_wconf 75' lang='eng' dir='ltr'><em>3T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 892 206 1062 236; x_wconf 86' lang='eng' dir='ltr'>(AY682202)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 353 244 1083 277; baseline -0.001 -6"><span class='ocrx_word' id='word_1_30' title='bbox 353 248 386 264; x_wconf 77' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 438 247 620 271; x_wconf 85' lang='eng' dir='ltr'><em>Alteromonas</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 630 247 767 271; x_wconf 83' lang='eng' dir='ltr'><em>mac/eodii</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 778 247 831 270; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 846 244 945 271; x_wconf 78' lang='eng' dir='ltr'><em>12920T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 953 247 1083 277; x_wconf 90' lang='eng' dir='ltr'>(X82145)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 110 284 1040 318; baseline 0 -6"><span class='ocrx_word' id='word_1_36' title='bbox 110 292 132 308; x_wconf 82' lang='eng'><em>89</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 384 288 589 315; x_wconf 67' lang='eng' dir='ltr'><em>I—Bowmane/Ia</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 600 287 772 312; x_wconf 85' lang='eng' dir='ltr'><em>denitriﬁcans</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 783 284 857 312; x_wconf 93' lang='eng' dir='ltr'><em>BD1T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 866 287 1040 318; x_wconf 84' lang='eng' dir='ltr'>(DQ343294)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 342 317 1030 359">
+     <span class='ocr_line' id='line_1_10' title="bbox 342 317 1030 359; baseline 0 -7"><span class='ocrx_word' id='word_1_41' title='bbox 342 330 375 346; x_wconf 79' lang='eng'>100</span> <span class='ocrx_word' id='word_1_42' title='bbox 384 317 598 352; x_wconf 61' lang='eng' dir='ltr'><em>LBowmaneIIa</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 607 328 728 359; x_wconf 88' lang='eng' dir='ltr'><em>pacifica</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 738 325 852 352; x_wconf 91' lang='eng' dir='ltr'><em>W3-3AT</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 860 329 1030 359; x_wconf 91' lang='eng' dir='ltr'><em>(EU440951)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 332 366 914 400">
+     <span class='ocr_line' id='line_1_11' title="bbox 332 366 914 400; baseline 0 -7"><span class='ocrx_word' id='word_1_46' title='bbox 332 369 505 400; x_wconf 86' lang='eng' dir='ltr'><em>Agarivorans</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 516 369 592 393; x_wconf 87' lang='eng' dir='ltr'><em>albus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 603 366 737 393; x_wconf 89' lang='eng' dir='ltr'><em>MKT106T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 745 369 914 399; x_wconf 82' lang='eng' dir='ltr'><em>(A8076561)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 271 10 510 260">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 271 10 510 260">
+     <span class='ocr_line' id='line_1_12' title="bbox 293 10 457 51; baseline 0 -26"><span class='ocrx_word' id='word_1_50' title='bbox 293 10 457 51; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 293 51 441 90; baseline 0 554"><span class='ocrx_word' id='word_1_51' title='bbox 293 51 441 90; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 271 90 510 147; baseline 0 -15"><span class='ocrx_word' id='word_1_52' title='bbox 271 90 510 147; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 293 147 500 187; baseline 0 457"><span class='ocrx_word' id='word_1_53' title='bbox 293 147 500 187; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 293 187 435 260; baseline 0 -20"><span class='ocrx_word' id='word_1_54' title='bbox 293 187 435 240; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_55' title='bbox 391 240 433 260; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 274 48 296 63">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 274 48 296 63">
+     <span class='ocr_line' id='line_1_17' title="bbox 274 48 296 63; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 274 48 296 63; x_wconf 83' lang='eng'><em>55</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 266 113 285 129">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 266 113 285 129">
+     <span class='ocr_line' id='line_1_18' title="bbox 266 113 285 129; baseline 0 0"><span class='ocrx_word' id='word_1_57' title='bbox 266 113 285 129; x_wconf 86' lang='eng'><em>71</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 227 202 260 218">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 227 202 260 218">
+     <span class='ocr_line' id='line_1_19' title="bbox 227 202 260 218; baseline 0 0"><span class='ocrx_word' id='word_1_58' title='bbox 227 202 260 218; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 269 137 271 317">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 269 137 271 317">
+     <span class='ocr_line' id='line_1_20' title="bbox 269 137 271 317; baseline 0 327"><span class='ocrx_word' id='word_1_59' title='bbox 269 137 271 317; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 105 315 386 318">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 105 315 386 318">
+     <span class='ocr_line' id='line_1_21' title="bbox 105 315 386 318; baseline 0 326"><span class='ocrx_word' id='word_1_60' title='bbox 105 315 386 318; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 105 316 107 530">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 105 316 107 530">
+     <span class='ocr_line' id='line_1_22' title="bbox 105 316 107 530; baseline 0 114"><span class='ocrx_word' id='word_1_61' title='bbox 105 316 107 530; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 91 407 1173 589">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 91 407 1173 589">
+     <span class='ocr_line' id='line_1_23' title="bbox 120 407 1173 440; baseline 0.001 -7"><span class='ocrx_word' id='word_1_62' title='bbox 120 421 143 437; x_wconf 67' lang='eng'>55</span> <span class='ocrx_word' id='word_1_63' title='bbox 412 410 538 434; x_wconf 81' lang='eng' dir='ltr'><em>Colwellia</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 548 410 797 440; x_wconf 84' lang='eng' dir='ltr'><em>psychroerythraea</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 807 410 899 434; x_wconf 90' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 912 407 1173 440; x_wconf 76' lang='eng' dir='ltr'><em>55OTT(AF001375)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 236 447 1092 480; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 236 451 269 467; x_wconf 78' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 382 451 607 474; x_wconf 88' lang='eng' dir='ltr'><em>Thalassomonas</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 619 450 728 474; x_wconf 89' lang='eng' dir='ltr'><em>viridans</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 739 450 825 474; x_wconf 91' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 837 447 920 474; x_wconf 90' lang='eng' dir='ltr'><em>5083T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 928 450 1092 480; x_wconf 83' lang='eng' dir='ltr'>(AJ294748)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 334 488 1078 521; baseline -0.001 -6"><span class='ocrx_word' id='word_1_73' title='bbox 334 491 531 515; x_wconf 85' lang='eng' dir='ltr'><em>Oceanimonas</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 542 491 693 515; x_wconf 86' lang='eng' dir='ltr'><em>doudoroffii</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 701 491 787 515; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 799 488 902 515; x_wconf 79' lang='eng' dir='ltr'><em>27123T</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 910 491 1078 521; x_wconf 81' lang='eng' dir='ltr'>(ABO19390)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 91 498 990 581; baseline 0 -26"><span class='ocrx_word' id='word_1_78' title='bbox 91 498 537 581; x_wconf 67' lang='eng' dir='ltr'><em>5EFerrimonas</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 547 532 677 555; x_wconf 88' lang='eng' dir='ltr'><em>balearica</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 689 531 757 555; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 770 528 853 555; x_wconf 78' lang='eng' dir='ltr'><em>9799T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 861 532 990 562; x_wconf 89' lang='eng' dir='ltr'><em>(X93021)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 132 573 154 589; baseline 0 0"><span class='ocrx_word' id='word_1_83' title='bbox 132 573 154 589; x_wconf 84' lang='eng'>93</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 244 569 1054 644">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 244 569 1054 644">
+     <span class='ocr_line' id='line_1_28' title="bbox 374 569 1054 603; baseline 0 -7"><span class='ocrx_word' id='word_1_84' title='bbox 374 572 538 596; x_wconf 86' lang='eng' dir='ltr'><em>Shewane/la</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 549 572 725 603; x_wconf 80' lang='eng' dir='ltr'><em>putrefaciens</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 734 572 821 596; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 834 569 917 596; x_wconf 80' lang='eng' dir='ltr'><em>8071T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 925 572 1054 603; x_wconf 83' lang='eng' dir='ltr'>(X82133)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 244 610 814 644; baseline 0 -7"><span class='ocrx_word' id='word_1_89' title='bbox 244 613 409 637; x_wconf 85' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 421 613 470 637; x_wconf 89' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 477 613 563 637; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 578 613 586 637; x_wconf 94' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 596 610 678 637; x_wconf 92' lang='eng' dir='ltr'><em>1775T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 686 613 814 644; x_wconf 89' lang='eng' dir='ltr'>(X80725)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001909-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001909-0-000.pbm.png
new file mode 100644
index 00000000..495607a1
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001909-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001909-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001909-0-000.pbm.png.hocr
new file mode 100644
index 00000000..6c953d0a
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001909-0-000.pbm.png.hocr
@@ -0,0 +1,178 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001909-0-000.pbm.png"; bbox 0 0 1539 1154; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 202 53 249 69">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 202 53 249 69">
+     <span class='ocr_line' id='line_1_1' title="bbox 202 53 249 69; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 202 53 249 69; x_wconf 85' lang='eng'>64.8</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 2 174 41 206">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 2 174 41 206">
+     <span class='ocr_line' id='line_1_2' title="bbox 2 174 38 200; textangle 90"><span class='ocrx_word' id='word_1_2' title='bbox 21 189 29 200; x_wconf 67' lang='eng' dir='ltr'>o</span> <span class='ocrx_word' id='word_1_3' title='bbox 2 174 38 178; x_wconf 86' lang='eng' dir='ltr'><strong>I</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 26 189 41 206; textangle 90"><span class='ocrx_word' id='word_1_4' title='bbox 26 189 41 206; x_wconf 73' lang='eng' dir='ltr'>o\</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 210 221 240 237">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 210 221 240 237">
+     <span class='ocr_line' id='line_1_4' title="bbox 210 221 240 237; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 210 221 240 237; x_wconf 84' lang='eng'>72.</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 263 295 309 312">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 263 295 309 312">
+     <span class='ocr_line' id='line_1_5' title="bbox 263 295 309 312; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 263 295 309 312; x_wconf 89' lang='eng'>84.6</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 137 383 249 432">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 137 383 249 432">
+     <span class='ocr_line' id='line_1_6' title="bbox 202 383 249 399; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 202 383 249 399; x_wconf 85' lang='eng'>85.8</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 137 415 184 432; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 137 415 184 432; x_wconf 87' lang='eng'>51.8</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 76 592 261 618">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 76 592 261 618">
+     <span class='ocr_line' id='line_1_8' title="bbox 76 592 261 618; baseline 0 -9"><span class='ocrx_word' id='word_1_9' title='bbox 76 592 122 609; x_wconf 82' lang='eng'>95.6</span> <span class='ocrx_word' id='word_1_10' title='bbox 215 601 261 618; x_wconf 42' lang='eng'>99.9</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 8 778 53 794">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 8 778 53 794">
+     <span class='ocr_line' id='line_1_9' title="bbox 8 778 53 794; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 8 778 53 794; x_wconf 87' lang='eng'>74.9</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 132 808 176 824">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 132 808 176 824">
+     <span class='ocr_line' id='line_1_10' title="bbox 132 808 176 824; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 132 808 176 824; x_wconf 89' lang='eng'>71.7</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 235 909 293 926">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 235 909 293 926">
+     <span class='ocr_line' id='line_1_11' title="bbox 235 909 293 926; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 235 909 293 926; x_wconf 88' lang='eng'>100.0</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 145 964 190 980">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 145 964 190 980">
+     <span class='ocr_line' id='line_1_12' title="bbox 145 964 190 980; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 145 964 190 980; x_wconf 83' lang='eng'>99.6</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 303 1081 362 1098">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 303 1081 362 1098">
+     <span class='ocr_line' id='line_1_13' title="bbox 303 1081 362 1098; baseline 0 0"><span class='ocrx_word' id='word_1_15' title='bbox 303 1081 362 1098; x_wconf 88' lang='eng'>100.0</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 385 4 1201 36">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 385 4 1201 36">
+     <span class='ocr_line' id='line_1_14' title="bbox 385 4 1201 36; baseline 0.001 -8"><span class='ocrx_word' id='word_1_16' title='bbox 385 10 444 26; x_wconf 88' lang='eng'>100.0</span> <span class='ocrx_word' id='word_1_17' title='bbox 540 7 746 36; x_wconf 85' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_18' title='bbox 755 7 825 36; x_wconf 84' lang='eng' dir='ltr'>gu/ae</span> <span class='ocrx_word' id='word_1_19' title='bbox 835 7 918 29; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_20' title='bbox 929 8 956 29; x_wconf 93' lang='eng'>51</span> <span class='ocrx_word' id='word_1_21' title='bbox 966 5 1028 29; x_wconf 91' lang='eng' dir='ltr'>700T</span> <span class='ocrx_word' id='word_1_22' title='bbox 1039 4 1201 33; x_wconf 85' lang='eng' dir='ltr'>(AF208290)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 457 47 1536 1149">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 457 47 1536 1149">
+     <span class='ocr_line' id='line_1_15' title="bbox 558 47 1231 79; baseline 0 -7"><span class='ocrx_word' id='word_1_23' title='bbox 558 50 763 79; x_wconf 80' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_24' title='bbox 773 50 894 79; x_wconf 85' lang='eng' dir='ltr'>gingiva/is</span> <span class='ocrx_word' id='word_1_25' title='bbox 903 50 986 72; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_26' title='bbox 996 47 1096 72; x_wconf 83' lang='eng' dir='ltr'>33277T</span> <span class='ocrx_word' id='word_1_27' title='bbox 1107 47 1142 76; x_wconf 94' lang='eng' dir='ltr'>(L1</span> <span class='ocrx_word' id='word_1_28' title='bbox 1151 47 1231 76; x_wconf 84' lang='eng'>6492)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 593 90 1358 121; baseline 0.001 -7"><span class='ocrx_word' id='word_1_29' title='bbox 593 92 798 121; x_wconf 84' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_30' title='bbox 809 92 972 115; x_wconf 80' lang='eng' dir='ltr'>crevioricanis</span> <span class='ocrx_word' id='word_1_31' title='bbox 982 92 1064 115; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_32' title='bbox 1075 90 1175 115; x_wconf 87' lang='eng' dir='ltr'>55563T</span> <span class='ocrx_word' id='word_1_33' title='bbox 1185 90 1358 119; x_wconf 80' lang='eng' dir='ltr'>(D0677836)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 596 133 1216 164; baseline 0.002 -7"><span class='ocrx_word' id='word_1_34' title='bbox 596 135 802 164; x_wconf 87' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_35' title='bbox 812 135 985 158; x_wconf 84' lang='eng' dir='ltr'>cansu/ciVPB</span> <span class='ocrx_word' id='word_1_36' title='bbox 997 133 1078 158; x_wconf 79' lang='eng' dir='ltr'>4875T</span> <span class='ocrx_word' id='word_1_37' title='bbox 1089 133 1216 162; x_wconf 87' lang='eng' dir='ltr'>(X76260)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 561 176 1226 207; baseline 0 -7"><span class='ocrx_word' id='word_1_38' title='bbox 561 178 766 207; x_wconf 87' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_39' title='bbox 777 178 886 200; x_wconf 84' lang='eng' dir='ltr'>catoniae</span> <span class='ocrx_word' id='word_1_40' title='bbox 895 178 978 200; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_41' title='bbox 988 179 1015 200; x_wconf 87' lang='eng'>51</span> <span class='ocrx_word' id='word_1_42' title='bbox 1025 176 1088 200; x_wconf 93' lang='eng' dir='ltr'>270T</span> <span class='ocrx_word' id='word_1_43' title='bbox 1099 176 1226 205; x_wconf 89' lang='eng' dir='ltr'>(X82823)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 582 218 1251 250; baseline 0 -7"><span class='ocrx_word' id='word_1_44' title='bbox 582 221 787 250; x_wconf 84' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_45' title='bbox 797 228 914 243; x_wconf 79' lang='eng' dir='ltr'>macacae</span> <span class='ocrx_word' id='word_1_46' title='bbox 923 220 1005 243; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_47' title='bbox 1016 221 1061 243; x_wconf 88' lang='eng'>331</span> <span class='ocrx_word' id='word_1_48' title='bbox 1071 222 1098 243; x_wconf 90' lang='eng'>41</span> <span class='ocrx_word' id='word_1_49' title='bbox 1106 218 1116 233; x_wconf 77' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_50' title='bbox 1127 218 1251 247; x_wconf 85' lang='eng' dir='ltr'>(L16494)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 599 261 1356 292; baseline 0.001 -7"><span class='ocrx_word' id='word_1_51' title='bbox 599 264 805 292; x_wconf 88' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_52' title='bbox 815 271 926 286; x_wconf 84' lang='eng' dir='ltr'>somerae</span> <span class='ocrx_word' id='word_1_53' title='bbox 936 263 1018 286; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_54' title='bbox 1029 264 1111 285; x_wconf 90' lang='eng' dir='ltr'>BAA-1</span> <span class='ocrx_word' id='word_1_55' title='bbox 1121 261 1183 286; x_wconf 90' lang='eng' dir='ltr'>230T</span> <span class='ocrx_word' id='word_1_56' title='bbox 1191 261 1356 290; x_wconf 84' lang='eng' dir='ltr'>(AY968205)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 599 304 1201 336; baseline 0 -7"><span class='ocrx_word' id='word_1_57' title='bbox 599 307 804 336; x_wconf 84' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_58' title='bbox 815 307 866 329; x_wconf 81' lang='eng' dir='ltr'>leI/I&#39;i</span> <span class='ocrx_word' id='word_1_59' title='bbox 874 307 956 329; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_60' title='bbox 968 304 1066 329; x_wconf 89' lang='eng' dir='ltr'>29147T</span> <span class='ocrx_word' id='word_1_61' title='bbox 1077 304 1201 334; x_wconf 84' lang='eng' dir='ltr'>(L16493)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 730 347 1480 378; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 730 350 968 378; x_wconf 88' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_63' title='bbox 977 350 1115 372; x_wconf 91' lang='eng' dir='ltr'>bennonis</span> <span class='ocrx_word' id='word_1_64' title='bbox 1125 350 1193 372; x_wconf 95' lang='eng' dir='ltr'>WAL</span> <span class='ocrx_word' id='word_1_65' title='bbox 1204 348 1304 372; x_wconf 76' lang='eng' dir='ltr'>19266T</span> <span class='ocrx_word' id='word_1_66' title='bbox 1315 347 1480 377; x_wconf 91' lang='eng' dir='ltr'>(EU414673)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 523 390 1203 422; baseline 0 -7"><span class='ocrx_word' id='word_1_67' title='bbox 523 393 728 422; x_wconf 84' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_68' title='bbox 739 393 906 421; x_wconf 73' lang='eng' dir='ltr'>cangingiva/fs</span> <span class='ocrx_word' id='word_1_69' title='bbox 915 393 972 415; x_wconf 90' lang='eng' dir='ltr'>VPB</span> <span class='ocrx_word' id='word_1_70' title='bbox 984 390 1066 415; x_wconf 90' lang='eng' dir='ltr'>4874T</span> <span class='ocrx_word' id='word_1_71' title='bbox 1076 390 1203 419; x_wconf 90' lang='eng' dir='ltr'>(X76259)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 570 432 1164 464; baseline 0 -7"><span class='ocrx_word' id='word_1_72' title='bbox 570 435 775 464; x_wconf 83' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_73' title='bbox 785 435 879 457; x_wconf 87' lang='eng' dir='ltr'>canoris</span> <span class='ocrx_word' id='word_1_74' title='bbox 888 435 945 457; x_wconf 92' lang='eng' dir='ltr'>VPB</span> <span class='ocrx_word' id='word_1_75' title='bbox 957 436 1025 457; x_wconf 91' lang='eng'>4882</span> <span class='ocrx_word' id='word_1_76' title='bbox 1038 432 1164 462; x_wconf 86' lang='eng' dir='ltr'>(X76261)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 544 475 1282 507; baseline 0.003 -9"><span class='ocrx_word' id='word_1_77' title='bbox 544 481 603 498; x_wconf 88' lang='eng'>100.0</span> <span class='ocrx_word' id='word_1_78' title='bbox 640 478 853 507; x_wconf 77' lang='eng' dir='ltr'>‘Porphyromonas</span> <span class='ocrx_word' id='word_1_79' title='bbox 863 478 936 500; x_wconf 79' lang='eng' dir='ltr'>can/3’</span> <span class='ocrx_word' id='word_1_80' title='bbox 947 478 1005 500; x_wconf 93' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_81' title='bbox 1019 479 1104 500; x_wconf 90' lang='eng'>10100</span> <span class='ocrx_word' id='word_1_82' title='bbox 1116 475 1282 505; x_wconf 79' lang='eng' dir='ltr'>(ABOS4799)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 477 512 1389 550; baseline 0 -7"><span class='ocrx_word' id='word_1_83' title='bbox 477 512 536 529; x_wconf 59' lang='eng'>100&#39;0</span> <span class='ocrx_word' id='word_1_84' title='bbox 634 521 840 550; x_wconf 86' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_85' title='bbox 849 521 1002 549; x_wconf 82' lang='eng' dir='ltr'>gingivicanis</span> <span class='ocrx_word' id='word_1_86' title='bbox 1012 521 1094 543; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_87' title='bbox 1105 518 1205 543; x_wconf 90' lang='eng' dir='ltr'>55562T</span> <span class='ocrx_word' id='word_1_88' title='bbox 1215 519 1389 548; x_wconf 81' lang='eng' dir='ltr'>(D0677835)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 623 561 1370 593; baseline 0 -7"><span class='ocrx_word' id='word_1_89' title='bbox 623 564 828 593; x_wconf 81' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_90' title='bbox 839 564 1031 586; x_wconf 73' lang='eng' dir='ltr'>circumdentaria</span> <span class='ocrx_word' id='word_1_91' title='bbox 1043 563 1126 586; x_wconf 91' lang='eng' dir='ltr'>NCTC</span> <span class='ocrx_word' id='word_1_92' title='bbox 1139 565 1146 586; x_wconf 93' lang='eng'>1</span> <span class='ocrx_word' id='word_1_93' title='bbox 1156 561 1236 586; x_wconf 80' lang='eng' dir='ltr'>2469T</span> <span class='ocrx_word' id='word_1_94' title='bbox 1246 561 1370 591; x_wconf 86' lang='eng' dir='ltr'>(L26102)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 599 604 1361 636; baseline 0 -7"><span class='ocrx_word' id='word_1_95' title='bbox 599 607 805 636; x_wconf 85' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_96' title='bbox 815 607 982 629; x_wconf 74' lang='eng' dir='ltr'>endodonta/r&#39;s</span> <span class='ocrx_word' id='word_1_97' title='bbox 992 607 1074 629; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_98' title='bbox 1085 604 1185 629; x_wconf 73' lang='eng' dir='ltr'>35406T</span> <span class='ocrx_word' id='word_1_99' title='bbox 1195 604 1361 633; x_wconf 88' lang='eng' dir='ltr'>(AY253728)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 592 647 1464 678; baseline 0.002 -9"><span class='ocrx_word' id='word_1_100' title='bbox 592 653 650 669; x_wconf 86' lang='eng'>100.0</span> <span class='ocrx_word' id='word_1_101' title='bbox 732 650 937 678; x_wconf 83' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_102' title='bbox 948 650 1049 672; x_wconf 85' lang='eng' dir='ltr'>uenonis</span> <span class='ocrx_word' id='word_1_103' title='bbox 1059 649 1142 672; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_104' title='bbox 1153 647 1289 672; x_wconf 88' lang='eng' dir='ltr'>BAA—906T</span> <span class='ocrx_word' id='word_1_105' title='bbox 1299 647 1430 676; x_wconf 89' lang='eng' dir='ltr'>(AY57051</span> <span class='ocrx_word' id='word_1_106' title='bbox 1439 647 1464 676; x_wconf 92' lang='eng'>4)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 717 690 1471 721; baseline 0.001 -7"><span class='ocrx_word' id='word_1_107' title='bbox 717 692 922 721; x_wconf 84' lang='eng' dir='ltr'>Porphyromonas</span> <span class='ocrx_word' id='word_1_108' title='bbox 932 692 1133 721; x_wconf 80' lang='eng' dir='ltr'>asaccharo/ytica</span> <span class='ocrx_word' id='word_1_109' title='bbox 1143 692 1226 715; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_110' title='bbox 1238 690 1337 715; x_wconf 89' lang='eng' dir='ltr'>25260T</span> <span class='ocrx_word' id='word_1_111' title='bbox 1347 690 1471 719; x_wconf 88' lang='eng' dir='ltr'>(L16490)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 463 733 1095 764; baseline 0.002 -7"><span class='ocrx_word' id='word_1_112' title='bbox 463 735 595 758; x_wconf 87' lang='eng' dir='ltr'>Tannere/la</span> <span class='ocrx_word' id='word_1_113' title='bbox 606 735 715 764; x_wconf 80' lang='eng' dir='ltr'>forsythia</span> <span class='ocrx_word' id='word_1_114' title='bbox 724 735 807 758; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_115' title='bbox 817 733 918 758; x_wconf 78' lang='eng' dir='ltr'>43037T</span> <span class='ocrx_word' id='word_1_116' title='bbox 928 733 1095 762; x_wconf 80' lang='eng' dir='ltr'>(A8035460)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 457 775 1047 807; baseline 0 -7"><span class='ocrx_word' id='word_1_117' title='bbox 457 778 589 800; x_wconf 79' lang='eng' dir='ltr'>Tannerella</span> <span class='ocrx_word' id='word_1_118' title='bbox 600 777 708 807; x_wconf 83' lang='eng' dir='ltr'>forsythia</span> <span class='ocrx_word' id='word_1_119' title='bbox 720 778 782 800; x_wconf 93' lang='eng' dir='ltr'>RMA</span> <span class='ocrx_word' id='word_1_120' title='bbox 793 778 862 800; x_wconf 88' lang='eng'>8464</span> <span class='ocrx_word' id='word_1_121' title='bbox 873 775 1013 805; x_wconf 79' lang='eng' dir='ltr'>(D034491</span> <span class='ocrx_word' id='word_1_122' title='bbox 1023 775 1047 804; x_wconf 92' lang='eng'>7)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 593 818 1283 847; baseline 0 -4"><span class='ocrx_word' id='word_1_123' title='bbox 593 821 806 843; x_wconf 71' lang='eng' dir='ltr'>Parabacteroides</span> <span class='ocrx_word' id='word_1_124' title='bbox 816 821 947 843; x_wconf 78' lang='eng' dir='ltr'>distasonis</span> <span class='ocrx_word' id='word_1_125' title='bbox 956 820 1014 843; x_wconf 88' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_126' title='bbox 1026 818 1108 843; x_wconf 88' lang='eng' dir='ltr'>5825T</span> <span class='ocrx_word' id='word_1_127' title='bbox 1119 818 1283 847; x_wconf 87' lang='eng' dir='ltr'>(EU136681)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 693 861 1290 892; baseline 0 -6"><span class='ocrx_word' id='word_1_128' title='bbox 693 864 850 886; x_wconf 83' lang='eng' dir='ltr'>Bacteroides</span> <span class='ocrx_word' id='word_1_129' title='bbox 861 864 945 892; x_wconf 84' lang='eng' dir='ltr'>fragi/is</span> <span class='ocrx_word' id='word_1_130' title='bbox 956 864 1019 886; x_wconf 93' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_131' title='bbox 1032 861 1113 886; x_wconf 91' lang='eng' dir='ltr'>2151T</span> <span class='ocrx_word' id='word_1_132' title='bbox 1123 861 1290 891; x_wconf 86' lang='eng' dir='ltr'>(AB050106)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 543 904 1265 933; baseline 0 -4"><span class='ocrx_word' id='word_1_133' title='bbox 543 907 700 929; x_wconf 79' lang='eng' dir='ltr'>Bacteroides</span> <span class='ocrx_word' id='word_1_134' title='bbox 711 907 928 929; x_wconf 82' lang='eng' dir='ltr'>theta/otaomicron</span> <span class='ocrx_word' id='word_1_135' title='bbox 938 906 1020 929; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_136' title='bbox 1031 908 1076 929; x_wconf 87' lang='eng'>291</span> <span class='ocrx_word' id='word_1_137' title='bbox 1085 904 1131 929; x_wconf 82' lang='eng' dir='ltr'>48T</span> <span class='ocrx_word' id='word_1_138' title='bbox 1141 904 1176 933; x_wconf 93' lang='eng' dir='ltr'>(L1</span> <span class='ocrx_word' id='word_1_139' title='bbox 1185 904 1265 933; x_wconf 88' lang='eng'>6489)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 536 947 1312 979; baseline 0 -7"><span class='ocrx_word' id='word_1_140' title='bbox 536 953 594 969; x_wconf 87' lang='eng'>100.0</span> <span class='ocrx_word' id='word_1_141' title='bbox 682 950 839 972; x_wconf 77' lang='eng' dir='ltr'>Bacteroides</span> <span class='ocrx_word' id='word_1_142' title='bbox 847 957 975 979; x_wconf 86' lang='eng' dir='ltr'>pyogenes</span> <span class='ocrx_word' id='word_1_143' title='bbox 984 949 1042 972; x_wconf 91' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_144' title='bbox 1054 947 1136 972; x_wconf 90' lang='eng' dir='ltr'>6294T</span> <span class='ocrx_word' id='word_1_145' title='bbox 1147 947 1312 976; x_wconf 87' lang='eng' dir='ltr'>(EU136683)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 673 990 1274 1019; baseline 0 -4"><span class='ocrx_word' id='word_1_146' title='bbox 673 993 830 1015; x_wconf 82' lang='eng' dir='ltr'>Bacteroides</span> <span class='ocrx_word' id='word_1_147' title='bbox 841 995 919 1015; x_wconf 74' lang='eng' dir='ltr'>tectus</span> <span class='ocrx_word' id='word_1_148' title='bbox 928 992 986 1015; x_wconf 90' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_149' title='bbox 1000 990 1098 1015; x_wconf 78' lang='eng' dir='ltr'>10003T</span> <span class='ocrx_word' id='word_1_150' title='bbox 1108 990 1274 1019; x_wconf 87' lang='eng' dir='ltr'>(EU136689)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 814 1032 1536 1064; baseline 0 -7"><span class='ocrx_word' id='word_1_151' title='bbox 814 1035 942 1057; x_wconf 81' lang='eng' dir='ltr'>Prevote/la</span> <span class='ocrx_word' id='word_1_152' title='bbox 953 1035 1158 1064; x_wconf 87' lang='eng' dir='ltr'>me/aninogenica</span> <span class='ocrx_word' id='word_1_153' title='bbox 1168 1035 1250 1057; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_154' title='bbox 1262 1033 1361 1057; x_wconf 87' lang='eng' dir='ltr'>25845T</span> <span class='ocrx_word' id='word_1_155' title='bbox 1372 1032 1536 1062; x_wconf 86' lang='eng' dir='ltr'>(AY323525)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 527 1075 1099 1106; baseline 0 -6"><span class='ocrx_word' id='word_1_156' title='bbox 527 1078 637 1106; x_wconf 82' lang='eng' dir='ltr'>Alist/pes</span> <span class='ocrx_word' id='word_1_157' title='bbox 649 1078 837 1106; x_wconf 83' lang='eng' dir='ltr'>finegoldiiANH</span> <span class='ocrx_word' id='word_1_158' title='bbox 850 1075 931 1100; x_wconf 89' lang='eng' dir='ltr'>2437T</span> <span class='ocrx_word' id='word_1_159' title='bbox 942 1075 1099 1105; x_wconf 89' lang='eng' dir='ltr'>(AJ518874)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 509 1118 1095 1149; baseline 0 -6"><span class='ocrx_word' id='word_1_160' title='bbox 509 1121 620 1149; x_wconf 85' lang='eng' dir='ltr'>Alistipes</span> <span class='ocrx_word' id='word_1_161' title='bbox 629 1121 759 1149; x_wconf 76' lang='eng' dir='ltr'>putredinis</span> <span class='ocrx_word' id='word_1_162' title='bbox 768 1120 851 1143; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_163' title='bbox 862 1118 961 1143; x_wconf 89' lang='eng' dir='ltr'>29800T</span> <span class='ocrx_word' id='word_1_164' title='bbox 972 1118 1007 1147; x_wconf 88' lang='eng' dir='ltr'>(L1</span> <span class='ocrx_word' id='word_1_165' title='bbox 1016 1122 1066 1143; x_wconf 87' lang='eng'>649</span> <span class='ocrx_word' id='word_1_166' title='bbox 1072 1118 1095 1147; x_wconf 93' lang='eng'>7)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 486 95 545 112">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 486 95 545 112">
+     <span class='ocr_line' id='line_1_41' title="bbox 486 95 545 112; baseline 0 0"><span class='ocrx_word' id='word_1_167' title='bbox 486 95 545 112; x_wconf 89' lang='eng'>100.0</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 385 267 444 283">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 385 267 444 283">
+     <span class='ocr_line' id='line_1_42' title="bbox 385 267 444 283; baseline 0 0"><span class='ocrx_word' id='word_1_168' title='bbox 385 267 444 283; x_wconf 93' lang='eng'>100.0</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 356 549 415 566">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 356 549 415 566">
+     <span class='ocr_line' id='line_1_43' title="bbox 356 549 415 566; baseline 0 0"><span class='ocrx_word' id='word_1_169' title='bbox 356 549 415 566; x_wconf 88' lang='eng'>100.0</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 320 738 379 755">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 320 738 379 755">
+     <span class='ocr_line' id='line_1_44' title="bbox 320 738 379 755; baseline 0 0"><span class='ocrx_word' id='word_1_170' title='bbox 320 738 379 755; x_wconf 89' lang='eng'>100.0</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 320 867 379 883">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 320 867 379 883">
+     <span class='ocr_line' id='line_1_45' title="bbox 320 867 379 883; baseline 0 0"><span class='ocrx_word' id='word_1_171' title='bbox 320 867 379 883; x_wconf 87' lang='eng'>100.0</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001925-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001925-0-000.pbm.png
new file mode 100644
index 00000000..d217b64d
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001925-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001925-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001925-0-000.pbm.png.hocr
new file mode 100644
index 00000000..ba0bd32e
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001925-0-000.pbm.png.hocr
@@ -0,0 +1,98 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001925-0-000.pbm.png"; bbox 0 0 994 535; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 170 2 990 532">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 170 2 779 29">
+     <span class='ocr_line' id='line_1_1' title="bbox 170 2 779 29; baseline -0.002 -5"><span class='ocrx_word' id='word_1_1' title='bbox 170 8 206 26; x_wconf 87' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 245 2 359 24; x_wconf 83' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 370 2 478 29; x_wconf 81' lang='eng' dir='ltr'><em>aquatica</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 489 2 550 24; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 561 2 653 24; x_wconf 79' lang='eng' dir='ltr'><em>2014GT</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 662 2 779 29; x_wconf 88' lang='eng' dir='ltr'><em>(X77450)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 231 44 792 71">
+     <span class='ocr_line' id='line_1_2' title="bbox 231 44 792 71; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 231 44 346 65; x_wconf 85' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 356 44 521 71; x_wconf 83' lang='eng' dir='ltr'><em>naganoensis</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 531 44 630 65; x_wconf 84' lang='eng' dir='ltr'><em>DB103T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 640 44 792 71; x_wconf 87' lang='eng' dir='ltr'><em>(AB028941)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 261 86 825 113">
+     <span class='ocr_line' id='line_1_3' title="bbox 261 86 825 113; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 261 86 375 107; x_wconf 83' lang='eng' dir='ltr'><em>Le/fsonia</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 385 86 553 107; x_wconf 89' lang='eng' dir='ltr'><em>shinshuensis</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 563 86 662 107; x_wconf 91' lang='eng' dir='ltr'><em>DB102T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 672 86 825 113; x_wconf 79' lang='eng' dir='ltr'><em>(A3028940)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 179 128 990 197">
+     <span class='ocr_line' id='line_1_4' title="bbox 267 128 990 155; baseline 0 -6"><span class='ocrx_word' id='word_1_15' title='bbox 267 128 382 149; x_wconf 81' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 391 128 435 155; x_wconf 83' lang='eng' dir='ltr'><em>xyli</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 443 128 525 155; x_wconf 21' lang='eng' dir='ltr'><em>subsp‘</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 537 128 675 155; x_wconf 81' lang='eng' dir='ltr'><em>cynodontis</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 684 128 741 149; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 753 128 828 149; x_wconf 80' lang='eng' dir='ltr'><em>9733T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 838 128 990 155; x_wconf 87' lang='eng' dir='ltr'><em>(ABO16985)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 179 170 728 197; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 179 170 294 191; x_wconf 85' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 303 175 368 197; x_wconf 86' lang='eng' dir='ltr'><em>poae</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 376 170 437 191; x_wconf 93' lang='eng' dir='ltr'><em>VKM</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 447 170 568 191; x_wconf 81' lang='eng' dir='ltr'><em>Ac-1401T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 578 170 728 197; x_wconf 85' lang='eng' dir='ltr'><em>(AF116342)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 224 211 978 281">
+     <span class='ocr_line' id='line_1_6' title="bbox 343 211 978 238; baseline 0 -5"><span class='ocrx_word' id='word_1_27' title='bbox 343 211 512 233; x_wconf 79' lang='eng' dir='ltr'><em>Okibacterium</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 522 211 637 233; x_wconf 76' lang='eng' dir='ltr'><em>frit/&quot;I/ariae</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 648 211 708 233; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 722 211 811 233; x_wconf 89' lang='eng' dir='ltr'><em>15271T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 821 212 978 238; x_wconf 86' lang='eng' dir='ltr'><em>(AM410675)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 224 253 746 281; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 224 253 340 275; x_wconf 81' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 349 254 459 281; x_wconf 82' lang='eng' dir='ltr'><em>ginsengi</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 466 254 547 281; x_wconf 90' lang='eng' dir='ltr'>wged1</span> <span class='ocrx_word' id='word_1_35' title='bbox 555 253 579 275; x_wconf 81' lang='eng' dir='ltr'>1T</span> <span class='ocrx_word' id='word_1_36' title='bbox 589 253 746 280; x_wconf 87' lang='eng' dir='ltr'><em>(DQ473536)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 232 295 975 491">
+     <span class='ocr_line' id='line_1_8' title="bbox 357 295 922 323; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 357 295 483 317; x_wconf 88' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 493 295 638 317; x_wconf 87' lang='eng' dir='ltr'><em>kribbensis</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 648 295 760 317; x_wconf 80' lang='eng' dir='ltr'><em>MSL-13T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 770 295 922 323; x_wconf 88' lang='eng' dir='ltr'><em>(EF466129)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 232 337 802 365; baseline 0 -6"><span class='ocrx_word' id='word_1_41' title='bbox 232 337 346 359; x_wconf 81' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 356 338 519 365; x_wconf 84' lang='eng' dir='ltr'><em>bigeumensis</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 530 337 641 359; x_wconf 89' lang='eng' dir='ltr'><em>MSL—27T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 651 338 802 365; x_wconf 87' lang='eng' dir='ltr'><em>(EF466124)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 275 379 975 407; baseline 0 -6"><span class='ocrx_word' id='word_1_45' title='bbox 275 379 472 401; x_wconf 81' lang='eng' dir='ltr'><em>Sal/n/bacterium</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 482 380 654 407; x_wconf 86' lang='eng' dir='ltr'><em>amurskyense</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 664 380 728 401; x_wconf 91' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 740 379 814 401; x_wconf 83' lang='eng' dir='ltr'><em>3673T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 824 380 975 407; x_wconf 87' lang='eng' dir='ltr'><em>(AF539697)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 361 421 857 449; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 361 421 476 443; x_wconf 79' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 487 427 559 443; x_wconf 86' lang='eng' dir='ltr'><em>aurea</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 570 421 631 443; x_wconf 88' lang='eng' dir='ltr'><em>CMS</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 642 421 699 449; x_wconf 82' lang='eng' dir='ltr'><em>81yT</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 709 422 857 448; x_wconf 85' lang='eng' dir='ltr'><em>(AJ438586)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 355 463 852 491; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 355 464 526 491; x_wconf 86' lang='eng' dir='ltr'><em>Rhodoglobus</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 537 464 625 485; x_wconf 81' lang='eng' dir='ltr'><em>vestalii</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 634 463 695 485; x_wconf 80' lang='eng' dir='ltr'><em>LV3T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 705 464 852 490; x_wconf 82' lang='eng' dir='ltr'><em>(AJ459101)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 239 502 777 532">
+     <span class='ocr_line' id='line_1_13' title="bbox 239 502 777 532; baseline 0 -5"><span class='ocrx_word' id='word_1_59' title='bbox 239 502 275 519; x_wconf 70' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 294 505 408 527; x_wconf 81' lang='eng' dir='ltr'><em>Leifsonia</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 418 506 485 527; x_wconf 88' lang='eng' dir='ltr'><em>rubra</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 495 505 557 527; x_wconf 88' lang='eng' dir='ltr'><em>CMS</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 568 505 620 527; x_wconf 82' lang='eng' dir='ltr'>76rT</span> <span class='ocrx_word' id='word_1_64' title='bbox 630 506 777 532; x_wconf 87' lang='eng' dir='ltr'><em>(AJ438585)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 9 354 518">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 0 9 354 518">
+     <span class='ocr_line' id='line_1_14' title="bbox 90 9 237 42; baseline 0 -11"><span class='ocrx_word' id='word_1_65' title='bbox 90 9 237 42; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 26 42 261 126; baseline 0 0"><span class='ocrx_word' id='word_1_66' title='bbox 26 42 261 126; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 0 126 262 168; baseline 0 -20"><span class='ocrx_word' id='word_1_67' title='bbox 0 126 262 168; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 0 168 335 251; baseline 0 -12"><span class='ocrx_word' id='word_1_68' title='bbox 0 168 335 251; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 0 251 354 323; baseline 0 0"><span class='ocrx_word' id='word_1_69' title='bbox 0 251 354 323; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 0 323 232 379; baseline 0 156"><span class='ocrx_word' id='word_1_70' title='bbox 0 323 232 379; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 0 379 273 421; baseline 0 114"><span class='ocrx_word' id='word_1_71' title='bbox 0 379 273 421; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 0 421 350 487; baseline 0 48"><span class='ocrx_word' id='word_1_72' title='bbox 0 421 350 487; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 171 487 239 518; baseline 0 17"><span class='ocrx_word' id='word_1_73' title='bbox 171 487 239 518; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 171 121 195 139">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 171 121 195 139">
+     <span class='ocr_line' id='line_1_23' title="bbox 171 121 195 139; baseline 0 0"><span class='ocrx_word' id='word_1_74' title='bbox 171 121 195 139; x_wconf 87' lang='eng'><em>80</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 40 489 98 507">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 40 489 98 507">
+     <span class='ocr_line' id='line_1_24' title="bbox 40 489 98 507; baseline 0 0"><span class='ocrx_word' id='word_1_75' title='bbox 40 489 98 507; x_wconf 62' lang='eng'>0,005</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001958-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001958-0-001.pbm.png
new file mode 100644
index 00000000..54b17990
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001958-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001958-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001958-0-001.pbm.png.hocr
new file mode 100644
index 00000000..244db661
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001958-0-001.pbm.png.hocr
@@ -0,0 +1,344 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001958-0-001.pbm.png"; bbox 0 0 1302 1839; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 88 0 134 18">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 88 0 134 18">
+     <span class='ocr_line' id='line_1_1' title="bbox 88 0 134 18; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 88 0 134 18; x_wconf 67' lang='eng'><em>0,02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 1503 332 1810">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 1503 332 1810">
+     <span class='ocr_line' id='line_1_2' title="bbox 0 1503 332 1810; baseline 0 29"><span class='ocrx_word' id='word_1_2' title='bbox 0 1503 332 1810; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 368 889 382 899">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 368 889 382 899">
+     <span class='ocr_line' id='line_1_3' title="bbox 368 889 382 899; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 368 889 382 899; x_wconf 71' lang='eng' dir='ltr'><em>as</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 576 2 1053 25">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 576 2 1053 25">
+     <span class='ocr_line' id='line_1_4' title="bbox 576 2 1053 25; baseline 0 -5"><span class='ocrx_word' id='word_1_4' title='bbox 576 2 694 20; x_wconf 75' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 702 2 863 20; x_wconf 80' lang='eng' dir='ltr'><em>sulfatireducens</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 875 3 917 20; x_wconf 86' lang='eng'><em>38-1</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 927 2 1053 25; x_wconf 84' lang='eng' dir='ltr'><em>(AY943861)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 393 8 581 814">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 393 33 581 814">
+     <span class='ocr_line' id='line_1_5' title="bbox 503 33 574 181; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 503 33 574 181; x_wconf 95' lang='eng' dir='ltr'><em>     </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 496 181 581 278; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 496 181 581 278; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 496 278 539 349; baseline 0 1490"><span class='ocrx_word' id='word_1_10' title='bbox 496 278 539 349; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 393 338 502 427; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 393 338 502 427; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 393 427 439 490; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 393 427 439 490; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 393 490 439 516; baseline 0 1323"><span class='ocrx_word' id='word_1_13' title='bbox 393 490 439 516; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 393 516 558 663; baseline 0 -56"><span class='ocrx_word' id='word_1_14' title='bbox 393 516 558 663; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 393 663 518 814; baseline 0 0"><span class='ocrx_word' id='word_1_15' title='bbox 393 663 518 814; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 567 46 1115 115">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 567 46 1115 115">
+     <span class='ocr_line' id='line_1_13' title="bbox 567 46 1115 73; baseline 0 -5"><span class='ocrx_word' id='word_1_16' title='bbox 567 50 685 68; x_wconf 74' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 694 51 835 73; x_wconf 74' lang='eng' dir='ltr'><em>amygdaI/‘num</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 853 46 979 68; x_wconf 67' lang='eng' dir='ltr'><em>DSM12857T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 988 50 1115 73; x_wconf 82' lang='eng' dir='ltr'><em>(AY353957)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 575 92 1004 115; baseline 0 -5"><span class='ocrx_word' id='word_1_20' title='bbox 575 92 693 110; x_wconf 74' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 701 93 812 110; x_wconf 74' lang='eng' dir='ltr'><em>boliviensis</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 833 93 864 110; x_wconf 89' lang='eng' dir='ltr'><em>E-1</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 877 92 1004 115; x_wconf 83' lang='eng' dir='ltr'><em>(AY943862)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 503 111 516 121">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 503 111 516 121">
+     <span class='ocr_line' id='line_1_15' title="bbox 503 111 516 121; baseline 0 0"><span class='ocrx_word' id='word_1_24' title='bbox 503 111 516 121; x_wconf 77' lang='eng' dir='ltr'><em>se</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 477 141 1216 423">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 557 141 991 168">
+     <span class='ocr_line' id='line_1_16' title="bbox 557 141 991 168; baseline 0 -5"><span class='ocrx_word' id='word_1_25' title='bbox 557 145 675 163; x_wconf 70' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 683 145 751 163; x_wconf 81' lang='eng' dir='ltr'><em>indolis</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 771 145 821 163; x_wconf 85' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 831 141 879 163; x_wconf 79' lang='eng' dir='ltr'><em>755T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 894 145 991 168; x_wconf 83' lang='eng' dir='ltr'><em>(Y18184)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 539 189 1216 265">
+     <span class='ocr_line' id='line_1_17' title="bbox 582 189 1216 215; baseline -0.002 -4"><span class='ocrx_word' id='word_1_30' title='bbox 582 193 700 211; x_wconf 83' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 709 193 937 215; x_wconf 82' lang='eng' dir='ltr'><em>methoxybenzovorans</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 949 193 999 211; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 1010 189 1084 211; x_wconf 74' lang='eng' dir='ltr'><em>12182T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1091 193 1216 215; x_wconf 84' lang='eng' dir='ltr'><em>(AF067965)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 539 238 1079 265; baseline 0.002 -6"><span class='ocrx_word' id='word_1_35' title='bbox 539 242 657 259; x_wconf 85' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 665 242 837 264; x_wconf 81' lang='eng' dir='ltr'><em>saccharolyticum</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 856 242 906 259; x_wconf 85' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 915 238 976 259; x_wconf 71' lang='eng' dir='ltr'><em>2544T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 982 242 1079 265; x_wconf 85' lang='eng' dir='ltr'><em>(Y18185)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 547 285 1093 312">
+     <span class='ocr_line' id='line_1_19' title="bbox 547 285 1093 312; baseline -0.002 -4"><span class='ocrx_word' id='word_1_40' title='bbox 547 289 665 308; x_wconf 80' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 674 290 796 312; x_wconf 86' lang='eng' dir='ltr'><em>sphenoides</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 810 289 875 308; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 886 285 956 308; x_wconf 78' lang='eng' dir='ltr'><em>19403T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 966 290 1093 312; x_wconf 88' lang='eng' dir='ltr'>(ABO75772)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 477 323 1064 360">
+     <span class='ocr_line' id='line_1_20' title="bbox 477 323 1064 360; baseline 0 -5"><span class='ocrx_word' id='word_1_45' title='bbox 477 323 497 332; x_wconf 57' lang='eng' dir='ltr'><em>m</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 541 338 659 355; x_wconf 79' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 668 338 829 355; x_wconf 81' lang='eng' dir='ltr'><em>celerecrescens</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 844 338 894 355; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 904 334 1064 360; x_wconf 66' lang='eng' dir='ltr'><em>5628T(X71848)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 506 382 1185 423">
+     <span class='ocr_line' id='line_1_21' title="bbox 506 382 1185 423; baseline 0 -20"><span class='ocrx_word' id='word_1_50' title='bbox 506 414 520 423; x_wconf 47' lang='eng' dir='ltr'><em>9E</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 572 386 690 403; x_wconf 83' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 699 386 899 408; x_wconf 81' lang='eng' dir='ltr'><em>algidixylanolyticum</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 919 386 969 403; x_wconf 93' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 980 382 1185 408; x_wconf 56' lang='eng' dir='ltr'><em>12273T(AF092549)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 544 428 1058 454">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 544 428 1058 454">
+     <span class='ocr_line' id='line_1_22' title="bbox 544 428 1058 454; baseline 0.002 -5"><span class='ocrx_word' id='word_1_55' title='bbox 544 432 663 450; x_wconf 76' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 671 432 814 454; x_wconf 81' lang='eng' dir='ltr'><em>xylanolyticum</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 838 432 888 450; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 898 428 1058 454; x_wconf 54' lang='eng' dir='ltr'><em>6555T(X76739)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 498 255 500 432">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 498 255 500 432">
+     <span class='ocr_line' id='line_1_23' title="bbox 498 255 500 432; baseline 0 1407"><span class='ocrx_word' id='word_1_59' title='bbox 498 255 500 432; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 513 475 533 485">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 513 475 533 485">
+     <span class='ocr_line' id='line_1_24' title="bbox 513 475 533 485; baseline 0 0"><span class='ocrx_word' id='word_1_60' title='bbox 513 475 533 485; x_wconf 75' lang='eng' dir='ltr'><em>mu</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 490 477 1107 741">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 496 477 1107 649">
+     <span class='ocr_line' id='line_1_25' title="bbox 544 477 1052 503; baseline 0 -5"><span class='ocrx_word' id='word_1_61' title='bbox 544 481 663 498; x_wconf 81' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 671 481 804 498; x_wconf 75' lang='eng' dir='ltr'><em>aerato/erans</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 823 481 873 498; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 883 477 943 498; x_wconf 75' lang='eng' dir='ltr'><em>5434T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 955 481 1052 503; x_wconf 83' lang='eng' dir='ltr'><em>(X76163)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 562 524 1079 551; baseline 0 -5"><span class='ocrx_word' id='word_1_66' title='bbox 562 528 681 546; x_wconf 81' lang='eng' dir='ltr'><em>Closm&#39;dium</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 689 529 798 551; x_wconf 78' lang='eng' dir='ltr'><em>hathewayi</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 816 528 866 546; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 878 524 948 546; x_wconf 80' lang='eng' dir='ltr'><em>13479T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 957 528 1079 551; x_wconf 84' lang='eng' dir='ltr'><em>(AJ311620)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 563 572 1107 599; baseline 0 -5"><span class='ocrx_word' id='word_1_71' title='bbox 563 576 682 594; x_wconf 82' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 690 576 800 594; x_wconf 84' lang='eng' dir='ltr'><em>aldenense</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 814 576 883 594; x_wconf 89' lang='eng' dir='ltr'><em>CCUG</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 892 572 968 594; x_wconf 76' lang='eng' dir='ltr'><em>52204T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 976 576 1107 599; x_wconf 82' lang='eng' dir='ltr'>(DQ279736)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 496 621 1038 649; baseline 0 -7"><span class='ocrx_word' id='word_1_76' title='bbox 496 640 510 649; x_wconf 55' lang='eng' dir='ltr'><strong><em>w</em></strong></span> <span class='ocrx_word' id='word_1_77' title='bbox 544 625 662 642; x_wconf 79' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 670 625 748 642; x_wconf 83' lang='eng' dir='ltr'><em>bolteae</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 771 621 903 642; x_wconf 73' lang='eng' dir='ltr'><em>WAL16351T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 916 625 1038 647; x_wconf 83' lang='eng' dir='ltr'><em>(AJ508452)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 490 633 1105 741">
+     <span class='ocr_line' id='line_1_29' title="bbox 490 633 1105 695; baseline 0 -5"><span class='ocrx_word' id='word_1_81' title='bbox 490 633 538 683; x_wconf 63' lang='eng'>{</span> <span class='ocrx_word' id='word_1_82' title='bbox 547 672 666 690; x_wconf 79' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 674 672 829 690; x_wconf 78' lang='eng' dir='ltr'><em>closm&#39;dioforme</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 843 672 908 690; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 916 668 992 690; x_wconf 78' lang='eng' dir='ltr'><em>25537T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1004 672 1105 695; x_wconf 84' lang='eng' dir='ltr'>(M59089)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 575 715 1104 741; baseline 0 -5"><span class='ocrx_word' id='word_1_87' title='bbox 575 719 693 736; x_wconf 82' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 702 719 791 736; x_wconf 75' lang='eng' dir='ltr'><em>Citroniae</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 813 719 882 736; x_wconf 86' lang='eng' dir='ltr'><em>CCUG</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 892 715 964 736; x_wconf 75' lang='eng' dir='ltr'><em>52203T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 973 719 1104 741; x_wconf 80' lang='eng' dir='ltr'>(DQZ79737)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 488 657 490 731">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 488 657 490 731">
+     <span class='ocr_line' id='line_1_31' title="bbox 488 657 490 731; baseline 0 1108"><span class='ocrx_word' id='word_1_92' title='bbox 488 657 490 731; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 490 729 569 731">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 490 729 569 731">
+     <span class='ocr_line' id='line_1_32' title="bbox 490 729 569 731; baseline 0 1108"><span class='ocrx_word' id='word_1_93' title='bbox 490 729 569 731; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 520 764 1116 790">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 520 764 1116 790">
+     <span class='ocr_line' id='line_1_33' title="bbox 520 764 1116 790; baseline 0 -5"><span class='ocrx_word' id='word_1_94' title='bbox 520 776 538 778; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_95' title='bbox 546 767 664 785; x_wconf 80' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 673 767 825 790; x_wconf 83' lang='eng' dir='ltr'><em>asparagiforme</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 846 767 896 785; x_wconf 85' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 907 764 980 785; x_wconf 78' lang='eng' dir='ltr'><em>15981T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 993 767 1116 790; x_wconf 86' lang='eng' dir='ltr'><em>(AJ582080)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 518 776 520 850">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 518 776 520 850">
+     <span class='ocr_line' id='line_1_34' title="bbox 518 776 520 850; baseline 0 989"><span class='ocrx_word' id='word_1_100' title='bbox 518 776 520 850; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 520 811 1083 885">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 520 811 1083 885">
+     <span class='ocr_line' id='line_1_35' title="bbox 520 811 1083 874; baseline 0 -41"><span class='ocrx_word' id='word_1_101' title='bbox 520 815 702 874; x_wconf 50' lang='eng' dir='ltr'><em>1_E,OICIostridium</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 710 811 1083 838; x_wconf 71' lang='eng' dir='ltr'><em>IavalenseCCRl-9842T(EF564277)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 570 863 1078 885; baseline -0.002 -4"><span class='ocrx_word' id='word_1_103' title='bbox 570 863 702 881; x_wconf 84' lang='eng' dir='ltr'><em>Clcstridium</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 710 863 879 881; x_wconf 82' lang='eng' dir='ltr'><em>IavalenseCCRl</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 885 863 944 881; x_wconf 81' lang='eng'>-9929</span> <span class='ocrx_word' id='word_1_106' title='bbox 953 863 1078 885; x_wconf 87' lang='eng' dir='ltr'><em>(EF564278)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 354 909 391 911">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 354 909 391 911">
+     <span class='ocr_line' id='line_1_37' title="bbox 354 909 391 911; baseline 0 928"><span class='ocrx_word' id='word_1_107' title='bbox 354 909 391 911; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 354 909 356 1233">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 354 909 356 1233">
+     <span class='ocr_line' id='line_1_38' title="bbox 354 909 356 1233; baseline 0 606"><span class='ocrx_word' id='word_1_108' title='bbox 354 909 356 1233; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 363 1478 377 1487">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 363 1478 377 1487">
+     <span class='ocr_line' id='line_1_39' title="bbox 363 1478 377 1487; baseline 0 0"><span class='ocrx_word' id='word_1_109' title='bbox 363 1478 377 1487; x_wconf 64' lang='eng'><strong>54</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 632 907 1146 980">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 632 907 1146 980">
+     <span class='ocr_line' id='line_1_40' title="bbox 632 907 1146 934; baseline 0 -5"><span class='ocrx_word' id='word_1_110' title='bbox 632 911 750 929; x_wconf 78' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 759 912 880 934; x_wconf 86' lang='eng' dir='ltr'><em>symbiosum</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 889 911 954 929; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 964 907 1146 934; x_wconf 54' lang='eng' dir='ltr'><em>14940T(M59112)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 694 953 1109 980; baseline 0 -5"><span class='ocrx_word' id='word_1_114' title='bbox 694 958 812 975; x_wconf 82' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 820 958 956 980; x_wconf 84' lang='eng' dir='ltr'><em>aminophilum</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 975 953 1000 976; x_wconf 76' lang='eng' dir='ltr'><em>FT</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1014 958 1109 980; x_wconf 88' lang='eng' dir='ltr'><em>(L04165)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 550 1002 1302 1124">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 550 1002 1302 1124">
+     <span class='ocr_line' id='line_1_42' title="bbox 743 1002 1302 1029; baseline 0 -5"><span class='ocrx_word' id='word_1_118' title='bbox 743 1006 861 1024; x_wconf 81' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 868 1006 1037 1028; x_wconf 75' lang='eng' dir='ltr'><em>pmteoc/asticum</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 1048 1006 1112 1024; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 1122 1002 1195 1024; x_wconf 74' lang='eng' dir='ltr'><em>51982T</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 1203 1006 1302 1029; x_wconf 85' lang='eng' dir='ltr'>(U37378)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 563 1051 1056 1077; baseline 0.002 -5"><span class='ocrx_word' id='word_1_123' title='bbox 563 1054 682 1072; x_wconf 77' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 690 1054 796 1072; x_wconf 82' lang='eng' dir='ltr'><em>coccoides</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 815 1054 865 1072; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 875 1051 936 1072; x_wconf 72' lang='eng' dir='ltr'><em>2088T</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 955 1055 1056 1077; x_wconf 86' lang='eng' dir='ltr'>(M59090)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 550 1098 1118 1124; baseline 0 -5"><span class='ocrx_word' id='word_1_128' title='bbox 550 1102 669 1120; x_wconf 82' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 676 1102 877 1124; x_wconf 77' lang='eng' dir='ltr'><em>glycyrrhizini/yticum</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 900 1098 969 1120; x_wconf 73' lang='eng' dir='ltr'><em>ZM35T</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 991 1102 1118 1124; x_wconf 81' lang='eng' dir='ltr'><em>(AB233029)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 389 916 742 1021">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 389 916 742 1021">
+     <span class='ocr_line' id='line_1_45' title="bbox 389 916 632 947; baseline 0 892"><span class='ocrx_word' id='word_1_132' title='bbox 389 916 632 947; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 389 947 742 1021; baseline 0 -28"><span class='ocrx_word' id='word_1_133' title='bbox 389 947 742 1021; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 389 554 395 1065">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 389 554 395 1065">
+     <span class='ocr_line' id='line_1_47' title="bbox 389 554 395 1065; baseline 0 774"><span class='ocrx_word' id='word_1_134' title='bbox 389 554 395 1065; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 391 554 397 1065">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 391 554 397 1065">
+     <span class='ocr_line' id='line_1_48' title="bbox 391 554 397 1065; baseline 0 774"><span class='ocrx_word' id='word_1_135' title='bbox 391 554 397 1065; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 392 554 394 1065">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 392 554 394 1065">
+     <span class='ocr_line' id='line_1_49' title="bbox 392 554 394 1065; baseline 0 774"><span class='ocrx_word' id='word_1_136' title='bbox 392 554 394 1065; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 352 1107 668 1356">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 352 1107 668 1356">
+     <span class='ocr_line' id='line_1_50' title="bbox 352 1107 549 1185; baseline 0 -52"><span class='ocrx_word' id='word_1_137' title='bbox 352 1107 549 1185; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 352 1185 603 1285; baseline 0 0"><span class='ocrx_word' id='word_1_138' title='bbox 352 1185 603 1285; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 403 1285 668 1356; baseline 0 -29"><span class='ocrx_word' id='word_1_139' title='bbox 403 1285 668 1356; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 384 1146 1127 1459">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 533 1146 1019 1172">
+     <span class='ocr_line' id='line_1_53' title="bbox 533 1146 1019 1172; baseline 0 -5"><span class='ocrx_word' id='word_1_140' title='bbox 533 1150 651 1167; x_wconf 79' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 660 1150 750 1167; x_wconf 72' lang='eng' dir='ltr'><em>orotioum</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 766 1150 830 1167; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 841 1146 911 1167; x_wconf 72' lang='eng' dir='ltr'><em>13619T</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 918 1150 1019 1172; x_wconf 84' lang='eng' dir='ltr'>(M59109)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 536 1194 968 1220">
+     <span class='ocr_line' id='line_1_54' title="bbox 536 1194 968 1220; baseline -0.002 -4"><span class='ocrx_word' id='word_1_145' title='bbox 536 1198 654 1216; x_wconf 76' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 662 1198 724 1216; x_wconf 85' lang='eng' dir='ltr'><em>nexile</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 744 1198 794 1216; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 805 1194 863 1216; x_wconf 74' lang='eng' dir='ltr'><em>1787T</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 871 1198 968 1220; x_wconf 85' lang='eng' dir='ltr'><em>(X73443)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 604 1240 1127 1270">
+     <span class='ocr_line' id='line_1_55' title="bbox 604 1240 1127 1270; baseline 0.008 -8"><span class='ocrx_word' id='word_1_150' title='bbox 604 1244 722 1262; x_wconf 74' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 731 1245 847 1267; x_wconf 81' lang='eng' dir='ltr'><em>hy/emonae</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 861 1245 911 1263; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 922 1240 1127 1270; x_wconf 67' lang='eng' dir='ltr'><em>15053T(A8023972)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 605 1293 1055 1316">
+     <span class='ocr_line' id='line_1_56' title="bbox 605 1293 1055 1316; baseline 0.002 -5"><span class='ocrx_word' id='word_1_154' title='bbox 605 1293 723 1311; x_wconf 80' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 731 1293 833 1311; x_wconf 82' lang='eng' dir='ltr'><em>fusiformis</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 844 1294 920 1312; x_wconf 83' lang='eng' dir='ltr'>CM973</span> <span class='ocrx_word' id='word_1_157' title='bbox 930 1294 1055 1316; x_wconf 84' lang='eng' dir='ltr'><em>(AF028349)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 439 1336 1125 1412">
+     <span class='ocr_line' id='line_1_57' title="bbox 670 1336 1125 1363; baseline 0 -4"><span class='ocrx_word' id='word_1_158' title='bbox 670 1341 787 1359; x_wconf 83' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 796 1341 890 1359; x_wconf 84' lang='eng' dir='ltr'><em>scindens</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 902 1341 952 1359; x_wconf 85' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 961 1336 1021 1359; x_wconf 84' lang='eng' dir='ltr'><em>5676T</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 1028 1341 1125 1363; x_wconf 83' lang='eng' dir='ltr'><em>(Y18186)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 439 1385 1034 1412; baseline 0 -6"><span class='ocrx_word' id='word_1_163' title='bbox 439 1402 459 1412; x_wconf 59' lang='eng' dir='ltr'><strong><em>m</em></strong></span> <span class='ocrx_word' id='word_1_164' title='bbox 528 1389 646 1406; x_wconf 80' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 651 1389 743 1411; x_wconf 85' lang='eng' dir='ltr'><em>jejuense</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 764 1389 813 1406; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 825 1385 898 1406; x_wconf 74' lang='eng' dir='ltr'><em>15929T</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 907 1389 1034 1411; x_wconf 86' lang='eng' dir='ltr'><em>(AY494606)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 384 1397 1084 1459">
+     <span class='ocr_line' id='line_1_59' title="bbox 384 1397 1084 1459; baseline 0 -5"><span class='ocrx_word' id='word_1_169' title='bbox 384 1397 658 1454; x_wconf 79' lang='eng' dir='ltr'><em>—|:Clostridium</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 665 1437 807 1459; x_wconf 80' lang='eng' dir='ltr'><em>xylanovorans</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 818 1436 869 1454; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 880 1433 1084 1459; x_wconf 56' lang='eng' dir='ltr'><em>12503T(AF116920)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 402 1479 1124 1506">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 402 1479 1124 1506">
+     <span class='ocr_line' id='line_1_60' title="bbox 402 1479 1124 1506; baseline 0 -5"><span class='ocrx_word' id='word_1_173' title='bbox 402 1496 416 1506; x_wconf 58' lang='eng'><em>57</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 587 1483 706 1501; x_wconf 81' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 714 1483 882 1501; x_wconf 75' lang='eng' dir='ltr'><em>aminova/erfcum</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 899 1483 948 1501; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 960 1479 1018 1501; x_wconf 83' lang='eng' dir='ltr'><em>1283T</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 1027 1483 1124 1506; x_wconf 83' lang='eng' dir='ltr'><em>(X73436)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 337 1491 582 1497">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 337 1491 582 1497">
+     <span class='ocr_line' id='line_1_61' title="bbox 337 1491 582 1497; baseline 0 342"><span class='ocrx_word' id='word_1_179' title='bbox 337 1491 582 1497; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 392 1517 424 1519">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 392 1517 424 1519">
+     <span class='ocr_line' id='line_1_62' title="bbox 392 1517 424 1519; baseline 0 320"><span class='ocrx_word' id='word_1_180' title='bbox 392 1517 424 1519; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 422 1493 424 1543">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 422 1493 424 1543">
+     <span class='ocr_line' id='line_1_63' title="bbox 422 1493 424 1543; baseline 0 296"><span class='ocrx_word' id='word_1_181' title='bbox 422 1493 424 1543; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 382 1421 384 1570">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 382 1421 384 1570">
+     <span class='ocr_line' id='line_1_64' title="bbox 382 1421 384 1570; baseline 0 269"><span class='ocrx_word' id='word_1_182' title='bbox 382 1421 384 1570; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 353 1783 373 1792">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 353 1783 373 1792">
+     <span class='ocr_line' id='line_1_65' title="bbox 353 1783 373 1792; baseline 0 0"><span class='ocrx_word' id='word_1_183' title='bbox 353 1783 373 1792; x_wconf 81' lang='eng' dir='ltr'><em>ma</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 591 1528 1232 1602">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 591 1528 1232 1602">
+     <span class='ocr_line' id='line_1_66' title="bbox 621 1528 1232 1554; baseline -0.002 -4"><span class='ocrx_word' id='word_1_184' title='bbox 621 1532 740 1550; x_wconf 85' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 747 1532 927 1554; x_wconf 75' lang='eng' dir='ltr'><em>phytofermenlans</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 939 1532 1004 1550; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 1012 1528 1100 1550; x_wconf 80' lang='eng' dir='ltr'><em>700394T</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 1107 1532 1232 1554; x_wconf 85' lang='eng' dir='ltr'><em>(AF020431)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 591 1576 1080 1602; baseline 0 -5"><span class='ocrx_word' id='word_1_189' title='bbox 591 1580 710 1597; x_wconf 78' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 717 1580 803 1602; x_wconf 82' lang='eng' dir='ltr'><em>populeti</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 815 1580 880 1597; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 889 1576 965 1597; x_wconf 81' lang='eng' dir='ltr'><em>35295T</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 983 1580 1080 1602; x_wconf 86' lang='eng' dir='ltr'><em>(X71853)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 392 1517 394 1627">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 392 1517 394 1627">
+     <span class='ocr_line' id='line_1_68' title="bbox 392 1517 394 1627; baseline 0 212"><span class='ocrx_word' id='word_1_194' title='bbox 392 1517 394 1627; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 488 1624 1276 1792">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 488 1624 1276 1792">
+     <span class='ocr_line' id='line_1_69' title="bbox 488 1624 1201 1650; baseline 0 -5"><span class='ocrx_word' id='word_1_195' title='bbox 488 1641 502 1650; x_wconf 54' lang='eng'>93</span> <span class='ocrx_word' id='word_1_196' title='bbox 626 1628 744 1645; x_wconf 79' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 751 1628 968 1650; x_wconf 83' lang='eng' dir='ltr'><em>polysaccharolyticum</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 978 1628 1028 1645; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 1040 1624 1095 1645; x_wconf 88' lang='eng' dir='ltr'><em>1801T</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 1104 1628 1201 1650; x_wconf 85' lang='eng' dir='ltr'>(X77839)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_70' title="bbox 577 1673 1074 1695; baseline 0.004 -2"><span class='ocrx_word' id='word_1_201' title='bbox 577 1675 695 1693; x_wconf 80' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_202' title='bbox 704 1676 829 1693; x_wconf 82' lang='eng' dir='ltr'><em>herbivorans</em></span> <span class='ocrx_word' id='word_1_203' title='bbox 837 1676 887 1694; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_204' title='bbox 898 1673 971 1694; x_wconf 76' lang='eng' dir='ltr'><em>14428T</em></span> <span class='ocrx_word' id='word_1_205' title='bbox 980 1673 1074 1695; x_wconf 83' lang='eng' dir='ltr'><em>(L34418)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 532 1719 1031 1743; baseline -0.002 -2"><span class='ocrx_word' id='word_1_206' title='bbox 532 1723 650 1741; x_wconf 80' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_207' title='bbox 659 1723 770 1741; x_wconf 77' lang='eng' dir='ltr'><em>fimetarium</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 778 1723 828 1741; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 837 1719 896 1741; x_wconf 70' lang='eng' dir='ltr'><em>9179T</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 906 1721 1031 1743; x_wconf 79' lang='eng' dir='ltr'><em>(AF126687)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_72' title="bbox 742 1766 1276 1792; baseline -0.004 -5"><span class='ocrx_word' id='word_1_211' title='bbox 742 1770 909 1792; x_wconf 86' lang='eng' dir='ltr'><em>Propionigenium</em></span> <span class='ocrx_word' id='word_1_212' title='bbox 917 1770 1028 1787; x_wconf 83' lang='eng' dir='ltr'><em>modestum</em></span> <span class='ocrx_word' id='word_1_213' title='bbox 1044 1770 1080 1787; x_wconf 85' lang='eng' dir='ltr'><em>Gra</em></span> <span class='ocrx_word' id='word_1_214' title='bbox 1089 1770 1141 1787; x_wconf 85' lang='eng' dir='ltr'><em>Succ</em></span> <span class='ocrx_word' id='word_1_215' title='bbox 1149 1766 1171 1787; x_wconf 76' lang='eng' dir='ltr'><em>2T</em></span> <span class='ocrx_word' id='word_1_216' title='bbox 1179 1767 1276 1790; x_wconf 85' lang='eng' dir='ltr'><em>(X54275)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 653 1815 1216 1839">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 653 1815 1216 1839">
+     <span class='ocr_line' id='line_1_73' title="bbox 653 1815 1216 1839; baseline -0.004 -3"><span class='ocrx_word' id='word_1_217' title='bbox 653 1819 811 1836; x_wconf 79' lang='eng' dir='ltr'><em>Fusobacterium</em></span> <span class='ocrx_word' id='word_1_218' title='bbox 819 1819 930 1836; x_wconf 76' lang='eng' dir='ltr'><em>nucleatum</em></span> <span class='ocrx_word' id='word_1_219' title='bbox 939 1819 1004 1836; x_wconf 90' lang='eng' dir='ltr'><strong>ATCC</strong></span> <span class='ocrx_word' id='word_1_220' title='bbox 1012 1815 1084 1836; x_wconf 74' lang='eng' dir='ltr'><em>25586T</em></span> <span class='ocrx_word' id='word_1_221' title='bbox 1093 1816 1216 1839; x_wconf 81' lang='eng' dir='ltr'><em>(AJ133496)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001966-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001966-0-000.pbm.png
new file mode 100644
index 00000000..9f0be5b4
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001966-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001966-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001966-0-000.pbm.png.hocr
new file mode 100644
index 00000000..b971b2b6
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001966-0-000.pbm.png.hocr
@@ -0,0 +1,120 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001966-0-000.pbm.png"; bbox 0 0 1241 573; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 245 0 1241 572">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 245 1 1240 571">
+     <span class='ocr_line' id='line_1_1' title="bbox 288 1 1168 28; baseline 0 -4"><span class='ocrx_word' id='word_1_1' title='bbox 288 13 572 15; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_2' title='bbox 584 3 748 24; x_wconf 82' lang='eng' dir='ltr'><em>Granulicatella</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 758 4 865 24; x_wconf 84' lang='eng' dir='ltr'><em>adiacens</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 875 3 936 24; x_wconf 87' lang='eng' dir='ltr'><em>GIFU</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 950 1 1039 24; x_wconf 84' lang='eng' dir='ltr'><em>12706T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1049 1 1168 28; x_wconf 89' lang='eng' dir='ltr'><em>(D50540)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 287 35 1141 64; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 287 47 572 49; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_8' title='bbox 581 38 720 64; x_wconf 82' lang='eng' dir='ltr'><em>Ablotrophla</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 731 37 838 58; x_wconf 82' lang='eng' dir='ltr'><em>defectiva</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 848 37 909 58; x_wconf 89' lang='eng' dir='ltr'><em>GIFU</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 922 35 1012 58; x_wconf 89' lang='eng' dir='ltr'><em>12707T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1021 35 1141 62; x_wconf 89' lang='eng' dir='ltr'><em>(D50541)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 245 68 1135 96; baseline -0.002 -3"><span class='ocrx_word' id='word_1_13' title='bbox 245 81 572 83; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_14' title='bbox 583 71 702 92; x_wconf 85' lang='eng' dir='ltr'><em>Facklamla</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 712 71 806 92; x_wconf 86' lang='eng' dir='ltr'><em>homlnls</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 815 71 891 92; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 902 68 1009 92; x_wconf 84' lang='eng' dir='ltr'><em>700628T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1018 69 1135 96; x_wconf 92' lang='eng' dir='ltr'>(Y10772)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 335 102 1146 129; baseline 0 -4"><span class='ocrx_word' id='word_1_19' title='bbox 335 115 572 117; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_20' title='bbox 581 105 727 125; x_wconf 85' lang='eng' dir='ltr'><em>Aerococcus</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 738 105 828 125; x_wconf 81' lang='eng' dir='ltr'><em>viridans</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 837 104 913 125; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 925 106 932 125; x_wconf 95' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 942 102 1015 125; x_wconf 78' lang='eng' dir='ltr'><em>1563T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1024 102 1146 129; x_wconf 87' lang='eng' dir='ltr'><em>(M58797)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 335 136 1108 163; baseline 0 -4"><span class='ocrx_word' id='word_1_26' title='bbox 335 149 572 151; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_27' title='bbox 581 138 726 159; x_wconf 85' lang='eng' dir='ltr'><em>Aerococcus</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 737 138 809 159; x_wconf 77' lang='eng' dir='ltr'><em>urinae</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 820 138 893 159; x_wconf 90' lang='eng' dir='ltr'>NCFB</span> <span class='ocrx_word' id='word_1_30' title='bbox 905 136 1108 163; x_wconf 71' lang='eng' dir='ltr'><em>2893T(M77819)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 582 169 1240 199; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 582 172 775 199; x_wconf 77' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 785 172 925 193; x_wconf 84' lang='eng' dir='ltr'><em>lntermedlus</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 934 172 1010 193; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1021 169 1111 193; x_wconf 65' lang='eng' dir='ltr'><em>QQGBST</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1121 170 1240 197; x_wconf 86' lang='eng' dir='ltr'><em>(D83369)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 582 203 1131 232; baseline 0 -6"><span class='ocrx_word' id='word_1_36' title='bbox 582 205 775 232; x_wconf 84' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 785 205 894 226; x_wconf 80' lang='eng' dir='ltr'><em>sch/elferl</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 902 205 996 226; x_wconf 85' lang='eng' dir='ltr'>CD22-1</span> <span class='ocrx_word' id='word_1_39' title='bbox 1012 203 1131 230; x_wconf 86' lang='eng' dir='ltr'>(D83372)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 582 237 1176 266; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 582 239 775 266; x_wconf 83' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 785 239 861 266; x_wconf 80' lang='eng' dir='ltr'><em>hyicus</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 870 239 946 260; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 958 241 965 260; x_wconf 90' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 975 237 1048 260; x_wconf 83' lang='eng' dir='ltr'><em>1249T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1057 237 1176 264; x_wconf 84' lang='eng' dir='ltr'><em>(D83368)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 582 270 1223 300; baseline 0 -7"><span class='ocrx_word' id='word_1_46' title='bbox 582 273 775 300; x_wconf 83' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 783 273 908 300; x_wconf 80' lang='eng' dir='ltr'><em>gallinarum</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 917 273 993 293; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1003 270 1095 293; x_wconf 78' lang='eng' dir='ltr'><em>35539T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1104 271 1223 297; x_wconf 85' lang='eng' dir='ltr'><em>(D83366)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 582 304 1064 333; baseline 0 -6"><span class='ocrx_word' id='word_1_51' title='bbox 582 306 775 333; x_wconf 83' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 785 306 832 327; x_wconf 82' lang='eng' dir='ltr'><em>fells</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 842 307 935 327; x_wconf 87' lang='eng' dir='ltr'><em>FD21-2</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 945 304 1064 331; x_wconf 85' lang='eng' dir='ltr'><em>(D83365)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 501 339 1158 388; baseline 0 -26"><span class='ocrx_word' id='word_1_55' title='bbox 501 352 571 388; x_wconf 77' lang='eng'><em>_|:</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 584 341 682 362; x_wconf 86' lang='eng' dir='ltr'><em>Gemella</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 692 342 849 368; x_wconf 83' lang='eng' dir='ltr'><em>haemolysans</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 858 341 933 362; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 946 339 1035 362; x_wconf 87' lang='eng' dir='ltr'><em>10379T</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 1044 339 1158 366; x_wconf 85' lang='eng' dir='ltr'><em>(L14326)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 584 373 1061 402; baseline -0.002 -6"><span class='ocrx_word' id='word_1_61' title='bbox 584 375 682 396; x_wconf 76' lang='eng' dir='ltr'><em>Gems/la</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 692 375 806 402; x_wconf 83' lang='eng' dir='ltr'><em>sangulnls</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 817 373 935 396; x_wconf 84' lang='eng' dir='ltr'><em>2045—94T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 944 373 1061 399; x_wconf 87' lang='eng' dir='ltr'><em>(Y13364)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 584 408 1144 435; baseline -0.002 -4"><span class='ocrx_word' id='word_1_65' title='bbox 584 410 682 431; x_wconf 75' lang='eng' dir='ltr'><em>Gems/la</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 692 410 834 431; x_wconf 86' lang='eng' dir='ltr'><em>morblllorum</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 844 410 920 431; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 930 408 1021 431; x_wconf 91' lang='eng' dir='ltr'><em>27824T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1030 408 1144 435; x_wconf 85' lang='eng' dir='ltr'><em>(L14327)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 584 441 1132 469; baseline -0.002 -4"><span class='ocrx_word' id='word_1_70' title='bbox 584 444 682 465; x_wconf 85' lang='eng' dir='ltr'><em>Gemella</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 692 441 1132 469; x_wconf 66' lang='eng' dir='ltr'><em>cuniculiM60449l99l1T(AJ251987)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 392 475 1014 505; baseline 0 -7"><span class='ocrx_word' id='word_1_72' title='bbox 392 488 572 490; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_73' title='bbox 584 478 682 498; x_wconf 83' lang='eng' dir='ltr'><em>Gemella</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 692 475 887 505; x_wconf 74' lang='eng' dir='ltr'><em>bergerl617-93T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 897 476 1014 502; x_wconf 86' lang='eng' dir='ltr'><em>(Y13365)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 583 509 1218 537; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 583 511 687 532; x_wconf 88' lang='eng' dir='ltr'><em>Gemella</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 697 511 897 537; x_wconf 85' lang='eng' dir='ltr'><em>asaccharolytica</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 907 511 962 532; x_wconf 97' lang='eng' dir='ltr'><em>WAL</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 974 509 1057 532; x_wconf 78' lang='eng' dir='ltr'><em>1945JT</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1067 509 1218 536; x_wconf 89' lang='eng' dir='ltr'><em>(EU427463)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 584 542 1108 571; baseline 0 -6"><span class='ocrx_word' id='word_1_81' title='bbox 584 544 682 565; x_wconf 76' lang='eng' dir='ltr'><em>Gems/la</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 691 545 819 571; x_wconf 82' lang='eng' dir='ltr'><em>palaticanis</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 829 545 965 565; x_wconf 86' lang='eng' dir='ltr'><em>M663-98—1</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 972 542 981 556; x_wconf 66' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_85' title='bbox 991 543 1108 569; x_wconf 89' lang='eng' dir='ltr'>(Y17280)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 243 29 287 31">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 243 29 287 31">
+     <span class='ocr_line' id='line_1_18' title="bbox 243 29 287 31; baseline 0 542"><span class='ocrx_word' id='word_1_86' title='bbox 243 29 287 31; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 284 16 288 49">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 284 16 288 49">
+     <span class='ocr_line' id='line_1_19' title="bbox 284 16 288 49; baseline 0 524"><span class='ocrx_word' id='word_1_87' title='bbox 284 16 288 49; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 243 29 245 83">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 243 29 245 83">
+     <span class='ocr_line' id='line_1_20' title="bbox 243 29 245 83; baseline 0 490"><span class='ocrx_word' id='word_1_88' title='bbox 243 29 245 83; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 333 115 335 151">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 333 115 335 151">
+     <span class='ocr_line' id='line_1_21' title="bbox 333 115 335 151; baseline 0 422"><span class='ocrx_word' id='word_1_89' title='bbox 333 115 335 151; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 452 393 500 395">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 452 393 500 395">
+     <span class='ocr_line' id='line_1_22' title="bbox 452 393 500 395; baseline 0 178"><span class='ocrx_word' id='word_1_90' title='bbox 452 393 500 395; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 499 368 501 422">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 499 368 501 422">
+     <span class='ocr_line' id='line_1_23' title="bbox 499 368 501 422; baseline 0 151"><span class='ocrx_word' id='word_1_91' title='bbox 499 368 501 422; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 390 419 571 424">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 390 419 571 424">
+     <span class='ocr_line' id='line_1_24' title="bbox 390 419 571 424; baseline 0 149"><span class='ocrx_word' id='word_1_92' title='bbox 390 419 571 424; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 452 393 454 456">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 452 393 454 456">
+     <span class='ocr_line' id='line_1_25' title="bbox 452 393 454 456; baseline 0 117"><span class='ocrx_word' id='word_1_93' title='bbox 452 393 454 456; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 354 452 572 458">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 354 452 572 458">
+     <span class='ocr_line' id='line_1_26' title="bbox 354 452 572 458; baseline 0 115"><span class='ocrx_word' id='word_1_94' title='bbox 354 452 572 458; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 390 422 392 490">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 390 422 392 490">
+     <span class='ocr_line' id='line_1_27' title="bbox 390 422 392 490; baseline 0 83"><span class='ocrx_word' id='word_1_95' title='bbox 390 422 392 490; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 0 6 581 562">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 0 6 577 562">
+     <span class='ocr_line' id='line_1_28' title="bbox 0 6 577 562; baseline 0 11"><span class='ocrx_word' id='word_1_96' title='bbox 0 6 577 562; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001990-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001990-0-000.pbm.png
new file mode 100644
index 00000000..89d57640
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001990-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001990-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001990-0-000.pbm.png.hocr
new file mode 100644
index 00000000..9d32ec7c
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.001990-0-000.pbm.png.hocr
@@ -0,0 +1,415 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.001990-0-000.pbm.png"; bbox 0 0 2603 1752; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 150 2 1132 789">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 195 6 1129 409">
+     <span class='ocr_line' id='line_1_1' title="bbox 251 6 1129 37; baseline 0 -11"><span class='ocrx_word' id='word_1_1' title='bbox 251 6 411 26; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 421 6 501 26; x_wconf 82' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 508 6 561 26; x_wconf 89' lang='eng' dir='ltr'><strong>9I2b</strong></span> <span class='ocrx_word' id='word_1_4' title='bbox 571 6 721 32; x_wconf 88' lang='eng' dir='ltr'><em>(AM942729)</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 967 12 998 37; x_wconf 76' lang='eng' dir='ltr'><em>(a)</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1010 11 1054 32; x_wconf 77' lang='eng'><em>163</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1065 12 1129 31; x_wconf 71' lang='eng' dir='ltr'><em>rRNA</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 268 53 737 79; baseline 0 -6"><span class='ocrx_word' id='word_1_8' title='bbox 268 53 427 73; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 437 53 517 73; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 524 53 577 73; x_wconf 90' lang='eng' dir='ltr'><em>9I5b</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 587 53 737 79; x_wconf 88' lang='eng' dir='ltr'><em>(AM942730)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 301 100 784 126; baseline 0 -6"><span class='ocrx_word' id='word_1_12' title='bbox 301 100 461 120; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 471 100 551 120; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 559 100 624 120; x_wconf 90' lang='eng' dir='ltr'>11/2a</span> <span class='ocrx_word' id='word_1_15' title='bbox 634 100 784 126; x_wconf 87' lang='eng' dir='ltr'><em>(AM942732)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 279 147 747 173; baseline 0 -6"><span class='ocrx_word' id='word_1_16' title='bbox 279 148 439 168; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 449 148 529 168; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 538 147 588 168; x_wconf 89' lang='eng'><em>10/6</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 598 147 747 173; x_wconf 86' lang='eng' dir='ltr'><em>(AM942731)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 282 194 750 220; baseline 0 -6"><span class='ocrx_word' id='word_1_20' title='bbox 282 195 442 215; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 452 195 532 215; x_wconf 88' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 539 194 590 215; x_wconf 85' lang='eng' dir='ltr'><em>9/2a</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 601 194 750 220; x_wconf 85' lang='eng' dir='ltr'><em>(AM942728)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 275 241 743 267; baseline -0.002 -5"><span class='ocrx_word' id='word_1_24' title='bbox 275 241 435 262; x_wconf 83' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 445 241 525 262; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 532 241 584 262; x_wconf 88' lang='eng' dir='ltr'>9/1c</span> <span class='ocrx_word' id='word_1_27' title='bbox 594 241 743 267; x_wconf 82' lang='eng' dir='ltr'><em>(AM942727)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 275 289 743 315; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 275 289 435 309; x_wconf 88' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 445 289 525 309; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 532 289 583 309; x_wconf 87' lang='eng' dir='ltr'><em>9I1a</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 594 289 743 315; x_wconf 86' lang='eng' dir='ltr'><em>(AM942726)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 276 336 744 362; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 276 336 436 356; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 446 336 526 356; x_wconf 84' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 533 336 584 356; x_wconf 86' lang='eng'>8/13</span> <span class='ocrx_word' id='word_1_35' title='bbox 594 336 744 362; x_wconf 87' lang='eng' dir='ltr'><em>(AM942725)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 195 381 729 409; baseline 0 -6"><span class='ocrx_word' id='word_1_36' title='bbox 195 383 340 403; x_wconf 85' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 349 383 420 403; x_wconf 86' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 428 383 484 403; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 494 381 580 403; x_wconf 81' lang='eng' dir='ltr'><em>22228T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 590 383 729 409; x_wconf 86' lang='eng' dir='ltr'><em>(AJ842343)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 151 428 792 550">
+     <span class='ocr_line' id='line_1_10' title="bbox 165 428 792 456; baseline 0 -6"><span class='ocrx_word' id='word_1_41' title='bbox 165 439 189 456; x_wconf 87' lang='eng'><strong>77</strong></span> <span class='ocrx_word' id='word_1_42' title='bbox 207 430 367 450; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 376 430 496 456; x_wconf 88' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 506 430 549 450; x_wconf 94' lang='eng' dir='ltr'><em>DAI</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 560 428 634 450; x_wconf 93' lang='eng' dir='ltr'><em>1-1-5T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 643 430 792 456; x_wconf 87' lang='eng' dir='ltr'><em>(AM942722)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 151 473 778 503; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 151 473 187 491; x_wconf 77' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 204 477 364 497; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 373 477 493 503; x_wconf 86' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 503 477 546 497; x_wconf 96' lang='eng' dir='ltr'><em>DAI</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 558 477 619 497; x_wconf 87' lang='eng'>1-1-4</span> <span class='ocrx_word' id='word_1_52' title='bbox 629 477 778 503; x_wconf 86' lang='eng' dir='ltr'><em>(AM942723)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 216 524 726 550; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 216 524 376 545; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 385 524 506 550; x_wconf 87' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 514 524 567 545; x_wconf 88' lang='eng' dir='ltr'>8/6b</span> <span class='ocrx_word' id='word_1_56' title='bbox 577 524 726 550; x_wconf 88' lang='eng' dir='ltr'><em>(AM942724)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 262 569 976 739">
+     <span class='ocr_line' id='line_1_13' title="bbox 340 569 976 598; baseline 0.002 -7"><span class='ocrx_word' id='word_1_57' title='bbox 340 580 365 598; x_wconf 69' lang='eng'><em>65</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 382 571 526 592; x_wconf 78' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 535 571 666 597; x_wconf 86' lang='eng' dir='ltr'><em>norvegicus</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 676 571 731 592; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 744 569 828 592; x_wconf 75' lang='eng' dir='ltr'><em>19839T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 837 571 976 597; x_wconf 86' lang='eng' dir='ltr'><em>(AJ316208)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 321 616 959 644; baseline 0 -5"><span class='ocrx_word' id='word_1_63' title='bbox 321 616 357 634; x_wconf 74' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 384 619 528 639; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 537 619 669 644; x_wconf 84' lang='eng' dir='ltr'><em>norvegicus</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 678 619 810 639; x_wconf 84' lang='eng' dir='ltr'><em>LMG19840</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 820 619 959 644; x_wconf 88' lang='eng' dir='ltr'><em>(AJ316207)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 374 666 957 692; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 374 666 518 686; x_wconf 83' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 527 666 658 691; x_wconf 83' lang='eng' dir='ltr'><em>norvegicus</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 668 666 723 686; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 736 666 807 686; x_wconf 85' lang='eng'>19842</span> <span class='ocrx_word' id='word_1_72' title='bbox 818 666 957 692; x_wconf 84' lang='eng' dir='ltr'><em>(AJ437193)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 262 711 822 739; baseline 0 -6"><span class='ocrx_word' id='word_1_73' title='bbox 262 713 406 733; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 415 713 532 733; x_wconf 83' lang='eng' dir='ltr'><em>calviensis</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 542 711 822 739; x_wconf 78' lang='eng' dir='ltr'><em>RE35F/12T(AF118021)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 352 758 876 786">
+     <span class='ocr_line' id='line_1_17' title="bbox 352 758 876 786; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 352 760 467 780; x_wconf 81' lang='eng' dir='ltr'><em>Grimontia</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 476 760 567 780; x_wconf 83' lang='eng' dir='ltr'><em>hollisae</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 577 760 633 780; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 645 758 729 780; x_wconf 82' lang='eng' dir='ltr'>17719T</span> <span class='ocrx_word' id='word_1_80' title='bbox 737 760 876 786; x_wconf 83' lang='eng' dir='ltr'><em>(AJ514909)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 1 10 765 822">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 2 10 765 822">
+     <span class='ocr_line' id='line_1_18' title="bbox 177 10 251 45; baseline 0 1707"><span class='ocrx_word' id='word_1_81' title='bbox 177 10 251 45; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 177 45 297 186; baseline 0.025 -51"><span class='ocrx_word' id='word_1_82' title='bbox 177 45 297 186; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 177 186 278 233; baseline -0.05 0"><span class='ocrx_word' id='word_1_83' title='bbox 177 186 278 233; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 37 233 275 328; baseline 0 -52"><span class='ocrx_word' id='word_1_84' title='bbox 37 233 275 328; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 16 328 272 375; baseline 0 -8"><span class='ocrx_word' id='word_1_85' title='bbox 16 328 272 375; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 11 375 192 470; baseline 0 -56"><span class='ocrx_word' id='word_1_86' title='bbox 11 375 192 470; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 16 470 151 518; baseline 0 1234"><span class='ocrx_word' id='word_1_87' title='bbox 16 470 151 518; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 16 518 212 612; baseline 0 0"><span class='ocrx_word' id='word_1_88' title='bbox 16 518 212 612; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 2 612 369 753; baseline 0 -95"><span class='ocrx_word' id='word_1_89' title='bbox 2 612 369 753; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 16 753 765 822; baseline 0 0"><span class='ocrx_word' id='word_1_90' title='bbox 16 753 765 822; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 78 55 115 73">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 78 55 115 73">
+     <span class='ocr_line' id='line_1_28' title="bbox 78 55 115 73; baseline 0.027 -1"><span class='ocrx_word' id='word_1_91' title='bbox 78 55 115 73; x_wconf 88' lang='eng'>1%</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 140 216 176 234">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 140 216 176 234">
+     <span class='ocr_line' id='line_1_29' title="bbox 140 216 176 234; baseline 0.028 -1"><span class='ocrx_word' id='word_1_92' title='bbox 140 216 176 234; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 231 950 1055 1082">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 231 953 1055 1080">
+     <span class='ocr_line' id='line_1_30' title="bbox 231 953 1055 982; baseline 0.001 -9"><span class='ocrx_word' id='word_1_93' title='bbox 231 953 394 973; x_wconf 88' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 403 953 485 973; x_wconf 90' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 494 953 545 973; x_wconf 89' lang='eng' dir='ltr'><em>10l6</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 555 953 708 979; x_wconf 83' lang='eng' dir='ltr'><em>(AM942058)</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 956 955 986 982; x_wconf 89' lang='eng' dir='ltr'><em>(c)</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 996 955 1055 981; x_wconf 82' lang='eng' dir='ltr'><em>rpoD</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 231 1003 709 1029; baseline 0.002 -6"><span class='ocrx_word' id='word_1_99' title='bbox 231 1003 394 1024; x_wconf 90' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 403 1003 485 1024; x_wconf 90' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 492 1003 546 1024; x_wconf 86' lang='eng' dir='ltr'><em>9I5b</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 556 1003 709 1029; x_wconf 84' lang='eng' dir='ltr'><em>(AM942057)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 231 1054 708 1080; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 231 1054 394 1074; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 403 1054 485 1074; x_wconf 85' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 492 1054 545 1074; x_wconf 83' lang='eng' dir='ltr'><em>9I1c</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 555 1054 708 1080; x_wconf 89' lang='eng' dir='ltr'><em>(AM942054)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 0 955 292 1724">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 1 955 292 1724">
+     <span class='ocr_line' id='line_1_33' title="bbox 220 955 230 1093; baseline 0 -51"><span class='ocrx_word' id='word_1_107' title='bbox 220 955 230 1093; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 211 1093 230 1143; baseline 0 609"><span class='ocrx_word' id='word_1_108' title='bbox 211 1093 230 1143; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 94 1143 230 1303; baseline 0 0"><span class='ocrx_word' id='word_1_109' title='bbox 94 1245 169 1303; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> <span class='ocrx_word' id='word_1_110' title='bbox 206 1143 230 1242; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 29 1303 221 1398; baseline 0 -51"><span class='ocrx_word' id='word_1_111' title='bbox 29 1303 221 1398; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 15 1398 215 1555; baseline 0 -73"><span class='ocrx_word' id='word_1_112' title='bbox 15 1398 215 1555; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 15 1555 292 1595; baseline 0 157"><span class='ocrx_word' id='word_1_113' title='bbox 15 1555 292 1595; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 1 1595 233 1652; baseline 0 100"><span class='ocrx_word' id='word_1_114' title='bbox 1 1595 233 1652; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 15 1652 252 1724; baseline 0 28"><span class='ocrx_word' id='word_1_115' title='bbox 15 1652 252 1724; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 50 982 144 985">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 50 982 144 985">
+     <span class='ocr_line' id='line_1_41' title="bbox 50 982 144 985; baseline 0 767"><span class='ocrx_word' id='word_1_116' title='bbox 50 982 144 985; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 77 992 116 1011">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 77 992 116 1011">
+     <span class='ocr_line' id='line_1_42' title="bbox 77 992 116 1011; baseline 0.026 -1"><span class='ocrx_word' id='word_1_117' title='bbox 77 992 116 1011; x_wconf 86' lang='eng'><em>5%</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 194 1090 219 1108">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 194 1090 219 1108">
+     <span class='ocr_line' id='line_1_43' title="bbox 194 1090 219 1108; baseline 0 0"><span class='ocrx_word' id='word_1_118' title='bbox 194 1090 219 1108; x_wconf 85' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 169 1101 1148 1741">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 231 1104 708 1130">
+     <span class='ocr_line' id='line_1_44' title="bbox 231 1104 708 1130; baseline 0 -5"><span class='ocrx_word' id='word_1_119' title='bbox 231 1105 394 1125; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 403 1105 485 1125; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 492 1104 545 1125; x_wconf 87' lang='eng' dir='ltr'><em>9I2a</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 555 1104 708 1130; x_wconf 85' lang='eng' dir='ltr'><em>(AM942055)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 231 1155 709 1181">
+     <span class='ocr_line' id='line_1_45' title="bbox 231 1155 709 1181; baseline 0.002 -6"><span class='ocrx_word' id='word_1_123' title='bbox 231 1155 394 1176; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 403 1155 485 1176; x_wconf 88' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 492 1155 546 1176; x_wconf 88' lang='eng' dir='ltr'><em>9I2b</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 556 1155 709 1181; x_wconf 86' lang='eng' dir='ltr'><em>(AM942056)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 231 1206 708 1232">
+     <span class='ocr_line' id='line_1_46' title="bbox 231 1206 708 1232; baseline 0 -5"><span class='ocrx_word' id='word_1_127' title='bbox 231 1206 394 1227; x_wconf 89' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 403 1206 485 1227; x_wconf 88' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 492 1206 545 1227; x_wconf 87' lang='eng' dir='ltr'><em>9I1a</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 555 1206 708 1232; x_wconf 87' lang='eng' dir='ltr'><em>(AM942053)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 169 1257 708 1288">
+     <span class='ocr_line' id='line_1_47' title="bbox 169 1257 708 1288; baseline 0.002 -11"><span class='ocrx_word' id='word_1_131' title='bbox 169 1270 207 1288; x_wconf 69' lang='eng'>100</span> <span class='ocrx_word' id='word_1_132' title='bbox 231 1257 394 1278; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 403 1257 485 1278; x_wconf 85' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 493 1257 545 1278; x_wconf 85' lang='eng'>8/13</span> <span class='ocrx_word' id='word_1_135' title='bbox 555 1257 708 1283; x_wconf 87' lang='eng' dir='ltr'><em>(AM942052)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 222 1307 714 1334">
+     <span class='ocr_line' id='line_1_48' title="bbox 222 1307 714 1334; baseline 0 -6"><span class='ocrx_word' id='word_1_136' title='bbox 222 1308 385 1328; x_wconf 85' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 395 1308 476 1328; x_wconf 86' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 485 1307 551 1328; x_wconf 71' lang='eng'>11/23</span> <span class='ocrx_word' id='word_1_139' title='bbox 561 1307 714 1334; x_wconf 85' lang='eng' dir='ltr'><em>(AM942059)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 217 1356 755 1435">
+     <span class='ocr_line' id='line_1_49' title="bbox 223 1356 755 1384; baseline 0 -6"><span class='ocrx_word' id='word_1_140' title='bbox 223 1358 370 1379; x_wconf 76' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 380 1358 452 1379; x_wconf 81' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 460 1358 526 1379; x_wconf 94' lang='eng' dir='ltr'><em>CAIM</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 537 1356 594 1379; x_wconf 88' lang='eng' dir='ltr'><em>912T</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 604 1358 755 1384; x_wconf 84' lang='eng' dir='ltr'><em>(AM942051)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 217 1408 737 1435; baseline 0 -6"><span class='ocrx_word' id='word_1_145' title='bbox 217 1409 380 1429; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 389 1409 512 1435; x_wconf 87' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 521 1408 575 1429; x_wconf 85' lang='eng' dir='ltr'>8/6b</span> <span class='ocrx_word' id='word_1_148' title='bbox 585 1408 737 1435; x_wconf 89' lang='eng' dir='ltr'><em>(AM942050)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 216 1459 801 1485">
+     <span class='ocr_line' id='line_1_51' title="bbox 216 1459 801 1485; baseline 0 -6"><span class='ocrx_word' id='word_1_149' title='bbox 216 1459 379 1480; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 388 1459 511 1485; x_wconf 86' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 521 1459 564 1479; x_wconf 96' lang='eng' dir='ltr'><em>DAI</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 576 1459 639 1479; x_wconf 91' lang='eng'>1-1-4</span> <span class='ocrx_word' id='word_1_153' title='bbox 649 1459 801 1485; x_wconf 85' lang='eng' dir='ltr'><em>(AM942049)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 179 1500 911 1689">
+     <span class='ocr_line' id='line_1_52' title="bbox 179 1500 812 1537; baseline 0 -6"><span class='ocrx_word' id='word_1_154' title='bbox 179 1500 204 1519; x_wconf 77' lang='eng'>99</span> <span class='ocrx_word' id='word_1_155' title='bbox 216 1510 379 1531; x_wconf 88' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 388 1510 511 1537; x_wconf 86' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 521 1510 564 1531; x_wconf 93' lang='eng' dir='ltr'><em>DAI</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 576 1508 651 1531; x_wconf 81' lang='eng' dir='ltr'><em>1-1-5T</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 660 1510 812 1537; x_wconf 83' lang='eng' dir='ltr'><em>(AM942048)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 296 1559 911 1587; baseline 0 -6"><span class='ocrx_word' id='word_1_160' title='bbox 296 1561 443 1582; x_wconf 81' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 452 1561 586 1587; x_wconf 83' lang='eng' dir='ltr'><em>norvegicus</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 595 1561 669 1582; x_wconf 86' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 678 1559 750 1582; x_wconf 74' lang='eng' dir='ltr'><em>7288T</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 760 1561 911 1587; x_wconf 84' lang='eng' dir='ltr'><em>(AM942062)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 233 1609 835 1638; baseline 0 -6"><span class='ocrx_word' id='word_1_165' title='bbox 233 1612 380 1632; x_wconf 79' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 389 1612 509 1632; x_wconf 83' lang='eng' dir='ltr'><em>calviensis</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 518 1611 577 1632; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 589 1609 675 1632; x_wconf 85' lang='eng' dir='ltr'><em>14347T</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 685 1611 835 1638; x_wconf 84' lang='eng' dir='ltr'><em>(AM942047)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 254 1660 799 1689; baseline 0 -6"><span class='ocrx_word' id='word_1_170' title='bbox 254 1662 372 1683; x_wconf 80' lang='eng' dir='ltr'><em>Grimontia</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 381 1662 474 1683; x_wconf 87' lang='eng' dir='ltr'><em>hollisae</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 483 1662 557 1683; x_wconf 92' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 567 1660 638 1683; x_wconf 80' lang='eng' dir='ltr'><em>5069T</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 649 1662 799 1689; x_wconf 86' lang='eng' dir='ltr'><em>(AM942061)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 657 1711 1148 1739">
+     <span class='ocr_line' id='line_1_56' title="bbox 657 1711 1148 1739; baseline 0 -6"><span class='ocrx_word' id='word_1_175' title='bbox 657 1713 724 1733; x_wconf 90' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 733 1713 838 1733; x_wconf 87' lang='eng' dir='ltr'><em>cholerae</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 847 1713 922 1733; x_wconf 91' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 931 1711 988 1733; x_wconf 93' lang='eng' dir='ltr'><em>514T</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 998 1713 1148 1739; x_wconf 83' lang='eng' dir='ltr'><em>(AM942060)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 185 1191 210 1209">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 185 1191 210 1209">
+     <span class='ocr_line' id='line_1_57' title="bbox 185 1191 210 1209; baseline 0 0"><span class='ocrx_word' id='word_1_180' title='bbox 185 1191 210 1209; x_wconf 82' lang='eng'><em>76</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 19 1717 650 1725">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 19 1717 650 1725">
+     <span class='ocr_line' id='line_1_58' title="bbox 19 1717 650 1725; baseline 0 27"><span class='ocrx_word' id='word_1_181' title='bbox 19 1717 650 1725; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 771 805 1216 835">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 771 805 1216 833">
+     <span class='ocr_line' id='line_1_59' title="bbox 771 805 1216 833; baseline 0 -6"><span class='ocrx_word' id='word_1_182' title='bbox 771 807 837 827; x_wconf 73' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 846 807 950 827; x_wconf 88' lang='eng' dir='ltr'><em>cholerae</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 959 807 1031 827; x_wconf 90' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 1041 805 1096 827; x_wconf 90' lang='eng' dir='ltr'><em>514T</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 1106 807 1216 833; x_wconf 85' lang='eng' dir='ltr'><em>(X76337)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 1575 0 2482 837">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 1630 0 2479 82">
+     <span class='ocr_line' id='line_1_60' title="bbox 1630 0 2479 38; baseline 0 -13"><span class='ocrx_word' id='word_1_187' title='bbox 1630 3 1794 26; x_wconf 79' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 1805 3 1886 26; x_wconf 91' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 1895 3 1969 26; x_wconf 94' lang='eng' dir='ltr'><em>CAIM</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 1981 0 2045 26; x_wconf 87' lang='eng' dir='ltr'><em>912T</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 2056 2 2225 32; x_wconf 84' lang='eng' dir='ltr'><em>(AM942063)</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 2371 9 2406 38; x_wconf 77' lang='eng' dir='ltr'><em>(b)</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 2417 9 2479 32; x_wconf 69' lang='eng' dir='ltr'><em>recA</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 1635 53 2169 82; baseline 0 -7"><span class='ocrx_word' id='word_1_194' title='bbox 1635 53 1818 76; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 1829 53 1920 76; x_wconf 89' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 1929 53 1987 76; x_wconf 87' lang='eng'>8/13</span> <span class='ocrx_word' id='word_1_197' title='bbox 1998 53 2169 82; x_wconf 89' lang='eng' dir='ltr'><em>(AM942064)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 1635 102 2169 132">
+     <span class='ocr_line' id='line_1_62' title="bbox 1635 102 2169 132; baseline 0.002 -7"><span class='ocrx_word' id='word_1_198' title='bbox 1635 103 1818 126; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 1829 103 1920 126; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 1928 102 1987 126; x_wconf 86' lang='eng' dir='ltr'>9/1a</span> <span class='ocrx_word' id='word_1_201' title='bbox 1998 102 2169 132; x_wconf 88' lang='eng' dir='ltr'><em>(AM942065)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 1635 152 2169 182">
+     <span class='ocr_line' id='line_1_63' title="bbox 1635 152 2169 182; baseline 0.002 -7"><span class='ocrx_word' id='word_1_202' title='bbox 1635 153 1818 176; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_203' title='bbox 1829 153 1920 176; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_204' title='bbox 1928 152 1987 176; x_wconf 87' lang='eng' dir='ltr'><em>9/2a</em></span> <span class='ocrx_word' id='word_1_205' title='bbox 1998 152 2169 182; x_wconf 88' lang='eng' dir='ltr'><em>(AM942066)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 1635 202 2171 232">
+     <span class='ocr_line' id='line_1_64' title="bbox 1635 202 2171 232; baseline 0.002 -7"><span class='ocrx_word' id='word_1_206' title='bbox 1635 203 1818 226; x_wconf 89' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_207' title='bbox 1829 203 1920 226; x_wconf 90' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 1928 202 1989 226; x_wconf 87' lang='eng' dir='ltr'><em>9/2b</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 2000 202 2171 232; x_wconf 86' lang='eng' dir='ltr'><em>(AM942068)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 1575 247 2169 282">
+     <span class='ocr_line' id='line_1_65' title="bbox 1575 247 2169 282; baseline 0 -6"><span class='ocrx_word' id='word_1_210' title='bbox 1575 247 1617 266; x_wconf 81' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 1635 253 1818 276; x_wconf 90' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_212' title='bbox 1829 253 1920 276; x_wconf 88' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_213' title='bbox 1928 253 1987 276; x_wconf 85' lang='eng' dir='ltr'><em>9I1c</em></span> <span class='ocrx_word' id='word_1_214' title='bbox 1998 253 2169 282; x_wconf 86' lang='eng' dir='ltr'><em>(AM942067)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 1635 303 2171 333">
+     <span class='ocr_line' id='line_1_66' title="bbox 1635 303 2171 333; baseline 0 -7"><span class='ocrx_word' id='word_1_215' title='bbox 1635 303 1818 326; x_wconf 89' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_216' title='bbox 1829 303 1920 326; x_wconf 88' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_217' title='bbox 1928 303 1989 326; x_wconf 87' lang='eng' dir='ltr'><em>9l5b</em></span> <span class='ocrx_word' id='word_1_218' title='bbox 2000 303 2171 333; x_wconf 86' lang='eng' dir='ltr'><em>(AM942069)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 1635 353 2169 383">
+     <span class='ocr_line' id='line_1_67' title="bbox 1635 353 2169 383; baseline 0 -7"><span class='ocrx_word' id='word_1_219' title='bbox 1635 354 1818 376; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_220' title='bbox 1829 354 1920 376; x_wconf 85' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_221' title='bbox 1930 353 1987 376; x_wconf 91' lang='eng' dir='ltr'><em>10l6</em></span> <span class='ocrx_word' id='word_1_222' title='bbox 1998 353 2169 383; x_wconf 90' lang='eng' dir='ltr'><em>(AM942070)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 1635 403 2187 433">
+     <span class='ocr_line' id='line_1_68' title="bbox 1635 403 2187 433; baseline 0 -7"><span class='ocrx_word' id='word_1_223' title='bbox 1635 403 1818 426; x_wconf 88' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_224' title='bbox 1829 403 1920 426; x_wconf 88' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_225' title='bbox 1930 403 2004 426; x_wconf 87' lang='eng' dir='ltr'>11l2a</span> <span class='ocrx_word' id='word_1_226' title='bbox 2016 403 2187 433; x_wconf 84' lang='eng' dir='ltr'><em>(AM942071)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 1640 451 2395 734">
+     <span class='ocr_line' id='line_1_69' title="bbox 1656 451 2395 483; baseline 0.001 -7"><span class='ocrx_word' id='word_1_227' title='bbox 1656 463 1685 483; x_wconf 75' lang='eng'><em>63</em></span> <span class='ocrx_word' id='word_1_228' title='bbox 1706 454 1870 477; x_wconf 83' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_229' title='bbox 1881 454 2031 483; x_wconf 86' lang='eng' dir='ltr'><em>norvegicus</em></span> <span class='ocrx_word' id='word_1_230' title='bbox 2041 453 2124 477; x_wconf 91' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_231' title='bbox 2134 451 2215 477; x_wconf 90' lang='eng' dir='ltr'><em>7288T</em></span> <span class='ocrx_word' id='word_1_232' title='bbox 2226 453 2395 483; x_wconf 86' lang='eng' dir='ltr'><em>(AM942075)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_70' title="bbox 1640 502 2308 533; baseline 0.001 -7"><span class='ocrx_word' id='word_1_233' title='bbox 1640 502 1681 522; x_wconf 81' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_234' title='bbox 1703 504 1868 527; x_wconf 81' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_235' title='bbox 1878 504 2028 533; x_wconf 84' lang='eng' dir='ltr'><em>norvegicus</em></span> <span class='ocrx_word' id='word_1_236' title='bbox 2040 504 2138 527; x_wconf 86' lang='eng' dir='ltr'><em>R-3717</em></span> <span class='ocrx_word' id='word_1_237' title='bbox 2150 503 2308 533; x_wconf 89' lang='eng' dir='ltr'><em>(AJ842350)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 1702 553 2368 583; baseline 0.002 -7"><span class='ocrx_word' id='word_1_238' title='bbox 1702 554 1867 577; x_wconf 81' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_239' title='bbox 1877 554 2027 583; x_wconf 89' lang='eng' dir='ltr'><em>norvegicus</em></span> <span class='ocrx_word' id='word_1_240' title='bbox 2038 553 2102 577; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_241' title='bbox 2116 554 2198 577; x_wconf 88' lang='eng'><em>19840</em></span> <span class='ocrx_word' id='word_1_242' title='bbox 2210 553 2368 583; x_wconf 87' lang='eng' dir='ltr'><em>(AJ842349)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_72' title="bbox 1692 602 2368 633; baseline 0 -6"><span class='ocrx_word' id='word_1_243' title='bbox 1692 604 1857 627; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_244' title='bbox 1868 604 2001 627; x_wconf 86' lang='eng' dir='ltr'><em>calviensis</em></span> <span class='ocrx_word' id='word_1_245' title='bbox 2012 604 2078 627; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_246' title='bbox 2091 602 2188 627; x_wconf 89' lang='eng' dir='ltr'><em>14347T</em></span> <span class='ocrx_word' id='word_1_247' title='bbox 2198 604 2368 633; x_wconf 86' lang='eng' dir='ltr'><em>(AM942077)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_73' title="bbox 1658 654 2241 684; baseline 0 -7"><span class='ocrx_word' id='word_1_248' title='bbox 1658 655 1840 678; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_249' title='bbox 1851 655 1988 684; x_wconf 89' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_250' title='bbox 1998 654 2059 678; x_wconf 89' lang='eng' dir='ltr'><em>8/6b</em></span> <span class='ocrx_word' id='word_1_251' title='bbox 2070 654 2241 684; x_wconf 87' lang='eng' dir='ltr'><em>(AM942074)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_74' title="bbox 1683 704 2339 734; baseline 0 -7"><span class='ocrx_word' id='word_1_252' title='bbox 1683 705 1865 727; x_wconf 88' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_253' title='bbox 1876 705 2013 734; x_wconf 89' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_254' title='bbox 2024 705 2074 727; x_wconf 96' lang='eng' dir='ltr'><em>DAI</em></span> <span class='ocrx_word' id='word_1_255' title='bbox 2087 705 2157 727; x_wconf 97' lang='eng'>1-1-4</span> <span class='ocrx_word' id='word_1_256' title='bbox 2168 704 2339 734; x_wconf 86' lang='eng' dir='ltr'><em>(AM942073)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 1625 749 2352 834">
+     <span class='ocr_line' id='line_1_75' title="bbox 1625 749 2352 784; baseline 0 -7"><span class='ocrx_word' id='word_1_257' title='bbox 1625 749 1667 769; x_wconf 79' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_258' title='bbox 1683 755 1865 777; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_259' title='bbox 1876 755 2013 784; x_wconf 90' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_260' title='bbox 2024 755 2074 777; x_wconf 94' lang='eng' dir='ltr'><em>DAI</em></span> <span class='ocrx_word' id='word_1_261' title='bbox 2087 752 2171 777; x_wconf 92' lang='eng' dir='ltr'><em>1-1-5T</em></span> <span class='ocrx_word' id='word_1_262' title='bbox 2181 754 2352 784; x_wconf 90' lang='eng' dir='ltr'><em>(AM942072)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_76' title="bbox 1728 802 2339 834; baseline 0 -7"><span class='ocrx_word' id='word_1_263' title='bbox 1728 804 1860 827; x_wconf 76' lang='eng' dir='ltr'><em>Grimontia</em></span> <span class='ocrx_word' id='word_1_264' title='bbox 1870 805 1974 827; x_wconf 89' lang='eng' dir='ltr'><em>hollisae</em></span> <span class='ocrx_word' id='word_1_265' title='bbox 1985 804 2068 827; x_wconf 90' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_266' title='bbox 2079 802 2159 827; x_wconf 83' lang='eng' dir='ltr'><em>5069T</em></span> <span class='ocrx_word' id='word_1_267' title='bbox 2170 804 2339 834; x_wconf 88' lang='eng' dir='ltr'><em>(AM942076)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 1315 8 2039 871">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 1318 8 2039 871">
+     <span class='ocr_line' id='line_1_77' title="bbox 1577 8 1630 48; baseline 0 1704"><span class='ocrx_word' id='word_1_268' title='bbox 1577 8 1630 48; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_78' title="bbox 1415 48 1631 96; baseline 0 1656"><span class='ocrx_word' id='word_1_269' title='bbox 1415 48 1631 96; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_79' title="bbox 1415 96 1631 197; baseline 0 0"><span class='ocrx_word' id='word_1_270' title='bbox 1415 96 1631 197; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_80' title="bbox 1415 197 1631 247; baseline 0 0"><span class='ocrx_word' id='word_1_271' title='bbox 1415 197 1631 247; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_81' title="bbox 1383 247 1575 299; baseline 0 1453"><span class='ocrx_word' id='word_1_272' title='bbox 1383 247 1575 299; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_82' title="bbox 1380 299 1631 398; baseline 0 0"><span class='ocrx_word' id='word_1_273' title='bbox 1380 299 1631 398; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_83' title="bbox 1383 398 1631 448; baseline 0 1304"><span class='ocrx_word' id='word_1_274' title='bbox 1383 398 1631 448; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_84' title="bbox 1347 448 1631 499; baseline 0 1253"><span class='ocrx_word' id='word_1_275' title='bbox 1347 448 1631 499; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_85' title="bbox 1335 499 1698 598; baseline 0 -11"><span class='ocrx_word' id='word_1_276' title='bbox 1335 499 1698 598; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_86' title="bbox 1318 598 1688 648; baseline 0 -9"><span class='ocrx_word' id='word_1_277' title='bbox 1318 598 1688 648; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_87' title="bbox 1318 648 1679 749; baseline 0 -50"><span class='ocrx_word' id='word_1_278' title='bbox 1318 648 1679 749; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_88' title="bbox 1335 749 1625 801; baseline 0 951"><span class='ocrx_word' id='word_1_279' title='bbox 1335 749 1625 801; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_89' title="bbox 1335 801 2039 871; baseline 0 0"><span class='ocrx_word' id='word_1_280' title='bbox 1335 801 2039 871; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 1400 29 1444 49">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 1400 29 1444 49">
+     <span class='ocr_line' id='line_1_90' title="bbox 1400 29 1444 49; baseline 0 0"><span class='ocrx_word' id='word_1_281' title='bbox 1400 29 1444 49; x_wconf 85' lang='eng'>5%</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 1728 979 2036 1002">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 1728 981 2036 1001">
+     <span class='ocr_line' id='line_1_91' title="bbox 1728 981 2036 1001; baseline 0 0"><span class='ocrx_word' id='word_1_282' title='bbox 1728 981 1887 1001; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_283' title='bbox 1897 981 1977 1001; x_wconf 80' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_284' title='bbox 1984 981 2036 1001; x_wconf 83' lang='eng'>8/13</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 1365 986 2265 1744">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 1367 986 2265 1744">
+     <span class='ocr_line' id='line_1_92' title="bbox 1713 986 1724 1071; baseline 0 -10"><span class='ocrx_word' id='word_1_285' title='bbox 1713 986 1724 1071; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_93' title="bbox 1713 1071 1724 1118; baseline 0 0"><span class='ocrx_word' id='word_1_286' title='bbox 1713 1071 1724 1118; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_94' title="bbox 1702 1162 1725 1208; baseline 0 -38"><span class='ocrx_word' id='word_1_287' title='bbox 1702 1162 1725 1208; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_95' title="bbox 1487 1265 1725 1320; baseline 0 0"><span class='ocrx_word' id='word_1_288' title='bbox 1487 1265 1725 1320; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_96' title="bbox 1426 1320 1712 1366; baseline 0 -6"><span class='ocrx_word' id='word_1_289' title='bbox 1426 1320 1712 1366; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_97' title="bbox 1383 1366 1708 1472; baseline 0 -61"><span class='ocrx_word' id='word_1_290' title='bbox 1383 1366 1708 1472; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_98' title="bbox 1383 1472 1731 1518; baseline 0 -1"><span class='ocrx_word' id='word_1_291' title='bbox 1383 1472 1731 1518; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_99' title="bbox 1383 1518 1727 1568; baseline 0 184"><span class='ocrx_word' id='word_1_292' title='bbox 1383 1518 1727 1568; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_100' title="bbox 1367 1568 1796 1617; baseline 0.002 -1"><span class='ocrx_word' id='word_1_293' title='bbox 1367 1568 1796 1617; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_101' title="bbox 1367 1617 1775 1665; baseline 0.012 -5"><span class='ocrx_word' id='word_1_294' title='bbox 1367 1617 1775 1665; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_102' title="bbox 1383 1665 2265 1744; baseline 0 -34"><span class='ocrx_word' id='word_1_295' title='bbox 1383 1665 2265 1744; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 1523 1029 2245 1651">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 1523 1031 2039 1350">
+     <span class='ocr_line' id='line_1_103' title="bbox 1523 1031 2035 1067; baseline 0 -16"><span class='ocrx_word' id='word_1_296' title='bbox 1523 1050 1534 1067; x_wconf 77' lang='eng'>5</span> <span class='ocrx_word' id='word_1_297' title='bbox 1543 1049 1562 1067; x_wconf 80' lang='eng'>%</span> <span class='ocrx_word' id='word_1_298' title='bbox 1728 1031 1887 1051; x_wconf 89' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_299' title='bbox 1897 1031 1977 1051; x_wconf 89' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_300' title='bbox 1984 1031 2035 1051; x_wconf 85' lang='eng' dir='ltr'><em>9I2a</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_104' title="bbox 1728 1081 2037 1101; baseline 0 0"><span class='ocrx_word' id='word_1_301' title='bbox 1728 1081 1887 1101; x_wconf 89' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_302' title='bbox 1897 1081 1977 1101; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_303' title='bbox 1984 1081 2037 1101; x_wconf 86' lang='eng' dir='ltr'><em>9I2b</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_105' title="bbox 1675 1129 2036 1151; baseline 0.014 -5"><span class='ocrx_word' id='word_1_304' title='bbox 1675 1129 1712 1147; x_wconf 87' lang='eng'>100</span> <span class='ocrx_word' id='word_1_305' title='bbox 1728 1131 1887 1151; x_wconf 90' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_306' title='bbox 1897 1131 1977 1151; x_wconf 89' lang='eng' dir='ltr'><strong><em>coralii</em></strong></span> <span class='ocrx_word' id='word_1_307' title='bbox 1985 1130 2036 1151; x_wconf 87' lang='eng' dir='ltr'><em>10l6</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_106' title="bbox 1729 1180 2036 1201; baseline 0 0"><span class='ocrx_word' id='word_1_308' title='bbox 1729 1180 1889 1201; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_309' title='bbox 1898 1180 1978 1201; x_wconf 86' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_310' title='bbox 1985 1180 2036 1201; x_wconf 89' lang='eng' dir='ltr'>9/1a</span> 
+     </span>
+     <span class='ocr_line' id='line_1_107' title="bbox 1664 1222 2037 1251; baseline 0.003 -1"><span class='ocrx_word' id='word_1_311' title='bbox 1664 1222 1700 1239; x_wconf 62' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_312' title='bbox 1729 1230 1889 1251; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_313' title='bbox 1898 1230 1978 1251; x_wconf 88' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_314' title='bbox 1985 1230 2037 1251; x_wconf 85' lang='eng' dir='ltr'>9/1c</span> 
+     </span>
+     <span class='ocr_line' id='line_1_108' title="bbox 1636 1280 2038 1311; baseline 0.002 -11"><span class='ocrx_word' id='word_1_315' title='bbox 1636 1293 1672 1311; x_wconf 71' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_316' title='bbox 1729 1280 1889 1301; x_wconf 85' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_317' title='bbox 1898 1280 1978 1301; x_wconf 85' lang='eng' dir='ltr'><strong><em>coralii</em></strong></span> <span class='ocrx_word' id='word_1_318' title='bbox 1985 1280 2038 1301; x_wconf 88' lang='eng' dir='ltr'>9/5b</span> 
+     </span>
+     <span class='ocr_line' id='line_1_109' title="bbox 1717 1330 2039 1350; baseline 0 0"><span class='ocrx_word' id='word_1_319' title='bbox 1717 1330 1876 1350; x_wconf 87' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_320' title='bbox 1886 1330 1966 1350; x_wconf 87' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_321' title='bbox 1974 1330 2039 1350; x_wconf 88' lang='eng' dir='ltr'>11l2a</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 1713 1377 2075 1400">
+     <span class='ocr_line' id='line_1_110' title="bbox 1713 1377 2075 1400; baseline 0 0"><span class='ocrx_word' id='word_1_322' title='bbox 1713 1380 1857 1400; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_323' title='bbox 1866 1380 1937 1400; x_wconf 80' lang='eng' dir='ltr'><em>coralii</em></span> <span class='ocrx_word' id='word_1_324' title='bbox 1944 1379 2009 1400; x_wconf 91' lang='eng' dir='ltr'><em>CAIM</em></span> <span class='ocrx_word' id='word_1_325' title='bbox 2020 1377 2075 1400; x_wconf 82' lang='eng' dir='ltr'><em>912T</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 1684 1427 2161 1555">
+     <span class='ocr_line' id='line_1_111' title="bbox 1684 1427 2161 1457; baseline 0 -8"><span class='ocrx_word' id='word_1_326' title='bbox 1684 1440 1720 1457; x_wconf 73' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_327' title='bbox 1736 1430 1895 1450; x_wconf 84' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_328' title='bbox 1904 1430 2024 1455; x_wconf 83' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_329' title='bbox 2034 1430 2077 1449; x_wconf 96' lang='eng' dir='ltr'><em>DAI</em></span> <span class='ocrx_word' id='word_1_330' title='bbox 2088 1427 2161 1450; x_wconf 76' lang='eng' dir='ltr'><em>1-1-5T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_112' title="bbox 1736 1479 2149 1505; baseline 0 -6"><span class='ocrx_word' id='word_1_331' title='bbox 1736 1479 1895 1499; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_332' title='bbox 1904 1479 2024 1505; x_wconf 88' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_333' title='bbox 2034 1479 2077 1499; x_wconf 94' lang='eng' dir='ltr'><em>DAI</em></span> <span class='ocrx_word' id='word_1_334' title='bbox 2088 1479 2149 1499; x_wconf 91' lang='eng'>1-1-4</span> 
+     </span>
+     <span class='ocr_line' id='line_1_113' title="bbox 1727 1529 2076 1555; baseline 0.003 -6"><span class='ocrx_word' id='word_1_335' title='bbox 1727 1530 1886 1550; x_wconf 83' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_336' title='bbox 1895 1530 2015 1555; x_wconf 88' lang='eng' dir='ltr'><em>nigricans</em></span> <span class='ocrx_word' id='word_1_337' title='bbox 2024 1529 2076 1550; x_wconf 83' lang='eng' dir='ltr'>8/6b</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 1717 1577 2244 1649">
+     <span class='ocr_line' id='line_1_114' title="bbox 1800 1577 2244 1604; baseline 0 -5"><span class='ocrx_word' id='word_1_338' title='bbox 1800 1579 1944 1599; x_wconf 74' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_339' title='bbox 1953 1579 2084 1604; x_wconf 83' lang='eng' dir='ltr'><em>norvegicus</em></span> <span class='ocrx_word' id='word_1_340' title='bbox 2092 1579 2164 1599; x_wconf 91' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_341' title='bbox 2174 1577 2244 1599; x_wconf 79' lang='eng' dir='ltr'><em>7288T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_115' title="bbox 1717 1627 2149 1649; baseline 0 0"><span class='ocrx_word' id='word_1_342' title='bbox 1717 1629 1861 1649; x_wconf 86' lang='eng' dir='ltr'><em>Enterovibrio</em></span> <span class='ocrx_word' id='word_1_343' title='bbox 1870 1629 1987 1649; x_wconf 86' lang='eng' dir='ltr'><em>calviensis</em></span> <span class='ocrx_word' id='word_1_344' title='bbox 1996 1629 2053 1649; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_345' title='bbox 2066 1627 2149 1649; x_wconf 81' lang='eng' dir='ltr'><em>14347T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 1781 1676 2157 1701">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 1781 1676 2157 1699">
+     <span class='ocr_line' id='line_1_116' title="bbox 1781 1676 2157 1699; baseline 0 0"><span class='ocrx_word' id='word_1_346' title='bbox 1781 1678 1895 1699; x_wconf 78' lang='eng' dir='ltr'><em>Grimontia</em></span> <span class='ocrx_word' id='word_1_347' title='bbox 1905 1679 1995 1699; x_wconf 82' lang='eng' dir='ltr'><em>hollisae</em></span> <span class='ocrx_word' id='word_1_348' title='bbox 2005 1678 2077 1699; x_wconf 89' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_349' title='bbox 2086 1676 2157 1699; x_wconf 82' lang='eng' dir='ltr'><em>5069T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 2045 851 2596 886">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 2045 852 2596 884">
+     <span class='ocr_line' id='line_1_117' title="bbox 2045 852 2596 884; baseline 0 -7"><span class='ocrx_word' id='word_1_350' title='bbox 2045 855 2120 878; x_wconf 90' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_351' title='bbox 2131 855 2249 878; x_wconf 84' lang='eng' dir='ltr'><em>cholerae</em></span> <span class='ocrx_word' id='word_1_352' title='bbox 2259 854 2343 878; x_wconf 92' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_353' title='bbox 2353 852 2416 878; x_wconf 92' lang='eng' dir='ltr'><em>514T</em></span> <span class='ocrx_word' id='word_1_354' title='bbox 2427 854 2596 884; x_wconf 86' lang='eng' dir='ltr'><em>(AM942078)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 2239 992 2545 1021">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 2239 994 2545 1020">
+     <span class='ocr_line' id='line_1_118' title="bbox 2239 994 2545 1020; baseline 0 -6"><span class='ocrx_word' id='word_1_355' title='bbox 2239 994 2270 1020; x_wconf 89' lang='eng' dir='ltr'><em>(d)</em></span> <span class='ocrx_word' id='word_1_356' title='bbox 2280 994 2447 1014; x_wconf 84' lang='eng' dir='ltr'><em>Concatenated</em></span> <span class='ocrx_word' id='word_1_357' title='bbox 2457 994 2545 1014; x_wconf 84' lang='eng' dir='ltr'><em>dataset</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 2272 1726 2595 1750">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 2272 1726 2595 1749">
+     <span class='ocr_line' id='line_1_119' title="bbox 2272 1726 2595 1749; baseline 0.003 -1"><span class='ocrx_word' id='word_1_358' title='bbox 2272 1729 2337 1749; x_wconf 87' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_359' title='bbox 2347 1729 2449 1749; x_wconf 84' lang='eng' dir='ltr'><em>cholerae</em></span> <span class='ocrx_word' id='word_1_360' title='bbox 2458 1728 2531 1749; x_wconf 88' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_361' title='bbox 2540 1726 2595 1749; x_wconf 92' lang='eng' dir='ltr'><em>514T</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-000.pbm.png
new file mode 100644
index 00000000..d97215f8
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-000.pbm.png.hocr
new file mode 100644
index 00000000..36720599
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-000.pbm.png.hocr
@@ -0,0 +1,153 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002048-0-000.pbm.png"; bbox 0 0 1539 533; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 277 1 1538 265">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 407 1 1255 78">
+     <span class='ocr_line' id='line_1_1' title="bbox 407 1 1201 31; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 407 10 469 12; x_wconf 90' lang='eng'>—</span> <span class='ocrx_word' id='word_1_2' title='bbox 482 2 728 31; x_wconf 83' lang='eng' dir='ltr'><em>Sporolactobacillus</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 737 2 866 25; x_wconf 84' lang='eng' dir='ltr'><em>kofuensis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 876 2 936 25; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 948 1 1028 25; x_wconf 79' lang='eng' dir='ltr'><em>3419T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1039 3 1201 31; x_wconf 77' lang='eng' dir='ltr'><em>(ABS74517)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 407 47 1255 78; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 407 57 470 59; x_wconf 91' lang='eng'>—</span> <span class='ocrx_word' id='word_1_8' title='bbox 482 49 728 78; x_wconf 82' lang='eng' dir='ltr'><em>Sporo/actobacil/us</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 737 49 912 72; x_wconf 81' lang='eng' dir='ltr'><em>laevo/acticus</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 924 49 973 72; x_wconf 92' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 987 47 1083 72; x_wconf 89' lang='eng' dir='ltr'><em>12321T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1094 49 1255 78; x_wconf 89' lang='eng' dir='ltr'><em>(AB374516)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 277 94 1538 265">
+     <span class='ocr_line' id='line_1_3' title="bbox 449 94 1538 152; baseline 0 -34"><span class='ocrx_word' id='word_1_13' title='bbox 449 98 510 152; x_wconf 69' lang='eng'><em>100[</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 523 95 769 124; x_wconf 82' lang='eng' dir='ltr'><em>Sporo/actobacil/us</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 779 95 936 124; x_wconf 85' lang='eng' dir='ltr'><em>nakayamae</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 946 95 1033 124; x_wconf 84' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_17' title='bbox 1046 95 1203 124; x_wconf 87' lang='eng' dir='ltr'><em>nakayamae</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1213 95 1273 118; x_wconf 89' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1285 94 1366 118; x_wconf 89' lang='eng' dir='ltr'><em>3514T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1376 95 1538 124; x_wconf 88' lang='eng' dir='ltr'><em>(AB374518)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 277 140 1516 178; baseline 0 -13"><span class='ocrx_word' id='word_1_21' title='bbox 277 158 304 178; x_wconf 71' lang='eng'><em>76</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 387 162 398 164; x_wconf 95' lang='eng'>_</span> <span class='ocrx_word' id='word_1_23' title='bbox 521 142 767 171; x_wconf 82' lang='eng' dir='ltr'><em>Sporolactobacillus</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 776 142 933 171; x_wconf 88' lang='eng' dir='ltr'><em>nakayamae</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 944 148 973 165; x_wconf 84' lang='eng' dir='ltr'><em>su</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 978 142 1030 171; x_wconf 86' lang='eng' dir='ltr'><em>bsp.</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1044 142 1182 165; x_wconf 84' lang='eng' dir='ltr'><em>racemicus</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1191 142 1252 165; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1263 140 1344 165; x_wconf 81' lang='eng' dir='ltr'><em>3417T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1355 142 1516 171; x_wconf 86' lang='eng' dir='ltr'><em>(AB374519)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 400 187 1153 217; baseline -0.001 -5"><span class='ocrx_word' id='word_1_31' title='bbox 400 197 471 199; x_wconf 91' lang='eng'>—</span> <span class='ocrx_word' id='word_1_32' title='bbox 484 188 730 217; x_wconf 85' lang='eng' dir='ltr'><em>Sporolactobaci/Ius</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 740 189 818 212; x_wconf 82' lang='eng' dir='ltr'><em>terrae</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 828 188 888 212; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 900 187 981 212; x_wconf 80' lang='eng' dir='ltr'><em>3516T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 991 189 1153 217; x_wconf 71' lang='eng' dir='ltr'><em>(ABs74520)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 632 234 1344 265; baseline 0 -7"><span class='ocrx_word' id='word_1_37' title='bbox 632 235 904 265; x_wconf 85' lang='eng' dir='ltr'><em>Sporolactobacillus</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 912 236 1024 265; x_wconf 81' lang='eng' dir='ltr'><em>putidus</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1033 234 1170 260; x_wconf 89' lang='eng' dir='ltr'><em>QC81-06T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 1180 235 1344 264; x_wconf 86' lang='eng' dir='ltr'><em>(AB374522)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 385 34 407 36">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 385 34 407 36">
+     <span class='ocr_line' id='line_1_7' title="bbox 385 34 407 36; baseline 0 497"><span class='ocrx_word' id='word_1_41' title='bbox 385 34 407 36; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 405 10 407 59">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 405 10 407 59">
+     <span class='ocr_line' id='line_1_8' title="bbox 405 10 407 59; baseline 0 474"><span class='ocrx_word' id='word_1_42' title='bbox 405 10 407 59; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 348 69 375 88">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 348 69 375 88">
+     <span class='ocr_line' id='line_1_9' title="bbox 348 69 375 88; baseline 0 0"><span class='ocrx_word' id='word_1_43' title='bbox 348 69 375 88; x_wconf 88' lang='eng'>88</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 315 98 387 100">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 315 98 387 100">
+     <span class='ocr_line' id='line_1_10' title="bbox 315 98 387 100; baseline 0 433"><span class='ocrx_word' id='word_1_44' title='bbox 315 98 387 100; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 385 34 387 164">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 385 34 387 164">
+     <span class='ocr_line' id='line_1_11' title="bbox 385 34 387 164; baseline 0 369"><span class='ocrx_word' id='word_1_45' title='bbox 385 34 387 164; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 398 127 400 199">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 398 127 400 199">
+     <span class='ocr_line' id='line_1_12' title="bbox 398 127 400 199; baseline 0 334"><span class='ocrx_word' id='word_1_46' title='bbox 398 127 400 199; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 282 188 316 190">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 282 188 316 190">
+     <span class='ocr_line' id='line_1_13' title="bbox 282 188 316 190; baseline 0 343"><span class='ocrx_word' id='word_1_47' title='bbox 282 188 316 190; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 315 98 316 280">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 315 98 316 280">
+     <span class='ocr_line' id='line_1_14' title="bbox 315 98 316 280; baseline 0 253"><span class='ocrx_word' id='word_1_48' title='bbox 315 98 316 280; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 315 278 484 280">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 315 278 484 280">
+     <span class='ocr_line' id='line_1_15' title="bbox 315 278 484 280; baseline 0 253"><span class='ocrx_word' id='word_1_49' title='bbox 315 278 484 280; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 1 286 284 288">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 1 286 284 288">
+     <span class='ocr_line' id='line_1_16' title="bbox 1 286 284 288; baseline 0 245"><span class='ocrx_word' id='word_1_50' title='bbox 1 286 284 288; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 1 286 3 432">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 1 286 3 432">
+     <span class='ocr_line' id='line_1_17' title="bbox 1 286 3 432; baseline 0 101"><span class='ocrx_word' id='word_1_51' title='bbox 1 286 3 432; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 482 243 484 315">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 482 243 484 315">
+     <span class='ocr_line' id='line_1_18' title="bbox 482 243 484 315; baseline 0 218"><span class='ocrx_word' id='word_1_52' title='bbox 482 243 484 315; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 284 281 1421 404">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 284 281 1421 404">
+     <span class='ocr_line' id='line_1_19' title="bbox 443 281 1421 314; baseline -0.001 -9"><span class='ocrx_word' id='word_1_53' title='bbox 443 295 471 314; x_wconf 77' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 761 291 779 292; x_wconf 41' lang='eng'><em>*</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 792 281 1039 310; x_wconf 84' lang='eng' dir='ltr'><em>Sporolactobacillus</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 1049 282 1137 305; x_wconf 81' lang='eng' dir='ltr'><em>vineae</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 1148 281 1250 305; x_wconf 85' lang='eng' dir='ltr'>SL1153</span> <span class='ocrx_word' id='word_1_58' title='bbox 1261 282 1421 310; x_wconf 89' lang='eng' dir='ltr'><em>(EF581818)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 707 326 1402 359; baseline 0 -6"><span class='ocrx_word' id='word_1_59' title='bbox 707 330 748 349; x_wconf 88' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 774 330 1021 359; x_wconf 78' lang='eng' dir='ltr'><em>Sporo/actobaciI/us</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1032 330 1120 353; x_wconf 89' lang='eng' dir='ltr'><em>vineae</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1130 326 1231 353; x_wconf 90' lang='eng' dir='ltr'><em>SL153T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 1242 330 1402 359; x_wconf 87' lang='eng' dir='ltr'><em>(EF581819)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 284 373 1121 404; baseline 0 -6"><span class='ocrx_word' id='word_1_64' title='bbox 284 384 408 386; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_65' title='bbox 421 375 669 404; x_wconf 82' lang='eng' dir='ltr'><em>Sporolactobaci/Ius</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 678 375 781 398; x_wconf 88' lang='eng' dir='ltr'><em>inulinus</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 793 375 840 398; x_wconf 93' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 853 373 949 398; x_wconf 85' lang='eng' dir='ltr'><em>13595T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 959 375 1121 404; x_wconf 85' lang='eng' dir='ltr'><em>(AB374521)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 482 313 761 315">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 482 313 761 315">
+     <span class='ocr_line' id='line_1_22' title="bbox 482 313 761 315; baseline 0 218"><span class='ocrx_word' id='word_1_70' title='bbox 482 313 761 315; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 759 291 761 339">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 759 291 761 339">
+     <span class='ocr_line' id='line_1_23' title="bbox 759 291 761 339; baseline 0 194"><span class='ocrx_word' id='word_1_71' title='bbox 759 291 761 339; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 282 188 284 386">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 282 188 284 386">
+     <span class='ocr_line' id='line_1_24' title="bbox 282 188 284 386; baseline 0 147"><span class='ocrx_word' id='word_1_72' title='bbox 282 188 284 386; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 1 430 779 432">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 1 430 779 432">
+     <span class='ocr_line' id='line_1_25' title="bbox 1 430 779 432; baseline 0 101"><span class='ocrx_word' id='word_1_73' title='bbox 1 430 779 432; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 790 420 1337 450">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 790 420 1337 450">
+     <span class='ocr_line' id='line_1_26' title="bbox 790 420 1337 450; baseline 0 -6"><span class='ocrx_word' id='word_1_74' title='bbox 790 421 895 444; x_wconf 84' lang='eng' dir='ltr'><em>Bacillus</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 904 421 997 444; x_wconf 82' lang='eng' dir='ltr'><em>subtilis</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1008 421 1058 444; x_wconf 92' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1072 420 1166 444; x_wconf 91' lang='eng' dir='ltr'><em>12118T</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 1176 421 1337 450; x_wconf 88' lang='eng' dir='ltr'><em>(ABO42061)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 137 512 182 532">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 137 512 182 532">
+     <span class='ocr_line' id='line_1_27' title="bbox 137 512 182 532; baseline 0 0"><span class='ocrx_word' id='word_1_79' title='bbox 137 512 182 532; x_wconf 90' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-001.pbm.png
new file mode 100644
index 00000000..6f79c5f3
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-001.pbm.png.hocr
new file mode 100644
index 00000000..8524aa17
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002048-0-001.pbm.png.hocr
@@ -0,0 +1,102 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002048-0-001.pbm.png"; bbox 0 0 1536 527; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 204 1 1303 92">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 204 1 1303 92">
+     <span class='ocr_line' id='line_1_1' title="bbox 204 1 1247 37; baseline -0.001 -10"><span class='ocrx_word' id='word_1_1' title='bbox 204 15 233 37; x_wconf 75' lang='eng'><em>85</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 245 16 475 18; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_3' title='bbox 488 3 747 32; x_wconf 85' lang='eng' dir='ltr'><em>Sporolactobacillus</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 759 3 894 27; x_wconf 87' lang='eng' dir='ltr'><em>kofuensis</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 905 3 967 27; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 981 1 1065 27; x_wconf 80' lang='eng' dir='ltr'><em>3419T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1077 3 1247 32; x_wconf 82' lang='eng' dir='ltr'><em>(A8374524)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 486 61 1303 92; baseline -0.001 -5"><span class='ocrx_word' id='word_1_8' title='bbox 486 63 746 92; x_wconf 79' lang='eng' dir='ltr'><em>Sporalactobacillus</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 757 63 941 87; x_wconf 84' lang='eng' dir='ltr'><em>laevolacticus</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 954 63 1006 86; x_wconf 92' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1021 61 1122 87; x_wconf 80' lang='eng' dir='ltr'><em>12321T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1134 63 1303 92; x_wconf 80' lang='eng' dir='ltr'><em>(A8374523)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 243 16 245 78">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 243 16 245 78">
+     <span class='ocr_line' id='line_1_3' title="bbox 243 16 245 78; baseline 0 449"><span class='ocrx_word' id='word_1_13' title='bbox 243 16 245 78; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 194 129 214 131">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 194 129 214 131">
+     <span class='ocr_line' id='line_1_4' title="bbox 194 129 214 131; baseline 0 396"><span class='ocrx_word' id='word_1_14' title='bbox 194 129 214 131; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 356 137 358 199">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 356 137 358 199">
+     <span class='ocr_line' id='line_1_5' title="bbox 356 137 358 199; baseline 0 328"><span class='ocrx_word' id='word_1_15' title='bbox 356 137 358 199; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 212 46 214 213">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 212 46 214 213">
+     <span class='ocr_line' id='line_1_6' title="bbox 212 46 214 213; baseline 0 314"><span class='ocrx_word' id='word_1_16' title='bbox 212 46 214 213; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 116 223 196 225">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 116 223 196 225">
+     <span class='ocr_line' id='line_1_7' title="bbox 116 223 196 225; baseline 0 302"><span class='ocrx_word' id='word_1_17' title='bbox 116 223 196 225; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 194 129 196 319">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 194 129 196 319">
+     <span class='ocr_line' id='line_1_8' title="bbox 194 129 196 319; baseline 0 208"><span class='ocrx_word' id='word_1_18' title='bbox 194 129 196 319; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 1 300 118 302">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 1 300 118 302">
+     <span class='ocr_line' id='line_1_9' title="bbox 1 300 118 302; baseline 0 225"><span class='ocrx_word' id='word_1_19' title='bbox 1 300 118 302; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 1 301 3 440">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 1 301 3 440">
+     <span class='ocr_line' id='line_1_10' title="bbox 1 301 3 440; baseline 0 87"><span class='ocrx_word' id='word_1_20' title='bbox 1 301 3 440; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 116 223 118 379">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 116 223 118 379">
+     <span class='ocr_line' id='line_1_11' title="bbox 116 223 118 379; baseline 0 148"><span class='ocrx_word' id='word_1_21' title='bbox 116 223 118 379; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 27 120 1534 499">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 27 120 1534 499">
+     <span class='ocr_line' id='line_1_12' title="bbox 305 120 1534 158; baseline -0.001 -12"><span class='ocrx_word' id='word_1_22' title='bbox 305 137 348 158; x_wconf 75' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 358 137 446 139; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_24' title='bbox 463 122 723 152; x_wconf 82' lang='eng' dir='ltr'><em>Sporolactobaoillus</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 734 123 899 152; x_wconf 88' lang='eng' dir='ltr'><em>nakayamae</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 910 123 1001 152; x_wconf 87' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1015 123 1181 152; x_wconf 85' lang='eng' dir='ltr'><em>nakayamae</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1192 122 1254 146; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1268 120 1353 146; x_wconf 76' lang='eng' dir='ltr'><em>3514T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1365 123 1534 152; x_wconf 79' lang='eng' dir='ltr'><em>(A8374525)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 143 183 1505 215; baseline -0.001 -6"><span class='ocrx_word' id='word_1_31' title='bbox 143 193 185 214; x_wconf 79' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 358 197 440 199; x_wconf 95' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_33' title='bbox 454 185 714 215; x_wconf 82' lang='eng' dir='ltr'><em>Sporalactobacillus</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 725 185 890 215; x_wconf 86' lang='eng' dir='ltr'><em>nakayamae</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 902 185 993 215; x_wconf 87' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1006 185 1153 209; x_wconf 86' lang='eng' dir='ltr'><em>racemicus</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1163 185 1225 209; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1239 183 1323 209; x_wconf 78' lang='eng' dir='ltr'><em>3417T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1336 185 1505 215; x_wconf 77' lang='eng' dir='ltr'><em>(ABS74526)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 78 245 1168 291; baseline 0 -21"><span class='ocrx_word' id='word_1_40' title='bbox 78 270 107 291; x_wconf 73' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 461 247 721 276; x_wconf 84' lang='eng' dir='ltr'><em>Sporolactobacillus</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 732 248 814 270; x_wconf 78' lang='eng' dir='ltr'><em>terrae</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 826 247 888 270; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 901 245 986 270; x_wconf 81' lang='eng' dir='ltr'><em>3516T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 998 247 1168 276; x_wconf 75' lang='eng' dir='ltr'><em>(ABB74527)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 497 303 1234 334; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 497 305 757 334; x_wconf 78' lang='eng' dir='ltr'><em>Sporolactobacillus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 767 305 876 328; x_wconf 87' lang='eng' dir='ltr'><em>inulinus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 888 305 938 328; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 952 303 1053 328; x_wconf 80' lang='eng' dir='ltr'><em>13595T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1065 305 1234 334; x_wconf 72' lang='eng' dir='ltr'><em>(ABS74528)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 423 362 1175 394; baseline -0.001 -7"><span class='ocrx_word' id='word_1_51' title='bbox 423 364 709 394; x_wconf 87' lang='eng' dir='ltr'><em>Sporolactobacillus</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 719 364 835 394; x_wconf 88' lang='eng' dir='ltr'><em>putidus</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 847 362 992 388; x_wconf 85' lang='eng' dir='ltr'><em>QC81-06T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 1002 363 1175 392; x_wconf 85' lang='eng' dir='ltr'><em>(AB374529)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 489 428 1031 459; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 489 430 600 453; x_wconf 87' lang='eng' dir='ltr'><em>Bacillus</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 610 430 708 453; x_wconf 78' lang='eng' dir='ltr'><em>subtilis</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 720 430 772 453; x_wconf 92' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 788 428 886 453; x_wconf 91' lang='eng' dir='ltr'><em>12118T</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 898 430 1031 459; x_wconf 86' lang='eng'><em>(299104)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 27 477 137 499; baseline 0 0"><span class='ocrx_word' id='word_1_60' title='bbox 27 477 137 499; x_wconf 59' lang='eng'><em>1—1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 55 504 112 525">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 55 504 112 525">
+     <span class='ocr_line' id='line_1_19' title="bbox 55 504 112 525; baseline 0 0"><span class='ocrx_word' id='word_1_61' title='bbox 55 504 112 525; x_wconf 92' lang='eng'>0.05</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002113-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002113-0-000.pbm.png
new file mode 100644
index 00000000..4b88d31b
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002113-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002113-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002113-0-000.pbm.png.hocr
new file mode 100644
index 00000000..9ba2c352
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002113-0-000.pbm.png.hocr
@@ -0,0 +1,163 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002113-0-000.pbm.png"; bbox 0 0 1231 978; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 430 5 1146 196">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 430 5 1146 115">
+     <span class='ocr_line' id='line_1_1' title="bbox 497 5 1146 34; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 497 7 666 28; x_wconf 83' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 674 7 834 34; x_wconf 83' lang='eng' dir='ltr'><em>primoryensis</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 844 7 905 28; x_wconf 91' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 916 5 989 28; x_wconf 80' lang='eng' dir='ltr'><em>3633T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 999 7 1146 34; x_wconf 85' lang='eng' dir='ltr'><em>(AB074193)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 523 45 1025 74; baseline 0.002 -6"><span class='ocrx_word' id='word_1_6' title='bbox 523 48 692 69; x_wconf 88' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 700 48 783 74; x_wconf 87' lang='eng' dir='ltr'><em>polaris</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 792 45 872 69; x_wconf 76' lang='eng' dir='ltr'><em>CK13T</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 882 48 1025 74; x_wconf 85' lang='eng' dir='ltr'><em>(AJ833000)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 430 86 946 115; baseline 0 -6"><span class='ocrx_word' id='word_1_10' title='bbox 430 89 599 109; x_wconf 87' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 607 89 697 115; x_wconf 88' lang='eng' dir='ltr'><em>pontica</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 706 86 789 109; x_wconf 82' lang='eng' dir='ltr'><em>46-16T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 799 88 946 115; x_wconf 83' lang='eng' dir='ltr'><em>(AY539835)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 443 127 1096 196">
+     <span class='ocr_line' id='line_1_4' title="bbox 443 127 1096 156; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 443 129 612 150; x_wconf 82' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 621 129 778 150; x_wconf 84' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 788 127 934 150; x_wconf 89' lang='eng' dir='ltr'><em>DSW10-10T</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 944 129 1096 156; x_wconf 87' lang='eng' dir='ltr'>(DQO11526)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 468 168 1001 196; baseline 0 -5"><span class='ocrx_word' id='word_1_18' title='bbox 468 170 637 191; x_wconf 86' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 646 170 793 191; x_wconf 85' lang='eng' dir='ltr'><em>ushuaiensis</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 804 168 848 191; x_wconf 92' lang='eng' dir='ltr'><em>U1T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 858 170 1001 196; x_wconf 83' lang='eng' dir='ltr'><em>(AJ627909)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 217 12 519 222">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 217 12 519 222">
+     <span class='ocr_line' id='line_1_6' title="bbox 257 12 519 129; baseline 0 0"><span class='ocrx_word' id='word_1_22' title='bbox 257 12 519 129; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 257 129 443 170; baseline 0 808"><span class='ocrx_word' id='word_1_23' title='bbox 257 129 443 170; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 217 170 463 222; baseline 0 -28"><span class='ocrx_word' id='word_1_24' title='bbox 217 170 463 222; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 53 30 93 48">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 53 30 93 48">
+     <span class='ocr_line' id='line_1_9' title="bbox 53 30 93 48; baseline -0.025 0"><span class='ocrx_word' id='word_1_25' title='bbox 53 30 93 48; x_wconf 87' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 324 58 359 75">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 324 58 359 75">
+     <span class='ocr_line' id='line_1_10' title="bbox 324 58 359 75; baseline 0 0"><span class='ocrx_word' id='word_1_26' title='bbox 324 58 359 75; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 1 242 544 960">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 1 242 544 960">
+     <span class='ocr_line' id='line_1_11' title="bbox 45 242 215 334; baseline 0 -42"><span class='ocrx_word' id='word_1_27' title='bbox 45 242 215 334; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 20 334 55 374; baseline 0 604"><span class='ocrx_word' id='word_1_28' title='bbox 20 334 55 374; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 20 374 378 414; baseline 0 564"><span class='ocrx_word' id='word_1_29' title='bbox 20 374 378 414; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 20 414 401 455; baseline 0 0"><span class='ocrx_word' id='word_1_30' title='bbox 20 414 401 455; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 20 455 386 496; baseline 0 482"><span class='ocrx_word' id='word_1_31' title='bbox 20 455 386 496; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 20 496 432 536; baseline 0 442"><span class='ocrx_word' id='word_1_32' title='bbox 20 496 432 536; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 1 536 510 577; baseline 0 0"><span class='ocrx_word' id='word_1_33' title='bbox 1 536 510 577; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 1 577 349 618; baseline 0 360"><span class='ocrx_word' id='word_1_34' title='bbox 1 577 349 618; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 1 618 415 659; baseline 0 0"><span class='ocrx_word' id='word_1_35' title='bbox 1 618 415 659; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 1 659 372 700; baseline 0 278"><span class='ocrx_word' id='word_1_36' title='bbox 1 659 372 700; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 1 700 387 740; baseline 0 238"><span class='ocrx_word' id='word_1_37' title='bbox 1 700 387 740; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 1 740 429 781; baseline 0 0"><span class='ocrx_word' id='word_1_38' title='bbox 1 740 429 781; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 1 781 375 822; baseline 0 156"><span class='ocrx_word' id='word_1_39' title='bbox 1 781 375 822; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 1 822 467 862; baseline 0 116"><span class='ocrx_word' id='word_1_40' title='bbox 1 822 467 862; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 1 862 525 903; baseline 0 0"><span class='ocrx_word' id='word_1_41' title='bbox 1 862 525 903; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 1 903 544 960; baseline 0 0"><span class='ocrx_word' id='word_1_42' title='bbox 1 903 544 960; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 172 180 1035 360">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 172 180 1035 360">
+     <span class='ocr_line' id='line_1_27' title="bbox 218 180 254 197; baseline 0 0"><span class='ocrx_word' id='word_1_43' title='bbox 218 180 254 197; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 172 208 1035 238; baseline 0 -7"><span class='ocrx_word' id='word_1_44' title='bbox 172 220 208 238; x_wconf 75' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 426 211 595 231; x_wconf 86' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 604 211 768 231; x_wconf 82' lang='eng' dir='ltr'><em>mediterranea</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 779 208 879 231; x_wconf 81' lang='eng' dir='ltr'><em>MMB-1T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 889 210 1035 237; x_wconf 87' lang='eng' dir='ltr'><em>(AF063027)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 267 249 1024 278; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 267 258 291 276; x_wconf 75' lang='eng'><em>33</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 405 252 575 272; x_wconf 85' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 584 252 711 272; x_wconf 85' lang='eng' dir='ltr'><em>communis</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 721 251 778 272; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 789 249 862 272; x_wconf 79' lang='eng' dir='ltr'><em>2864T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 871 251 1024 278; x_wconf 89' lang='eng' dir='ltr'>(DQO11528)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 420 289 963 319; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 420 292 589 313; x_wconf 83' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 599 297 657 319; x_wconf 83' lang='eng' dir='ltr'><em>vaga</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 666 292 742 313; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 752 289 840 313; x_wconf 82' lang='eng' dir='ltr'><em>27119T</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 850 292 963 319; x_wconf 88' lang='eng' dir='ltr'><em>(X67025)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 251 331 974 360; baseline 0 -6"><span class='ocrx_word' id='word_1_60' title='bbox 251 340 275 358; x_wconf 81' lang='eng'><em>94</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 397 333 566 354; x_wconf 85' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 575 333 712 359; x_wconf 85' lang='eng' dir='ltr'><em>aquimarina</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 724 333 731 354; x_wconf 99' lang='eng'>1</span> <span class='ocrx_word' id='word_1_64' title='bbox 740 331 821 354; x_wconf 91' lang='eng' dir='ltr'><em>1SM4T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 831 333 974 360; x_wconf 84' lang='eng' dir='ltr'><em>(AJ843077)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 215 201 217 366">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 215 201 217 366">
+     <span class='ocr_line' id='line_1_32' title="bbox 215 201 217 366; baseline 0 612"><span class='ocrx_word' id='word_1_66' title='bbox 215 201 217 366; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 349 371 1229 971">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 378 371 1081 482">
+     <span class='ocr_line' id='line_1_33' title="bbox 378 371 1081 400; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 378 374 547 395; x_wconf 87' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 556 374 700 400; x_wconf 86' lang='eng' dir='ltr'><em>ostreistagni</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 709 371 924 395; x_wconf 81' lang='eng' dir='ltr'><em>UST010306—043T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 934 374 1081 400; x_wconf 79' lang='eng' dir='ltr'><em>(ABZ42868)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 407 412 972 441; baseline 0 -6"><span class='ocrx_word' id='word_1_71' title='bbox 407 414 584 435; x_wconf 84' lang='eng' dir='ltr'><em>Oceanobacter</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 590 415 664 441; x_wconf 84' lang='eng' dir='ltr'><em>kriegii</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 673 414 716 435; x_wconf 93' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 728 412 815 435; x_wconf 80' lang='eng' dir='ltr'><em>15467T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 825 414 972 441; x_wconf 87' lang='eng' dir='ltr'><em>(AB006767)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 386 453 942 482; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 386 455 562 476; x_wconf 83' lang='eng' dir='ltr'><em>Thalassolituus</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 571 455 698 476; x_wconf 82' lang='eng' dir='ltr'><em>o/eivorans</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 708 455 727 476; x_wconf 93' lang='eng' dir='ltr'>M</span> <span class='ocrx_word' id='word_1_79' title='bbox 732 455 735 476; x_wconf 99' lang='eng'><strong><em>|</em></strong></span> <span class='ocrx_word' id='word_1_80' title='bbox 740 455 773 476; x_wconf 99' lang='eng' dir='ltr'><em>L-1</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 779 453 790 466; x_wconf 73' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_82' title='bbox 799 455 942 482; x_wconf 84' lang='eng' dir='ltr'><em>(AJ431699)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 432 493 998 522">
+     <span class='ocr_line' id='line_1_36' title="bbox 432 493 998 522; baseline 0 -6"><span class='ocrx_word' id='word_1_83' title='bbox 432 496 582 517; x_wconf 89' lang='eng' dir='ltr'><em>Bermanella</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 592 496 732 517; x_wconf 86' lang='eng' dir='ltr'><em>marisrubri</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 740 493 840 517; x_wconf 78' lang='eng' dir='ltr'><em>RED65T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 850 496 998 522; x_wconf 86' lang='eng' dir='ltr'><em>(AY136131)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 349 534 990 604">
+     <span class='ocr_line' id='line_1_37' title="bbox 515 534 990 563; baseline 0 -6"><span class='ocrx_word' id='word_1_87' title='bbox 515 536 623 563; x_wconf 88' lang='eng' dir='ltr'><em>O/eispira</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 633 537 753 557; x_wconf 82' lang='eng' dir='ltr'><em>antarctica</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 764 534 837 557; x_wconf 90' lang='eng' dir='ltr'><em>RB-8T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 847 536 990 563; x_wconf 86' lang='eng' dir='ltr'><em>(AJ426420)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 349 575 933 604; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 349 577 548 604; x_wconf 83' lang='eng' dir='ltr'><em>Oceanospiri/Ium</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 557 577 623 598; x_wconf 91' lang='eng' dir='ltr'><em>linum</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 631 577 707 598; x_wconf 86' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_94' title='bbox 719 577 726 598; x_wconf 99' lang='eng'>1</span> <span class='ocrx_word' id='word_1_95' title='bbox 734 575 805 598; x_wconf 81' lang='eng' dir='ltr'><em>1336T</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 815 577 933 604; x_wconf 86' lang='eng' dir='ltr'>(M22365)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 372 616 1155 808">
+     <span class='ocr_line' id='line_1_39' title="bbox 421 616 1037 645; baseline 0 -6"><span class='ocrx_word' id='word_1_97' title='bbox 421 618 620 645; x_wconf 83' lang='eng' dir='ltr'><em>Oceanospir/Ilum</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 630 619 697 639; x_wconf 89' lang='eng' dir='ltr'><em>maris</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 705 618 781 639; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 791 616 879 639; x_wconf 82' lang='eng' dir='ltr'><em>27509T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 889 618 1037 645; x_wconf 89' lang='eng' dir='ltr'><em>(ABOO6771)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 372 657 1020 686; baseline 0 -6"><span class='ocrx_word' id='word_1_102' title='bbox 372 659 571 685; x_wconf 83' lang='eng' dir='ltr'><em>Oceanospiri/lum</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 580 659 711 686; x_wconf 77' lang='eng' dir='ltr'><em>beljerinckii</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 720 659 764 680; x_wconf 90' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 776 657 862 680; x_wconf 92' lang='eng' dir='ltr'><em>15445T</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 872 659 1020 686; x_wconf 80' lang='eng' dir='ltr'><em>(ABOOG760)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 387 697 1117 726; baseline -0.001 -5"><span class='ocrx_word' id='word_1_107' title='bbox 387 700 586 726; x_wconf 86' lang='eng' dir='ltr'><em>Oceanospiri/Ium</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 595 700 806 726; x_wconf 84' lang='eng' dir='ltr'><em>multiglobuliferum</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 817 700 861 721; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 873 697 959 721; x_wconf 74' lang='eng' dir='ltr'><em>13614T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 969 700 1117 726; x_wconf 77' lang='eng' dir='ltr'><em>(ABOOB764)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 434 738 1155 767; baseline 0 -6"><span class='ocrx_word' id='word_1_112' title='bbox 434 741 623 767; x_wconf 81' lang='eng' dir='ltr'><em>Neptunomonas</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 632 741 817 767; x_wconf 81' lang='eng' dir='ltr'><em>naphthovorans</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 827 738 998 761; x_wconf 80' lang='eng' dir='ltr'><em>NAG-2N-126T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1009 740 1155 767; x_wconf 86' lang='eng' dir='ltr'><em>(AF053734)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 375 779 990 808; baseline 0 -6"><span class='ocrx_word' id='word_1_116' title='bbox 375 781 558 807; x_wconf 81' lang='eng' dir='ltr'><em>Neptuniibacter</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 565 781 719 802; x_wconf 85' lang='eng' dir='ltr'><em>caesariensis</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 729 779 833 802; x_wconf 76' lang='eng' dir='ltr'><em>MEDE)2T</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 842 781 945 808; x_wconf 84' lang='eng' dir='ltr'><em>(AY1361</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 953 781 990 808; x_wconf 89' lang='eng'><em>16)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 467 819 1017 848">
+     <span class='ocr_line' id='line_1_44' title="bbox 467 819 1017 848; baseline 0 -5"><span class='ocrx_word' id='word_1_121' title='bbox 467 822 583 843; x_wconf 83' lang='eng' dir='ltr'><em>Reinekea</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 593 822 726 843; x_wconf 87' lang='eng' dir='ltr'><em>blandensis</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 736 819 855 843; x_wconf 79' lang='eng' dir='ltr'><em>MED297T</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 865 822 1017 848; x_wconf 88' lang='eng' dir='ltr'><em>(DQ403810)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 423 860 1229 930">
+     <span class='ocr_line' id='line_1_45' title="bbox 529 860 1229 889; baseline 0 -6"><span class='ocrx_word' id='word_1_125' title='bbox 529 863 646 883; x_wconf 86' lang='eng' dir='ltr'><em>Reinekea</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 655 863 908 883; x_wconf 83' lang='eng' dir='ltr'><em>marinisedimentorum</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 919 862 977 883; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 991 860 1077 883; x_wconf 79' lang='eng' dir='ltr'><em>15388T</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 1087 862 1229 889; x_wconf 88' lang='eng' dir='ltr'><em>(AJ561121)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 423 901 1034 930; baseline 0.002 -6"><span class='ocrx_word' id='word_1_130' title='bbox 423 903 643 930; x_wconf 84' lang='eng' dir='ltr'><em>Saccharospiri/Ium</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 652 904 772 930; x_wconf 88' lang='eng' dir='ltr'><em>impatiens</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 782 901 881 925; x_wconf 92' lang='eng' dir='ltr'><em>EL—105T</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 891 904 1034 930; x_wconf 83' lang='eng' dir='ltr'><em>(AJ315983)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 549 942 1069 971">
+     <span class='ocr_line' id='line_1_47' title="bbox 549 942 1069 971; baseline 0 -6"><span class='ocrx_word' id='word_1_134' title='bbox 549 945 662 971; x_wconf 82' lang='eng' dir='ltr'><em>KangleI/a</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 672 945 791 965; x_wconf 85' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 800 942 912 965; x_wconf 89' lang='eng' dir='ltr'><em>SW-125T</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 922 944 1069 971; x_wconf 86' lang='eng' dir='ltr'><em>(AY520560)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002220-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002220-0-000.pbm.png
new file mode 100644
index 00000000..2de6edd5
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002220-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002220-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002220-0-000.pbm.png.hocr
new file mode 100644
index 00000000..26663842
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002220-0-000.pbm.png.hocr
@@ -0,0 +1,220 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002220-0-000.pbm.png"; bbox 0 0 1243 1660; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 7 429 35 450">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 7 429 35 450">
+     <span class='ocr_line' id='line_1_1' title="bbox 7 429 35 450; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 7 429 35 450; x_wconf 85' lang='eng'>56</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 48 3 99 23">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 48 3 99 23">
+     <span class='ocr_line' id='line_1_2' title="bbox 48 3 99 23; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 48 3 99 23; x_wconf 91' lang='eng'><em>002</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 54 149 83 169">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 54 149 83 169">
+     <span class='ocr_line' id='line_1_3' title="bbox 54 149 83 169; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 54 149 83 169; x_wconf 85' lang='eng'><em>99</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 52 761 80 781">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 52 761 80 781">
+     <span class='ocr_line' id='line_1_4' title="bbox 52 761 80 781; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 52 761 80 781; x_wconf 93' lang='eng'><em>84</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 41 1454 83 1475">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 41 1454 83 1475">
+     <span class='ocr_line' id='line_1_5' title="bbox 41 1454 83 1475; baseline 0.024 -1"><span class='ocrx_word' id='word_1_5' title='bbox 41 1454 83 1475; x_wconf 85' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 135 78 177 99">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 135 78 177 99">
+     <span class='ocr_line' id='line_1_6' title="bbox 135 78 177 99; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 135 78 177 99; x_wconf 86' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 98 508 141 529">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 98 508 141 529">
+     <span class='ocr_line' id='line_1_7' title="bbox 98 508 141 529; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 98 508 141 529; x_wconf 82' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 88 956 116 976">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 88 956 116 976">
+     <span class='ocr_line' id='line_1_8' title="bbox 88 956 116 976; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 88 956 116 976; x_wconf 89' lang='eng'>74</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 134 729 176 750">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 134 729 176 750">
+     <span class='ocr_line' id='line_1_9' title="bbox 134 729 176 750; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 134 729 176 750; x_wconf 85' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 134 1139 176 1160">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 134 1139 176 1160">
+     <span class='ocr_line' id='line_1_10' title="bbox 134 1139 176 1160; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 134 1139 176 1160; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 301 357 330 377">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 301 357 330 377">
+     <span class='ocr_line' id='line_1_11' title="bbox 301 357 330 377; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 301 357 330 377; x_wconf 85' lang='eng'>96</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 250 426 292 447">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 250 426 292 447">
+     <span class='ocr_line' id='line_1_12' title="bbox 250 426 292 447; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 250 426 292 447; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 308 915 350 936">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 308 915 350 936">
+     <span class='ocr_line' id='line_1_13' title="bbox 308 915 350 936; baseline 0.024 -1"><span class='ocrx_word' id='word_1_13' title='bbox 308 915 350 936; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 265 985 294 1005">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 265 985 294 1005">
+     <span class='ocr_line' id='line_1_14' title="bbox 265 985 294 1005; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 265 985 294 1005; x_wconf 91' lang='eng'><em>50</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 280 1244 322 1265">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 280 1244 322 1265">
+     <span class='ocr_line' id='line_1_15' title="bbox 280 1244 322 1265; baseline 0 0"><span class='ocrx_word' id='word_1_15' title='bbox 280 1244 322 1265; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 250 1524 292 1545">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 250 1524 292 1545">
+     <span class='ocr_line' id='line_1_16' title="bbox 250 1524 292 1545; baseline 0.024 -1"><span class='ocrx_word' id='word_1_16' title='bbox 250 1524 292 1545; x_wconf 85' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 414 46 957 75">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 414 46 957 75">
+     <span class='ocr_line' id='line_1_17' title="bbox 414 46 957 75; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 414 49 491 69; x_wconf 77' lang='eng' dir='ltr'><em>Haliea</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 501 49 633 75; x_wconf 83' lang='eng' dir='ltr'><em>salexigens</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 643 48 701 69; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 715 46 801 69; x_wconf 80' lang='eng' dir='ltr'><em>19537T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 811 49 957 75; x_wconf 85' lang='eng' dir='ltr'><em>(AY576769)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 490 140 1052 169">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 490 140 1052 169">
+     <span class='ocr_line' id='line_1_18' title="bbox 490 140 1052 169; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 490 142 566 163; x_wconf 86' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 578 140 726 168; x_wconf 89' lang='eng' dir='ltr'><em>CM41_15aT</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 736 140 1052 169; x_wconf 79' lang='eng' dir='ltr'><em>DSM19751T(EU161717)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 518 235 1072 263">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 518 235 1072 263">
+     <span class='ocr_line' id='line_1_19' title="bbox 518 235 1072 263; baseline -0.002 -5"><span class='ocrx_word' id='word_1_25' title='bbox 518 237 606 258; x_wconf 83' lang='eng' dir='ltr'><em>Melitea</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 615 237 748 263; x_wconf 79' lang='eng' dir='ltr'><em>salexigens</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 758 237 816 258; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 829 235 916 258; x_wconf 81' lang='eng' dir='ltr'><em>19753T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 926 237 1072 263; x_wconf 87' lang='eng' dir='ltr'><em>(AY576729)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 392 329 933 357">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 392 329 933 357">
+     <span class='ocr_line' id='line_1_20' title="bbox 392 329 933 357; baseline 0.002 -6"><span class='ocrx_word' id='word_1_30' title='bbox 392 331 554 352; x_wconf 83' lang='eng' dir='ltr'><em>Microbulbifer</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 560 331 691 357; x_wconf 85' lang='eng' dir='ltr'><em>salipa/udis</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 700 331 761 352; x_wconf 78' lang='eng' dir='ltr'><em>SM—‘l</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 767 329 778 343; x_wconf 73' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_34' title='bbox 788 331 933 357; x_wconf 82' lang='eng' dir='ltr'><em>(AF479688)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 408 420 1045 448">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 408 420 1045 448">
+     <span class='ocr_line' id='line_1_21' title="bbox 408 420 1045 448; baseline 0.002 -6"><span class='ocrx_word' id='word_1_35' title='bbox 408 422 570 443; x_wconf 86' lang='eng' dir='ltr'><em>Microbulbifer</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 577 422 725 448; x_wconf 86' lang='eng' dir='ltr'><em>hydrolyticus</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 735 422 793 443; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 806 422 813 442; x_wconf 84' lang='eng'><strong>1</strong></span> <span class='ocrx_word' id='word_1_39' title='bbox 821 420 893 443; x_wconf 87' lang='eng' dir='ltr'><em>1525T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 903 422 1045 448; x_wconf 83' lang='eng' dir='ltr'><em>(AJ608704)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 423 515 1019 543">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 423 515 1019 543">
+     <span class='ocr_line' id='line_1_22' title="bbox 423 515 1019 543; baseline 0.002 -6"><span class='ocrx_word' id='word_1_41' title='bbox 423 517 584 538; x_wconf 77' lang='eng' dir='ltr'><em>Microbulb/fer</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 591 517 712 543; x_wconf 81' lang='eng' dir='ltr'><em>elongatus</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 722 517 780 538; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 791 515 865 538; x_wconf 80' lang='eng' dir='ltr'><em>6810T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 875 517 1019 543; x_wconf 89' lang='eng' dir='ltr'><em>(AF500006)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 432 607 973 636">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 432 607 973 636">
+     <span class='ocr_line' id='line_1_23' title="bbox 432 607 973 636; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 432 610 593 631; x_wconf 85' lang='eng' dir='ltr'><em>Microbulbifer</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 600 610 722 631; x_wconf 81' lang='eng' dir='ltr'><em>maritimus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 730 610 784 630; x_wconf 82' lang='eng' dir='ltr'><em>TF—1</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 790 607 816 630; x_wconf 94' lang='eng' dir='ltr'><em>7T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 826 610 973 636; x_wconf 84' lang='eng' dir='ltr'><em>(AY377986)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 466 700 1058 728">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 466 700 1058 728">
+     <span class='ocr_line' id='line_1_24' title="bbox 466 700 1058 728; baseline 0 -5"><span class='ocrx_word' id='word_1_51' title='bbox 466 702 579 723; x_wconf 85' lang='eng' dir='ltr'><em>Cellvibrio</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 584 702 706 728; x_wconf 82' lang='eng' dir='ltr'><em>japonicus</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 717 702 804 723; x_wconf 88' lang='eng' dir='ltr'>NCIMB</span> <span class='ocrx_word' id='word_1_54' title='bbox 815 700 903 723; x_wconf 78' lang='eng' dir='ltr'><em>10462T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 912 702 1058 728; x_wconf 83' lang='eng' dir='ltr'><em>(AF452103)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 498 795 993 821">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 498 795 993 821">
+     <span class='ocr_line' id='line_1_25' title="bbox 498 795 993 821; baseline 0.002 -6"><span class='ocrx_word' id='word_1_56' title='bbox 498 795 610 816; x_wconf 84' lang='eng' dir='ltr'><em>CeI/vibrio</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 620 795 701 816; x_wconf 79' lang='eng' dir='ltr'><em>mixtus</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 709 795 769 816; x_wconf 92' lang='eng' dir='ltr'><em>ACM</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 780 795 840 816; x_wconf 86' lang='eng'><em>2603</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 851 795 993 821; x_wconf 83' lang='eng' dir='ltr'><em>(AJ289160)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 452 883 1142 912">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 452 883 1142 912">
+     <span class='ocr_line' id='line_1_26' title="bbox 452 883 1142 912; baseline -0.001 -5"><span class='ocrx_word' id='word_1_61' title='bbox 452 886 630 907; x_wconf 84' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 638 886 870 912; x_wconf 83' lang='eng' dir='ltr'><em>pseudoalcaligenes</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 881 885 938 907; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 950 883 1021 907; x_wconf 86' lang='eng' dir='ltr'><em>1225T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 1031 886 1142 912; x_wconf 84' lang='eng'><em>(276666)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 463 979 1036 1005">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 463 979 1036 1005">
+     <span class='ocr_line' id='line_1_27' title="bbox 463 979 1036 1005; baseline 0 -5"><span class='ocrx_word' id='word_1_66' title='bbox 463 979 641 1000; x_wconf 88' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 651 979 741 1000; x_wconf 84' lang='eng' dir='ltr'><em>stutzeri</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 750 979 808 1000; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 819 979 880 1000; x_wconf 85' lang='eng'><em>7136</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 890 979 1036 1005; x_wconf 81' lang='eng' dir='ltr'><em>(AF063219)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 447 1073 959 1099">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 447 1073 959 1099">
+     <span class='ocr_line' id='line_1_28' title="bbox 447 1073 959 1099; baseline -0.002 -5"><span class='ocrx_word' id='word_1_71' title='bbox 447 1073 624 1094; x_wconf 85' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 633 1073 745 1094; x_wconf 85' lang='eng' dir='ltr'><em>balearica</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 757 1073 830 1094; x_wconf 85' lang='eng' dir='ltr'><em>LS401</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 845 1073 959 1099; x_wconf 85' lang='eng' dir='ltr'><em>(U26417)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 455 1163 1087 1192">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 455 1163 1087 1192">
+     <span class='ocr_line' id='line_1_29' title="bbox 455 1163 1087 1192; baseline 0 -6"><span class='ocrx_word' id='word_1_75' title='bbox 455 1165 633 1186; x_wconf 87' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 642 1165 763 1186; x_wconf 87' lang='eng' dir='ltr'><em>rhodesiae</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 774 1165 833 1186; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 846 1163 932 1186; x_wconf 76' lang='eng' dir='ltr'><em>14020T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 942 1165 1087 1192; x_wconf 86' lang='eng' dir='ltr'><em>(AF064459)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 457 1259 1096 1288">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 457 1259 1096 1288">
+     <span class='ocr_line' id='line_1_30' title="bbox 457 1259 1096 1288; baseline 0 -6"><span class='ocrx_word' id='word_1_80' title='bbox 457 1262 635 1282; x_wconf 85' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 644 1262 751 1288; x_wconf 79' lang='eng' dir='ltr'><em>grimontii</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 759 1261 834 1282; x_wconf 89' lang='eng' dir='ltr'>CFML</span> <span class='ocrx_word' id='word_1_83' title='bbox 844 1259 942 1282; x_wconf 79' lang='eng' dir='ltr'><em>97—514T</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 951 1262 1096 1288; x_wconf 87' lang='eng' dir='ltr'><em>(AF268029)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 623 1347 1222 1376">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 623 1347 1222 1376">
+     <span class='ocr_line' id='line_1_31' title="bbox 623 1347 1222 1376; baseline -0.002 -5"><span class='ocrx_word' id='word_1_85' title='bbox 623 1350 797 1371; x_wconf 75' lang='eng' dir='ltr'><em>Acinetobacter</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 804 1350 901 1371; x_wconf 86' lang='eng' dir='ltr'><em>bouvetii</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 910 1350 968 1371; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 981 1347 1068 1371; x_wconf 79' lang='eng' dir='ltr'><em>14964T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 1078 1350 1222 1376; x_wconf 84' lang='eng' dir='ltr'><em>(AF509827)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 642 1443 1160 1472">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 642 1443 1160 1472">
+     <span class='ocr_line' id='line_1_32' title="bbox 642 1443 1160 1472; baseline 0 -6"><span class='ocrx_word' id='word_1_90' title='bbox 642 1446 761 1466; x_wconf 81' lang='eng' dir='ltr'><em>Moraxella</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 771 1446 824 1472; x_wconf 86' lang='eng' dir='ltr'><em>equi</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 831 1445 906 1466; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 916 1443 1006 1466; x_wconf 79' lang='eng' dir='ltr'><em>25576T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1015 1446 1160 1472; x_wconf 87' lang='eng' dir='ltr'><em>(AF005184)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 660 1533 1239 1562">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 660 1533 1239 1562">
+     <span class='ocr_line' id='line_1_33' title="bbox 660 1533 1239 1562; baseline 0 -6"><span class='ocrx_word' id='word_1_95' title='bbox 660 1536 840 1562; x_wconf 80' lang='eng' dir='ltr'><em>Psychrobacter</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 847 1536 966 1562; x_wconf 79' lang='eng' dir='ltr'><em>aquaticus</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 975 1535 1035 1556; x_wconf 86' lang='eng' dir='ltr'><em>CMS</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1046 1533 1088 1556; x_wconf 77' lang='eng' dir='ltr'><em>56T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1097 1536 1239 1562; x_wconf 83' lang='eng' dir='ltr'><em>(AJ584833)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 407 1626 1031 1655">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 407 1626 1031 1655">
+     <span class='ocr_line' id='line_1_34' title="bbox 407 1626 1031 1655; baseline 0 -6"><span class='ocrx_word' id='word_1_100' title='bbox 407 1629 552 1649; x_wconf 84' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 563 1629 709 1649; x_wconf 76' lang='eng' dir='ltr'><em>venustensis</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 719 1628 777 1649; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 790 1626 877 1649; x_wconf 81' lang='eng' dir='ltr'><em>13974T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 887 1629 1031 1655; x_wconf 85' lang='eng' dir='ltr'><em>(AF328766)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-000.pbm.png
new file mode 100644
index 00000000..ff445d95
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-000.pbm.png.hocr
new file mode 100644
index 00000000..484aa414
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-000.pbm.png.hocr
@@ -0,0 +1,287 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002287-0-000.pbm.png"; bbox 0 0 1243 926; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 25 78 1240 922">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 25 78 1135 551">
+     <span class='ocr_line' id='line_1_1' title="bbox 320 78 861 120; baseline 0 -19"><span class='ocrx_word' id='word_1_1' title='bbox 320 97 355 114; x_wconf 62' lang='eng'>100</span> <span class='ocrx_word' id='word_1_2' title='bbox 453 103 477 120; x_wconf 69' lang='eng'>94</span> <span class='ocrx_word' id='word_1_3' title='bbox 495 79 516 101; x_wconf 97' lang='eng' dir='ltr'><strong><em>T.</em></strong></span> <span class='ocrx_word' id='word_1_4' title='bbox 527 79 607 107; x_wconf 90' lang='eng' dir='ltr'><strong><em>pedis</em></strong></span> <span class='ocrx_word' id='word_1_5' title='bbox 616 79 689 101; x_wconf 80' lang='eng' dir='ltr'>T183</span> <span class='ocrx_word' id='word_1_6' title='bbox 701 78 861 107; x_wconf 91' lang='eng' dir='ltr'>(EF061270)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 495 115 878 144; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 495 115 516 138; x_wconf 90' lang='eng'>7&#39;.</span> <span class='ocrx_word' id='word_1_8' title='bbox 527 115 607 144; x_wconf 91' lang='eng' dir='ltr'>pedis</span> <span class='ocrx_word' id='word_1_9' title='bbox 616 115 708 138; x_wconf 87' lang='eng' dir='ltr'>T354A</span> <span class='ocrx_word' id='word_1_10' title='bbox 718 115 878 144; x_wconf 89' lang='eng' dir='ltr'>(EF061267)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 227 152 986 181; baseline 0.003 -8"><span class='ocrx_word' id='word_1_11' title='bbox 227 157 246 173; x_wconf 86' lang='eng'>71</span> <span class='ocrx_word' id='word_1_12' title='bbox 399 162 436 164; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_13' title='bbox 449 152 469 175; x_wconf 97' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_14' title='bbox 482 152 603 175; x_wconf 83' lang='eng' dir='ltr'>dent/cola</span> <span class='ocrx_word' id='word_1_15' title='bbox 613 152 695 175; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_16' title='bbox 706 152 802 175; x_wconf 82' lang='eng' dir='ltr'>35405T</span> <span class='ocrx_word' id='word_1_17' title='bbox 812 152 864 181; x_wconf 94' lang='eng' dir='ltr'>(NC</span> <span class='ocrx_word' id='word_1_18' title='bbox 875 152 986 181; x_wconf 88' lang='eng'>002967)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 369 189 968 218; baseline 0 -6"><span class='ocrx_word' id='word_1_19' title='bbox 369 196 433 212; x_wconf 84' lang='eng'>97—</span> <span class='ocrx_word' id='word_1_20' title='bbox 446 190 466 212; x_wconf 95' lang='eng' dir='ltr'><strong><em>T.</em></strong></span> <span class='ocrx_word' id='word_1_21' title='bbox 477 190 586 218; x_wconf 89' lang='eng' dir='ltr'>putidum</span> <span class='ocrx_word' id='word_1_22' title='bbox 595 189 678 212; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_23' title='bbox 689 189 802 212; x_wconf 81' lang='eng' dir='ltr'>700334T</span> <span class='ocrx_word' id='word_1_24' title='bbox 812 189 968 218; x_wconf 88' lang='eng' dir='ltr'>(AJ543428)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 466 226 942 255; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 466 226 496 249; x_wconf 75' lang='eng' dir='ltr'><em>‘T.</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 507 226 671 255; x_wconf 86' lang='eng' dir='ltr'>phagedenis‘</span> <span class='ocrx_word' id='word_1_27' title='bbox 683 226 755 249; x_wconf 87' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_28' title='bbox 767 226 802 249; x_wconf 93' lang='eng' dir='ltr'>K5</span> <span class='ocrx_word' id='word_1_29' title='bbox 813 226 942 255; x_wconf 89' lang='eng' dir='ltr'>(M57739)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 176 263 1088 297; baseline 0 -11"><span class='ocrx_word' id='word_1_30' title='bbox 176 281 200 297; x_wconf 69' lang='eng'>87</span> <span class='ocrx_word' id='word_1_31' title='bbox 588 263 617 286; x_wconf 80' lang='eng' dir='ltr'><em>‘T.</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 630 263 770 292; x_wconf 70' lang='eng' dir='ltr'>refringens‘</span> <span class='ocrx_word' id='word_1_33' title='bbox 782 263 831 286; x_wconf 93' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_34' title='bbox 842 263 916 286; x_wconf 87' lang='eng'>51.64</span> <span class='ocrx_word' id='word_1_35' title='bbox 928 263 1088 292; x_wconf 89' lang='eng' dir='ltr'>(AF426101)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 426 301 1135 329; baseline -0.001 -5"><span class='ocrx_word' id='word_1_36' title='bbox 426 307 623 324; x_wconf 85' lang='eng'>100—</span> <span class='ocrx_word' id='word_1_37' title='bbox 634 301 663 323; x_wconf 83' lang='eng' dir='ltr'><em>‘T.</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 676 301 817 329; x_wconf 73' lang='eng' dir='ltr'>calligyrum’</span> <span class='ocrx_word' id='word_1_39' title='bbox 830 301 878 323; x_wconf 90' lang='eng' dir='ltr'><strong>CIP</strong></span> <span class='ocrx_word' id='word_1_40' title='bbox 889 301 963 323; x_wconf 89' lang='eng'>64.40</span> <span class='ocrx_word' id='word_1_41' title='bbox 975 301 1135 329; x_wconf 89' lang='eng' dir='ltr'>(AF426100)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 119 337 1011 366; baseline 0.002 -8"><span class='ocrx_word' id='word_1_42' title='bbox 119 341 154 358; x_wconf 84' lang='eng'>100</span> <span class='ocrx_word' id='word_1_43' title='bbox 443 347 468 349; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_44' title='bbox 478 338 508 360; x_wconf 82' lang='eng' dir='ltr'><em>‘T.</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 522 338 635 360; x_wconf 73' lang='eng' dir='ltr'>vincentil&quot;</span> <span class='ocrx_word' id='word_1_46' title='bbox 646 337 729 360; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_47' title='bbox 739 338 840 360; x_wconf 88' lang='eng'>700013</span> <span class='ocrx_word' id='word_1_48' title='bbox 851 337 1011 366; x_wconf 87' lang='eng' dir='ltr'>(AF033310)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 404 374 974 403; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 404 381 470 398; x_wconf 83' lang='eng'>100—</span> <span class='ocrx_word' id='word_1_50' title='bbox 482 375 502 397; x_wconf 97' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_51' title='bbox 515 375 622 397; x_wconf 92' lang='eng' dir='ltr'><em>medium</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 631 374 714 397; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_53' title='bbox 725 374 838 397; x_wconf 85' lang='eng' dir='ltr'>700293T</span> <span class='ocrx_word' id='word_1_54' title='bbox 849 374 974 403; x_wconf 91' lang='eng' dir='ltr'>(D85437)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 533 411 1065 440; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 533 412 554 434; x_wconf 95' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_56' title='bbox 565 412 679 440; x_wconf 88' lang='eng' dir='ltr'><em>pallidum</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 691 412 788 434; x_wconf 90' lang='eng' dir='ltr'>Nichols</span> <span class='ocrx_word' id='word_1_58' title='bbox 799 412 871 434; x_wconf 86' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_59' title='bbox 883 411 1065 440; x_wconf 86' lang='eng' dir='ltr'>(NC_000919)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 54 448 875 477; baseline 0 -6"><span class='ocrx_word' id='word_1_60' title='bbox 54 458 308 460; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_61' title='bbox 320 449 340 471; x_wconf 95' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_62' title='bbox 353 449 558 471; x_wconf 89' lang='eng' dir='ltr'>brennaborense</span> <span class='ocrx_word' id='word_1_63' title='bbox 569 448 633 471; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_64' title='bbox 647 448 741 471; x_wconf 81' lang='eng' dir='ltr'>12168T</span> <span class='ocrx_word' id='word_1_65' title='bbox 751 448 875 477; x_wconf 84' lang='eng' dir='ltr'>(Y16568)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 25 485 1007 517; baseline 0 -9"><span class='ocrx_word' id='word_1_66' title='bbox 25 501 48 517; x_wconf 70' lang='eng'>87</span> <span class='ocrx_word' id='word_1_67' title='bbox 385 486 405 508; x_wconf 94' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_68' title='bbox 418 486 625 514; x_wconf 81' lang='eng' dir='ltr'>Iecithinolyticum</span> <span class='ocrx_word' id='word_1_69' title='bbox 634 485 716 508; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_70' title='bbox 728 485 841 508; x_wconf 81' lang='eng' dir='ltr'>700332T</span> <span class='ocrx_word' id='word_1_71' title='bbox 851 485 1007 514; x_wconf 90' lang='eng' dir='ltr'>(AJ131282)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 243 522 915 551; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 243 529 373 545; x_wconf 82' lang='eng'>100—</span> <span class='ocrx_word' id='word_1_73' title='bbox 385 522 405 545; x_wconf 95' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_74' title='bbox 418 522 582 551; x_wconf 89' lang='eng' dir='ltr'>maltophilum</span> <span class='ocrx_word' id='word_1_75' title='bbox 591 522 674 545; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_76' title='bbox 685 522 781 545; x_wconf 80' lang='eng' dir='ltr'>51939T</span> <span class='ocrx_word' id='word_1_77' title='bbox 791 522 915 551; x_wconf 92' lang='eng' dir='ltr'>(X87140)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 28 559 1196 773">
+     <span class='ocr_line' id='line_1_14' title="bbox 115 559 938 588; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 115 568 343 585; x_wconf 76' lang='eng'>99—</span> <span class='ocrx_word' id='word_1_79' title='bbox 356 559 376 582; x_wconf 93' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_80' title='bbox 389 559 529 582; x_wconf 87' lang='eng' dir='ltr'>berlinense</span> <span class='ocrx_word' id='word_1_81' title='bbox 538 559 621 582; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_82' title='bbox 633 559 766 582; x_wconf 77' lang='eng' dir='ltr'>BAA-909T</span> <span class='ocrx_word' id='word_1_83' title='bbox 776 559 938 588; x_wconf 88' lang='eng' dir='ltr'>(AY230217)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 43 596 949 626; baseline 0.001 -7"><span class='ocrx_word' id='word_1_84' title='bbox 43 596 67 613; x_wconf 87' lang='eng'>40</span> <span class='ocrx_word' id='word_1_85' title='bbox 145 606 352 608; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_86' title='bbox 364 596 385 619; x_wconf 94' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_87' title='bbox 396 596 580 625; x_wconf 83' lang='eng' dir='ltr'>pectinovorum</span> <span class='ocrx_word' id='word_1_88' title='bbox 589 596 672 620; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_89' title='bbox 683 596 779 620; x_wconf 80' lang='eng' dir='ltr'>33768T</span> <span class='ocrx_word' id='word_1_90' title='bbox 789 596 949 626; x_wconf 86' lang='eng' dir='ltr'>(AF302940)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 602 633 1186 663; baseline 0 -7"><span class='ocrx_word' id='word_1_91' title='bbox 602 634 623 656; x_wconf 96' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_92' title='bbox 635 634 849 662; x_wconf 84' lang='eng' dir='ltr'>saccharophilum</span> <span class='ocrx_word' id='word_1_93' title='bbox 858 633 940 656; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_94' title='bbox 950 633 1048 656; x_wconf 80' lang='eng' dir='ltr'>43261T</span> <span class='ocrx_word' id='word_1_95' title='bbox 1058 633 1186 663; x_wconf 85' lang='eng' dir='ltr'>(M71238)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 28 670 939 704; baseline 0 -11"><span class='ocrx_word' id='word_1_96' title='bbox 28 687 52 704; x_wconf 61' lang='eng'>,9</span> <span class='ocrx_word' id='word_1_97' title='bbox 87 680 458 682; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_98' title='bbox 470 671 491 693; x_wconf 95' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_99' title='bbox 503 671 602 699; x_wconf 81' lang='eng' dir='ltr'>bryantii</span> <span class='ocrx_word' id='word_1_100' title='bbox 610 670 692 693; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_101' title='bbox 703 670 799 693; x_wconf 84' lang='eng' dir='ltr'>33254T</span> <span class='ocrx_word' id='word_1_102' title='bbox 809 670 939 699; x_wconf 87' lang='eng' dir='ltr'>(M57737)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 115 707 972 736; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 115 716 393 733; x_wconf 80' lang='eng'>51—</span> <span class='ocrx_word' id='word_1_104' title='bbox 405 708 426 730; x_wconf 96' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_105' title='bbox 437 708 563 736; x_wconf 88' lang='eng' dir='ltr'><em>porcinum</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 572 707 655 730; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_107' title='bbox 667 707 800 730; x_wconf 82' lang='eng' dir='ltr'>BAA-908T</span> <span class='ocrx_word' id='word_1_108' title='bbox 810 707 972 736; x_wconf 90' lang='eng' dir='ltr'>(AY518274)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 58 744 1196 773; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 58 744 78 760; x_wconf 77' lang='eng'>51</span> <span class='ocrx_word' id='word_1_110' title='bbox 145 754 623 756; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_111' title='bbox 635 745 656 767; x_wconf 94' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_112' title='bbox 668 744 859 767; x_wconf 86' lang='eng' dir='ltr'>succinifaciens</span> <span class='ocrx_word' id='word_1_113' title='bbox 867 744 950 767; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_114' title='bbox 961 744 1057 767; x_wconf 83' lang='eng' dir='ltr'>33096T</span> <span class='ocrx_word' id='word_1_115' title='bbox 1067 744 1196 773; x_wconf 89' lang='eng' dir='ltr'>(M57738)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 83 781 1015 851">
+     <span class='ocr_line' id='line_1_20' title="bbox 83 781 1015 810; baseline 0 -6"><span class='ocrx_word' id='word_1_116' title='bbox 83 792 106 809; x_wconf 74' lang='eng'>59</span> <span class='ocrx_word' id='word_1_117' title='bbox 151 791 455 793; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_118' title='bbox 467 782 488 804; x_wconf 95' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_119' title='bbox 500 782 666 810; x_wconf 85' lang='eng' dir='ltr'><em>amylovorum</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 674 781 757 804; x_wconf 94' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_121' title='bbox 768 781 882 804; x_wconf 78' lang='eng' dir='ltr'>700288T</span> <span class='ocrx_word' id='word_1_122' title='bbox 892 781 1015 810; x_wconf 88' lang='eng' dir='ltr'>(Y09959)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 122 818 950 851; baseline 0 -10"><span class='ocrx_word' id='word_1_123' title='bbox 122 828 418 851; x_wconf 67' lang='eng'>65_—</span> <span class='ocrx_word' id='word_1_124' title='bbox 430 819 451 841; x_wconf 95' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_125' title='bbox 462 824 564 847; x_wconf 87' lang='eng' dir='ltr'><em>parvum</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 572 818 655 841; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_127' title='bbox 666 818 779 841; x_wconf 85' lang='eng' dir='ltr'>700770T</span> <span class='ocrx_word' id='word_1_128' title='bbox 789 818 950 847; x_wconf 84' lang='eng' dir='ltr'>(AF302938)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 162 855 1240 922">
+     <span class='ocr_line' id='line_1_22' title="bbox 162 855 1233 884; baseline 0 -6"><span class='ocrx_word' id='word_1_129' title='bbox 162 865 610 867; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_130' title='bbox 622 856 642 878; x_wconf 95' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_131' title='bbox 655 856 792 878; x_wconf 83' lang='eng' dir='ltr'>socranskii</span> <span class='ocrx_word' id='word_1_132' title='bbox 800 856 887 884; x_wconf 90' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_133' title='bbox 899 856 1036 878; x_wconf 85' lang='eng' dir='ltr'>socranskii</span> <span class='ocrx_word' id='word_1_134' title='bbox 1043 855 1126 878; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_135' title='bbox 1137 855 1233 878; x_wconf 83' lang='eng' dir='ltr'>35536T</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 1081 892 1240 922; baseline 0 -7"><span class='ocrx_word' id='word_1_136' title='bbox 1081 892 1240 922; x_wconf 84' lang='eng' dir='ltr'>(AF033306)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 34 4 907 127">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 34 4 907 127">
+     <span class='ocr_line' id='line_1_24' title="bbox 34 4 905 48; baseline 0 -21"><span class='ocrx_word' id='word_1_137' title='bbox 34 28 47 48; x_wconf 73' lang='eng'>0</span> <span class='ocrx_word' id='word_1_138' title='bbox 57 28 85 48; x_wconf 73' lang='eng'>02</span> <span class='ocrx_word' id='word_1_139' title='bbox 493 5 515 27; x_wconf 97' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_140' title='bbox 525 5 606 33; x_wconf 86' lang='eng' dir='ltr'>pedis</span> <span class='ocrx_word' id='word_1_141' title='bbox 614 4 735 27; x_wconf 80' lang='eng' dir='ltr'>T35523T</span> <span class='ocrx_word' id='word_1_142' title='bbox 745 5 905 34; x_wconf 90' lang='eng' dir='ltr'>(EF061268)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 51 14 907 127; baseline 0 -60"><span class='ocrx_word' id='word_1_143' title='bbox 51 45 54 48; x_wconf 81' lang='eng'>&#39;</span> <span class='ocrx_word' id='word_1_144' title='bbox 359 14 483 127; x_wconf 35' lang='eng' dir='ltr'>A“</span> <span class='ocrx_word' id='word_1_145' title='bbox 495 44 516 67; x_wconf 87' lang='eng' dir='ltr'>T.</span> <span class='ocrx_word' id='word_1_146' title='bbox 527 44 607 73; x_wconf 88' lang='eng' dir='ltr'>pedis</span> <span class='ocrx_word' id='word_1_147' title='bbox 616 44 734 67; x_wconf 82' lang='eng' dir='ltr'><strong>GS19CB</strong></span> <span class='ocrx_word' id='word_1_148' title='bbox 746 42 907 74; x_wconf 88' lang='eng' dir='ltr'>(EF061269)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 254 116 359 118">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 254 116 359 118">
+     <span class='ocr_line' id='line_1_26' title="bbox 254 116 359 118; baseline 0 808"><span class='ocrx_word' id='word_1_149' title='bbox 254 116 359 118; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 357 51 359 182">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 357 51 359 182">
+     <span class='ocr_line' id='line_1_27' title="bbox 357 51 359 182; baseline 0 744"><span class='ocrx_word' id='word_1_150' title='bbox 357 51 359 182; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 357 180 399 182">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 357 180 399 182">
+     <span class='ocr_line' id='line_1_28' title="bbox 357 180 399 182; baseline 0 744"><span class='ocrx_word' id='word_1_151' title='bbox 357 180 399 182; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 397 162 399 200">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 397 162 399 200">
+     <span class='ocr_line' id='line_1_29' title="bbox 397 162 399 200; baseline 0 726"><span class='ocrx_word' id='word_1_152' title='bbox 397 162 399 200; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 254 116 256 238">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 254 116 256 238">
+     <span class='ocr_line' id='line_1_30' title="bbox 254 116 256 238; baseline 0 688"><span class='ocrx_word' id='word_1_153' title='bbox 254 116 256 238; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 204 233 456 235">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 204 233 456 235">
+     <span class='ocr_line' id='line_1_31' title="bbox 204 233 456 235; baseline 0 691"><span class='ocrx_word' id='word_1_154' title='bbox 204 233 456 235; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 465 273 578 275">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 465 273 578 275">
+     <span class='ocr_line' id='line_1_32' title="bbox 465 273 578 275; baseline 0 651"><span class='ocrx_word' id='word_1_155' title='bbox 465 273 578 275; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 229 176 230 293">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 229 176 230 293">
+     <span class='ocr_line' id='line_1_33' title="bbox 229 176 230 293; baseline 0 633"><span class='ocrx_word' id='word_1_156' title='bbox 229 176 230 293; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 228 291 465 293">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 228 291 465 293">
+     <span class='ocr_line' id='line_1_34' title="bbox 228 291 465 293; baseline 0 633"><span class='ocrx_word' id='word_1_157' title='bbox 228 291 465 293; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 463 273 465 312">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 463 273 465 312">
+     <span class='ocr_line' id='line_1_35' title="bbox 463 273 465 312; baseline 0 614"><span class='ocrx_word' id='word_1_158' title='bbox 463 273 465 312; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 204 233 205 367">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 204 233 205 367">
+     <span class='ocr_line' id='line_1_36' title="bbox 204 233 205 367; baseline 0 559"><span class='ocrx_word' id='word_1_159' title='bbox 204 233 205 367; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 16 360 158 362">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 16 360 158 362">
+     <span class='ocr_line' id='line_1_37' title="bbox 16 360 158 362; baseline 0 564"><span class='ocrx_word' id='word_1_160' title='bbox 16 360 158 362; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 204 366 443 367">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 204 366 443 367">
+     <span class='ocr_line' id='line_1_38' title="bbox 204 366 443 367; baseline 0 559"><span class='ocrx_word' id='word_1_161' title='bbox 204 366 443 367; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 441 347 443 386">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 441 347 443 386">
+     <span class='ocr_line' id='line_1_39' title="bbox 441 347 443 386; baseline 0 540"><span class='ocrx_word' id='word_1_162' title='bbox 441 347 443 386; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 156 301 158 423">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 156 301 158 423">
+     <span class='ocr_line' id='line_1_40' title="bbox 156 301 158 423; baseline 0 503"><span class='ocrx_word' id='word_1_163' title='bbox 156 301 158 423; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 16 360 18 487">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 16 360 18 487">
+     <span class='ocr_line' id='line_1_41' title="bbox 16 360 18 487; baseline 0 439"><span class='ocrx_word' id='word_1_164' title='bbox 16 360 18 487; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 16 486 54 487">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 16 486 54 487">
+     <span class='ocr_line' id='line_1_42' title="bbox 16 486 54 487; baseline 0 439"><span class='ocrx_word' id='word_1_165' title='bbox 16 486 54 487; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 52 458 54 515">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 52 458 54 515">
+     <span class='ocr_line' id='line_1_43' title="bbox 52 458 54 515; baseline 0 411"><span class='ocrx_word' id='word_1_166' title='bbox 52 458 54 515; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 282 495 373 497">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 282 495 373 497">
+     <span class='ocr_line' id='line_1_44' title="bbox 282 495 373 497; baseline 0 429"><span class='ocrx_word' id='word_1_167' title='bbox 282 495 373 497; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 52 513 282 515">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 52 513 282 515">
+     <span class='ocr_line' id='line_1_45' title="bbox 52 513 282 515; baseline 0 411"><span class='ocrx_word' id='word_1_168' title='bbox 52 513 282 515; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 280 495 282 534">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 280 495 282 534">
+     <span class='ocr_line' id='line_1_46' title="bbox 280 495 282 534; baseline 0 392"><span class='ocrx_word' id='word_1_169' title='bbox 280 495 282 534; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 56 615 73 617">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 56 615 73 617">
+     <span class='ocr_line' id='line_1_47' title="bbox 56 615 73 617; baseline 0 309"><span class='ocrx_word' id='word_1_170' title='bbox 56 615 73 617; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 71 587 73 645">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 71 587 73 645">
+     <span class='ocr_line' id='line_1_48' title="bbox 71 587 73 645; baseline 0 281"><span class='ocrx_word' id='word_1_171' title='bbox 71 587 73 645; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 71 643 590 645">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 71 643 590 645">
+     <span class='ocr_line' id='line_1_49' title="bbox 71 643 590 645; baseline 0 281"><span class='ocrx_word' id='word_1_172' title='bbox 71 643 590 645; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 56 615 58 730">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 56 615 58 730">
+     <span class='ocr_line' id='line_1_50' title="bbox 56 615 58 730; baseline 0 196"><span class='ocrx_word' id='word_1_173' title='bbox 56 615 58 730; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 56 729 87 730">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 56 729 87 730">
+     <span class='ocr_line' id='line_1_51' title="bbox 56 729 87 730; baseline 0 196"><span class='ocrx_word' id='word_1_174' title='bbox 56 729 87 730; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 110 736 145 737">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 110 736 145 737">
+     <span class='ocr_line' id='line_1_52' title="bbox 110 736 145 737; baseline 0 189"><span class='ocrx_word' id='word_1_175' title='bbox 110 736 145 737; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 143 569 145 756">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 143 569 145 756">
+     <span class='ocr_line' id='line_1_53' title="bbox 143 569 145 756; baseline 0 170"><span class='ocrx_word' id='word_1_176' title='bbox 143 569 145 756; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 85 680 87 779">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 85 680 87 779">
+     <span class='ocr_line' id='line_1_54' title="bbox 85 680 87 779; baseline 0 147"><span class='ocrx_word' id='word_1_177' title='bbox 85 680 87 779; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 85 777 112 779">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 85 777 112 779">
+     <span class='ocr_line' id='line_1_55' title="bbox 85 777 112 779; baseline 0 147"><span class='ocrx_word' id='word_1_178' title='bbox 85 777 112 779; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 110 736 112 820">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 110 736 112 820">
+     <span class='ocr_line' id='line_1_56' title="bbox 110 736 112 820; baseline 0 106"><span class='ocrx_word' id='word_1_179' title='bbox 110 736 112 820; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 110 818 151 820">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 110 818 151 820">
+     <span class='ocr_line' id='line_1_57' title="bbox 110 818 151 820; baseline 0 106"><span class='ocrx_word' id='word_1_180' title='bbox 110 818 151 820; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 150 791 151 848">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 150 791 151 848">
+     <span class='ocr_line' id='line_1_58' title="bbox 150 791 151 848; baseline 0 78"><span class='ocrx_word' id='word_1_181' title='bbox 150 791 151 848; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 160 828 162 867">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 160 828 162 867">
+     <span class='ocr_line' id='line_1_59' title="bbox 160 828 162 867; baseline 0 59"><span class='ocrx_word' id='word_1_182' title='bbox 160 828 162 867; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-001.pbm.png
new file mode 100644
index 00000000..8c0d638e
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-001.pbm.png.hocr
new file mode 100644
index 00000000..8cd06ae9
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002287-0-001.pbm.png.hocr
@@ -0,0 +1,218 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002287-0-001.pbm.png"; bbox 0 0 1243 563; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 40 22 90 42">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 40 22 90 42">
+     <span class='ocr_line' id='line_1_1' title="bbox 40 22 90 42; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 40 22 90 42; x_wconf 90' lang='eng'><em>0.05</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 166 291 189 307">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 166 291 189 307">
+     <span class='ocr_line' id='line_1_2' title="bbox 166 291 189 307; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 166 291 189 307; x_wconf 90' lang='eng'><strong>44</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 225 171 249 187">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 225 171 249 187">
+     <span class='ocr_line' id='line_1_3' title="bbox 225 171 249 187; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 225 171 249 187; x_wconf 83' lang='eng'><strong>43</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 334 115 356 131">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 334 115 356 131">
+     <span class='ocr_line' id='line_1_4' title="bbox 334 115 356 131; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 334 115 356 131; x_wconf 88' lang='eng'><em>80</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 631 41 1045 72">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 631 41 1045 72">
+     <span class='ocr_line' id='line_1_5' title="bbox 631 41 1045 72; baseline 0 -6"><span class='ocrx_word' id='word_1_5' title='bbox 631 41 654 57; x_wconf 69' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 686 45 708 66; x_wconf 95' lang='eng' dir='ltr'><strong><em>T.</em></strong></span> <span class='ocrx_word' id='word_1_7' title='bbox 717 45 796 72; x_wconf 83' lang='eng' dir='ltr'><strong><em>pedis</em></strong></span> <span class='ocrx_word' id='word_1_8' title='bbox 804 44 876 67; x_wconf 79' lang='eng' dir='ltr'><em>T183</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 887 44 1045 72; x_wconf 86' lang='eng' dir='ltr'><em>(EU754824)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 603 77 1095 113">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 603 4 1095 113">
+     <span class='ocr_line' id='line_1_6' title="bbox 641 4 1091 95; baseline 0 -67"><span class='ocrx_word' id='word_1_10' title='bbox 641 6 708 95; x_wconf 37' lang='eng' dir='ltr'><em>sir.</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 718 6 796 34; x_wconf 88' lang='eng' dir='ltr'><em>pedis</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 805 6 919 28; x_wconf 82' lang='eng' dir='ltr'><em>GB19CB</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 931 4 1091 35; x_wconf 84' lang='eng' dir='ltr'><em>(EU754823)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 603 77 1095 113; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 603 77 637 93; x_wconf 62' lang='eng'><em>10°</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 697 85 718 107; x_wconf 90' lang='eng' dir='ltr'><strong><em>T.</em></strong></span> <span class='ocrx_word' id='word_1_16' title='bbox 728 85 806 113; x_wconf 90' lang='eng' dir='ltr'><em>pedis</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 815 85 932 107; x_wconf 80' lang='eng' dir='ltr'><em>T35523T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 939 85 1095 113; x_wconf 90' lang='eng' dir='ltr'><em>(EF061284)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 364 98 651 99">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 364 98 651 99">
+     <span class='ocr_line' id='line_1_8' title="bbox 364 98 651 99; baseline 0 464"><span class='ocrx_word' id='word_1_19' title='bbox 364 98 651 99; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 259 136 366 138">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 259 136 366 138">
+     <span class='ocr_line' id='line_1_9' title="bbox 259 136 366 138; baseline 0 425"><span class='ocrx_word' id='word_1_20' title='bbox 259 136 366 138; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 199 195 260 196">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 199 195 260 196">
+     <span class='ocr_line' id='line_1_10' title="bbox 199 195 260 196; baseline 0 367"><span class='ocrx_word' id='word_1_21' title='bbox 199 195 260 196; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 157 317 200 318">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 157 317 200 318">
+     <span class='ocr_line' id='line_1_11' title="bbox 157 317 200 318; baseline 0 245"><span class='ocrx_word' id='word_1_22' title='bbox 157 317 200 318; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 6 408 158 410">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 6 408 158 410">
+     <span class='ocr_line' id='line_1_12' title="bbox 6 408 158 410; baseline 0 153"><span class='ocrx_word' id='word_1_23' title='bbox 6 408 158 410; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 6 408 7 542">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 6 408 7 542">
+     <span class='ocr_line' id='line_1_13' title="bbox 6 408 7 542; baseline 0 21"><span class='ocrx_word' id='word_1_24' title='bbox 6 408 7 542; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 157 317 158 500">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 157 317 158 500">
+     <span class='ocr_line' id='line_1_14' title="bbox 157 317 158 500; baseline 0 63"><span class='ocrx_word' id='word_1_25' title='bbox 157 317 158 500; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 199 195 201 440">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 199 195 201 440">
+     <span class='ocr_line' id='line_1_15' title="bbox 199 195 201 440; baseline 0 123"><span class='ocrx_word' id='word_1_26' title='bbox 199 195 201 440; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 259 136 260 254">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 259 136 260 254">
+     <span class='ocr_line' id='line_1_16' title="bbox 259 136 260 254; baseline 0 309"><span class='ocrx_word' id='word_1_27' title='bbox 259 136 260 254; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 364 98 366 176">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 364 98 366 176">
+     <span class='ocr_line' id='line_1_17' title="bbox 364 98 366 176; baseline 0 387"><span class='ocrx_word' id='word_1_28' title='bbox 364 98 366 176; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 650 63 651 135">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 650 63 651 135">
+     <span class='ocr_line' id='line_1_18' title="bbox 650 63 651 135; baseline 0 428"><span class='ocrx_word' id='word_1_29' title='bbox 650 63 651 135; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 506 125 1127 235">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 506 125 1127 235">
+     <span class='ocr_line' id='line_1_19' title="bbox 651 125 1052 153; baseline 0 -6"><span class='ocrx_word' id='word_1_30' title='bbox 651 133 667 135; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_31' title='bbox 680 125 701 147; x_wconf 88' lang='eng' dir='ltr'><em>T.</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 711 125 789 153; x_wconf 89' lang='eng' dir='ltr'><em>pedis</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 797 125 886 147; x_wconf 91' lang='eng' dir='ltr'><em>T354A</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 897 125 1052 153; x_wconf 87' lang='eng' dir='ltr'><em>(EF061283)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 633 166 1127 194; baseline 0.002 -6"><span class='ocrx_word' id='word_1_35' title='bbox 633 166 653 188; x_wconf 88' lang='eng' dir='ltr'><em>T.</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 665 166 783 188; x_wconf 81' lang='eng' dir='ltr'><em>denticola</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 792 166 873 189; x_wconf 95' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 883 166 960 189; x_wconf 85' lang='eng'>33521</span> <span class='ocrx_word' id='word_1_39' title='bbox 975 166 1127 194; x_wconf 89' lang='eng' dir='ltr'><em>(AJ277354)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 506 206 1011 235; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 506 207 525 228; x_wconf 88' lang='eng' dir='ltr'><em>T.</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 538 207 656 229; x_wconf 88' lang='eng' dir='ltr'><em>denticola</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 665 206 745 229; x_wconf 94' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 756 206 850 229; x_wconf 76' lang='eng' dir='ltr'><em>35405T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 859 207 1011 235; x_wconf 86' lang='eng' dir='ltr'><em>(AJ277353)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 259 253 585 254">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 259 253 585 254">
+     <span class='ocr_line' id='line_1_22' title="bbox 259 253 585 254; baseline 0 309"><span class='ocrx_word' id='word_1_45' title='bbox 259 253 585 254; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 291 215 293 292">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 291 215 293 292">
+     <span class='ocr_line' id='line_1_23' title="bbox 291 215 293 292; baseline 0 271"><span class='ocrx_word' id='word_1_46' title='bbox 291 215 293 292; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 291 291 344 292">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 291 291 344 292">
+     <span class='ocr_line' id='line_1_24' title="bbox 291 291 344 292; baseline 0 271"><span class='ocrx_word' id='word_1_47' title='bbox 291 291 344 292; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 342 256 344 329">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 342 256 344 329">
+     <span class='ocr_line' id='line_1_25' title="bbox 342 256 344 329; baseline 0 234"><span class='ocrx_word' id='word_1_48' title='bbox 342 256 344 329; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 312 308 334 324">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 312 308 334 324">
+     <span class='ocr_line' id='line_1_26' title="bbox 312 308 334 324; baseline 0 0"><span class='ocrx_word' id='word_1_49' title='bbox 312 308 334 324; x_wconf 78' lang='eng'><strong>84</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 549 247 1116 316">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 549 247 1116 316">
+     <span class='ocr_line' id='line_1_27' title="bbox 596 247 1051 276; baseline 0.002 -7"><span class='ocrx_word' id='word_1_50' title='bbox 596 247 625 269; x_wconf 88' lang='eng' dir='ltr'><em>‘T.</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 636 247 795 276; x_wconf 85' lang='eng' dir='ltr'><em>phagedenis’</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 808 247 889 269; x_wconf 88' lang='eng' dir='ltr'><em>Kazan</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 900 248 914 270; x_wconf 93' lang='eng'>5</span> <span class='ocrx_word' id='word_1_54' title='bbox 925 247 1051 276; x_wconf 88' lang='eng' dir='ltr'><em>(M94015)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 549 287 1116 316; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 549 296 592 298; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_56' title='bbox 604 288 624 310; x_wconf 94' lang='eng' dir='ltr'><strong><em>T.</em></strong></span> <span class='ocrx_word' id='word_1_57' title='bbox 636 288 741 310; x_wconf 86' lang='eng' dir='ltr'><em>medium</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 750 287 830 310; x_wconf 92' lang='eng' dir='ltr'><strong>ATCC</strong></span> <span class='ocrx_word' id='word_1_59' title='bbox 841 287 951 310; x_wconf 81' lang='eng' dir='ltr'><em>700293T</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 961 287 1116 316; x_wconf 89' lang='eng' dir='ltr'><em>(EF061285)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 342 327 549 329">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 342 327 549 329">
+     <span class='ocr_line' id='line_1_29' title="bbox 342 327 549 329; baseline 0 234"><span class='ocrx_word' id='word_1_61' title='bbox 342 327 549 329; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 373 455 407 471">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 373 455 407 471">
+     <span class='ocr_line' id='line_1_30' title="bbox 373 455 407 471; baseline 0 0"><span class='ocrx_word' id='word_1_62' title='bbox 373 455 407 471; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 415 419 416 461">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 415 419 416 461">
+     <span class='ocr_line' id='line_1_31' title="bbox 415 419 416 461; baseline 0 102"><span class='ocrx_word' id='word_1_63' title='bbox 415 419 416 461; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 547 296 549 359">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 547 296 549 359">
+     <span class='ocr_line' id='line_1_32' title="bbox 547 296 549 359; baseline 0 204"><span class='ocrx_word' id='word_1_64' title='bbox 547 296 549 359; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 506 328 1238 519">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 506 328 1238 519">
+     <span class='ocr_line' id='line_1_33' title="bbox 506 328 1107 379; baseline 0 -28"><span class='ocrx_word' id='word_1_65' title='bbox 506 343 540 360; x_wconf 66' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 549 337 595 379; x_wconf 36' lang='eng'><em>4|</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 605 329 634 351; x_wconf 85' lang='eng'><strong><em>‘7&#39;.</em></strong></span> <span class='ocrx_word' id='word_1_68' title='bbox 648 328 849 351; x_wconf 87' lang='eng' dir='ltr'><em>Vincentii’ATCC</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 860 329 940 351; x_wconf 88' lang='eng'>35580</span> <span class='ocrx_word' id='word_1_70' title='bbox 951 329 1107 357; x_wconf 89' lang='eng' dir='ltr'><em>(EF061286)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 563 369 1008 398; baseline 0.002 -8"><span class='ocrx_word' id='word_1_71' title='bbox 563 374 586 390; x_wconf 84' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 605 370 634 391; x_wconf 88' lang='eng' dir='ltr'><em>‘T.</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 648 370 762 392; x_wconf 84' lang='eng' dir='ltr'><em>Vincentii’</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 771 370 842 391; x_wconf 90' lang='eng' dir='ltr'><em>D2A2</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 853 369 1008 398; x_wconf 89' lang='eng' dir='ltr'><em>(EF061287)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 645 410 1160 438; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 645 410 665 432; x_wconf 98' lang='eng' dir='ltr'><strong><em>T.</em></strong></span> <span class='ocrx_word' id='word_1_77' title='bbox 677 410 837 438; x_wconf 87' lang='eng' dir='ltr'><em>maltophilum</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 846 410 926 432; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 937 410 1030 432; x_wconf 78' lang='eng' dir='ltr'><em>51939T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1040 410 1160 438; x_wconf 87' lang='eng' dir='ltr'><em>(Y18889)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 637 450 1238 479; baseline 0 -6"><span class='ocrx_word' id='word_1_81' title='bbox 637 451 657 472; x_wconf 94' lang='eng' dir='ltr'><strong><em>T.</em></strong></span> <span class='ocrx_word' id='word_1_82' title='bbox 669 451 871 479; x_wconf 86' lang='eng' dir='ltr'><em>lecithinolyticum</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 880 450 960 473; x_wconf 93' lang='eng' dir='ltr'><strong>ATCC</strong></span> <span class='ocrx_word' id='word_1_84' title='bbox 971 450 1238 479; x_wconf 79' lang='eng' dir='ltr'><em>700332T(AJ277358)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 628 491 1154 519; baseline 0.002 -6"><span class='ocrx_word' id='word_1_85' title='bbox 628 491 648 513; x_wconf 97' lang='eng' dir='ltr'><em>T.</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 659 491 770 519; x_wconf 87' lang='eng' dir='ltr'><em>pallidum</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 780 491 865 519; x_wconf 85' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 875 491 986 519; x_wconf 89' lang='eng' dir='ltr'><em>pallidum</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 997 491 1154 519; x_wconf 89' lang='eng' dir='ltr'><em>(AE000520)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 6 540 684 542">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 6 540 684 542">
+     <span class='ocr_line' id='line_1_38' title="bbox 6 540 684 542; baseline 0 21"><span class='ocrx_word' id='word_1_90' title='bbox 6 540 684 542; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 696 532 1208 560">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 696 532 1208 560">
+     <span class='ocr_line' id='line_1_39' title="bbox 696 532 1208 560; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 696 532 819 560; x_wconf 84' lang='eng' dir='ltr'><em>Serpulina</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 829 532 1030 560; x_wconf 84' lang='eng' dir='ltr'><em>hyodysenteriae</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 1041 532 1077 554; x_wconf 79' lang='eng' dir='ltr'><em>CS</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1088 532 1208 560; x_wconf 86' lang='eng' dir='ltr'><em>(X63513)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002295-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002295-0-001.pbm.png
new file mode 100644
index 00000000..fd861437
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002295-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002295-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002295-0-001.pbm.png.hocr
new file mode 100644
index 00000000..4d04c0b6
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002295-0-001.pbm.png.hocr
@@ -0,0 +1,79 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002295-0-001.pbm.png"; bbox 0 0 994 470; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 110 7 155 25">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 110 7 155 25">
+     <span class='ocr_line' id='line_1_1' title="bbox 110 7 155 25; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 110 7 155 25; x_wconf 67' lang='eng'><em>0,02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 6 34 260 45">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 6 34 260 45">
+     <span class='ocr_line' id='line_1_2' title="bbox 6 34 260 45; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 6 34 260 45; x_wconf 68' lang='eng' dir='ltr'><em>D—I</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 132 68 991 307">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 135 68 947 102">
+     <span class='ocr_line' id='line_1_3' title="bbox 135 68 947 102; baseline -0.001 -11"><span class='ocrx_word' id='word_1_3' title='bbox 135 84 160 102; x_wconf 73' lang='eng'><em>73</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 183 70 205 91; x_wconf 93' lang='eng' dir='ltr'><em>C.</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 218 70 386 91; x_wconf 77' lang='eng' dir='ltr'><em>esten‘heticum</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 396 70 475 96; x_wconf 82' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 487 70 624 91; x_wconf 87' lang='eng' dir='ltr'><em>Iaramiense</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 635 70 693 91; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 706 68 794 91; x_wconf 75' lang='eng' dir='ltr'><em>14884T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 804 70 947 96; x_wconf 86' lang='eng' dir='ltr'><em>(AJ506115)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 132 120 991 201">
+     <span class='ocr_line' id='line_1_4' title="bbox 132 120 991 149; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 132 124 158 142; x_wconf 84' lang='eng'><em>65</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 181 122 203 143; x_wconf 19' lang='eng' dir='ltr'>C1</span> <span class='ocrx_word' id='word_1_13' title='bbox 216 122 384 143; x_wconf 71' lang='eng' dir='ltr'><em>estertheticum</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 394 122 473 149; x_wconf 26' lang='eng' dir='ltr'><em>subsp‘</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 485 122 669 143; x_wconf 70' lang='eng' dir='ltr'><em>estherfheticum</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 680 122 768 143; x_wconf 86' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 780 120 867 143; x_wconf 85' lang='eng' dir='ltr'><em>12511T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 877 122 991 149; x_wconf 87' lang='eng' dir='ltr'><em>(X68181)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 215 173 656 201; baseline 0.002 -6"><span class='ocrx_word' id='word_1_19' title='bbox 215 175 238 196; x_wconf 92' lang='eng' dir='ltr'><em>C.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 250 175 334 201; x_wconf 85' lang='eng' dir='ltr'><em>frigoris</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 344 175 402 196; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 415 173 503 196; x_wconf 89' lang='eng' dir='ltr'><em>14204T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 513 175 656 201; x_wconf 85' lang='eng' dir='ltr'><em>(AJ506116)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 194 225 752 254">
+     <span class='ocr_line' id='line_1_6' title="bbox 194 225 752 254; baseline 0 -6"><span class='ocrx_word' id='word_1_24' title='bbox 194 227 217 248; x_wconf 91' lang='eng' dir='ltr'><em>C.</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 229 227 429 254; x_wconf 78' lang='eng' dir='ltr'><em>lacusflyxe/lense</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 439 227 498 248; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 511 225 598 248; x_wconf 89' lang='eng' dir='ltr'><em>14205T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 608 228 752 254; x_wconf 86' lang='eng' dir='ltr'><em>(AJ506118)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 185 280 653 307">
+     <span class='ocr_line' id='line_1_7' title="bbox 185 280 653 307; baseline 0 -6"><span class='ocrx_word' id='word_1_29' title='bbox 185 280 250 301; x_wconf 79' lang='eng' dir='ltr'><em>—‘C.</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 263 280 418 307; x_wconf 80' lang='eng' dir='ltr'><em>algoriphilum’</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 431 280 490 301; x_wconf 95' lang='eng' dir='ltr'>14D1</span> <span class='ocrx_word' id='word_1_32' title='bbox 505 280 653 307; x_wconf 89' lang='eng' dir='ltr'><em>(AY117755)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 2 119 210 453">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 2 119 210 453">
+     <span class='ocr_line' id='line_1_8' title="bbox 126 119 132 163; baseline 0 307"><span class='ocrx_word' id='word_1_33' title='bbox 126 119 132 163; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 2 163 210 268; baseline 0.005 -1"><span class='ocrx_word' id='word_1_34' title='bbox 2 163 210 268; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 2 268 185 320; baseline 0.016 -4"><span class='ocrx_word' id='word_1_35' title='bbox 2 268 185 320; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 2 320 166 453; baseline 0.006 -30"><span class='ocrx_word' id='word_1_36' title='bbox 2 320 166 453; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 183 289 185 370">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 183 289 185 370">
+     <span class='ocr_line' id='line_1_12' title="bbox 183 289 185 370; baseline 0 100"><span class='ocrx_word' id='word_1_37' title='bbox 183 289 185 370; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 139 331 731 465">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 139 331 731 465">
+     <span class='ocr_line' id='line_1_13' title="bbox 185 331 731 397; baseline 0 -43"><span class='ocrx_word' id='word_1_38' title='bbox 185 333 278 397; x_wconf 57' lang='eng' dir='ltr'><em>_‘——C.</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 291 333 410 354; x_wconf 82' lang='eng' dir='ltr'><em>bowmanii</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 419 333 477 354; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 490 331 578 354; x_wconf 86' lang='eng' dir='ltr'><em>14206T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 588 333 731 359; x_wconf 85' lang='eng' dir='ltr'><em>(AJ506120)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 166 374 617 412; baseline 0 -5"><span class='ocrx_word' id='word_1_43' title='bbox 166 374 192 392; x_wconf 67' lang='eng'>55</span> <span class='ocrx_word' id='word_1_44' title='bbox 280 386 357 407; x_wconf 83' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 367 386 430 406; x_wconf 91' lang='eng' dir='ltr'>A121</span> <span class='ocrx_word' id='word_1_46' title='bbox 439 384 450 398; x_wconf 76' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_47' title='bbox 463 386 617 412; x_wconf 78' lang='eng' dir='ltr'><em>(D0296031)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 139 437 665 465; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 139 438 162 459; x_wconf 93' lang='eng' dir='ltr'><em>C.</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 173 439 355 465; x_wconf 83' lang='eng' dir='ltr'><em>psychrophi/um</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 364 437 508 459; x_wconf 80' lang='eng' dir='ltr'><em>A-1/C-an/lT</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 522 439 665 465; x_wconf 82' lang='eng' dir='ltr'><em>(AJ297443)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002352-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002352-0-001.pbm.png
new file mode 100644
index 00000000..e4068b70
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002352-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002352-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002352-0-001.pbm.png.hocr
new file mode 100644
index 00000000..08b24bb8
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002352-0-001.pbm.png.hocr
@@ -0,0 +1,91 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002352-0-001.pbm.png"; bbox 0 0 1124 553; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 225 6 1034 188">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 225 6 1034 86">
+     <span class='ocr_line' id='line_1_1' title="bbox 498 6 1034 34; baseline 0.002 -6"><span class='ocrx_word' id='word_1_1' title='bbox 498 9 655 29; x_wconf 84' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 662 9 774 34; x_wconf 89' lang='eng' dir='ltr'><em>polymyxa</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 784 9 839 29; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 850 6 889 29; x_wconf 77' lang='eng' dir='ltr'><em>3ST</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 899 9 1034 34; x_wconf 85' lang='eng' dir='ltr'><em>(AJ320493)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 225 58 775 86; baseline 0 -6"><span class='ocrx_word' id='word_1_6' title='bbox 225 61 381 80; x_wconf 84' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 389 61 437 86; x_wconf 89' lang='eng' dir='ltr'><em>elgii</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 445 60 518 80; x_wconf 88' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 529 58 626 80; x_wconf 81' lang='eng' dir='ltr'><em>100335T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 636 60 775 86; x_wconf 87' lang='eng' dir='ltr'><em>(AY090110)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 267 109 916 188">
+     <span class='ocr_line' id='line_1_3' title="bbox 333 109 916 137; baseline -0.002 -5"><span class='ocrx_word' id='word_1_11' title='bbox 333 112 489 132; x_wconf 82' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 497 112 611 132; x_wconf 86' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 620 112 690 132; x_wconf 90' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 699 109 768 132; x_wconf 78' lang='eng' dir='ltr'><em>2393T</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 778 112 916 137; x_wconf 89' lang='eng' dir='ltr'><em>(AF130254)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 267 161 858 188; baseline 0 -5"><span class='ocrx_word' id='word_1_16' title='bbox 267 163 423 183; x_wconf 85' lang='eng' dir='ltr'><em>PaenibaciI/us</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 432 163 551 183; x_wconf 85' lang='eng' dir='ltr'><em>ehimensis</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 560 163 630 183; x_wconf 88' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 640 161 708 183; x_wconf 79' lang='eng' dir='ltr'><em>3748T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 718 163 858 188; x_wconf 87' lang='eng' dir='ltr'><em>(AY116665)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 250 212 853 289">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 250 212 853 289">
+     <span class='ocr_line' id='line_1_5' title="bbox 290 212 820 239; baseline 0 -5"><span class='ocrx_word' id='word_1_21' title='bbox 290 214 446 234; x_wconf 85' lang='eng' dir='ltr'><em>Paenibaci/Ius</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 455 214 495 234; x_wconf 89' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 503 214 573 234; x_wconf 87' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 585 212 666 234; x_wconf 85' lang='eng' dir='ltr'><em>13010T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 676 214 820 239; x_wconf 84' lang='eng' dir='ltr'><em>(DQ309072)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 250 261 853 289; baseline 0 -6"><span class='ocrx_word' id='word_1_26' title='bbox 250 263 406 283; x_wconf 79' lang='eng' dir='ltr'><em>Paenibaci/lus</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 415 263 546 288; x_wconf 85' lang='eng' dir='ltr'><em>chinjuensis</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 555 263 611 283; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 623 261 705 283; x_wconf 90' lang='eng' dir='ltr'><em>15045T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 714 263 853 289; x_wconf 86' lang='eng' dir='ltr'><em>(AF164345)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 0 23 490 540">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 0 23 490 540">
+     <span class='ocr_line' id='line_1_7' title="bbox 0 23 490 123; baseline 0 0"><span class='ocrx_word' id='word_1_31' title='bbox 0 23 490 123; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> <span class='ocrx_word' id='word_1_32' title='bbox 224 100 332 123; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 0 123 332 201; baseline 0.009 -53"><span class='ocrx_word' id='word_1_33' title='bbox 0 123 332 201; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 0 201 289 303; baseline 0 0"><span class='ocrx_word' id='word_1_34' title='bbox 0 201 289 303; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 31 303 352 358; baseline 0.006 -2"><span class='ocrx_word' id='word_1_35' title='bbox 31 303 352 358; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 46 358 351 409; baseline 0 144"><span class='ocrx_word' id='word_1_36' title='bbox 46 358 351 409; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 74 409 479 452; baseline 0 101"><span class='ocrx_word' id='word_1_37' title='bbox 74 409 479 452; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 74 452 458 540; baseline 0 0"><span class='ocrx_word' id='word_1_38' title='bbox 74 452 458 540; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 191 99 224 115">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 191 99 224 115">
+     <span class='ocr_line' id='line_1_14' title="bbox 191 99 224 115; baseline 0 0"><span class='ocrx_word' id='word_1_39' title='bbox 191 99 224 115; x_wconf 84' lang='eng'><em>000</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 354 316 863 344">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 354 316 863 344">
+     <span class='ocr_line' id='line_1_15' title="bbox 354 316 863 344; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 354 319 510 338; x_wconf 86' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 519 319 600 338; x_wconf 87' lang='eng' dir='ltr'><em>validus</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 610 318 665 338; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 676 316 745 338; x_wconf 87' lang='eng' dir='ltr'><em>3037T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 754 319 863 344; x_wconf 80' lang='eng'><em>(078320)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 351 369 1121 492">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 351 369 1121 492">
+     <span class='ocr_line' id='line_1_16' title="bbox 351 369 1048 396; baseline 0.001 -6"><span class='ocrx_word' id='word_1_45' title='bbox 351 371 507 391; x_wconf 84' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 515 371 741 396; x_wconf 84' lang='eng' dir='ltr'><em>naphthalenovorans</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 751 371 806 391; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 818 369 901 391; x_wconf 74' lang='eng' dir='ltr'><em>14203T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 910 371 1048 396; x_wconf 86' lang='eng' dir='ltr'><em>(AF353681)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 481 417 1121 445; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 481 420 637 439; x_wconf 84' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 645 420 803 444; x_wconf 87' lang='eng' dir='ltr'><em>ginsengihumi</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 810 419 881 439; x_wconf 92' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 892 417 974 439; x_wconf 84' lang='eng' dir='ltr'><em>13141T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 983 419 1121 445; x_wconf 85' lang='eng' dir='ltr'><em>(EF452662)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 458 465 946 492; baseline 0 -5"><span class='ocrx_word' id='word_1_55' title='bbox 458 467 627 487; x_wconf 87' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 635 467 701 492; x_wconf 90' lang='eng' dir='ltr'><em>pueri</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 709 465 795 487; x_wconf 81' lang='eng' dir='ltr'><em>b09i-3T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 804 467 889 492; x_wconf 88' lang='eng' dir='ltr'><em>(EU391</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 896 467 946 492; x_wconf 87' lang='eng'><em>156)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 73 517 939 550">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 73 517 939 550">
+     <span class='ocr_line' id='line_1_19' title="bbox 73 517 939 550; baseline -0.005 -1"><span class='ocrx_word' id='word_1_60' title='bbox 73 518 119 538; x_wconf 76' lang='eng'><em>0-01</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 361 534 404 550; x_wconf 68' lang='eng'><em>1000</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 409 517 441 549; x_wconf 65' lang='eng'><em>2&#39;</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 462 525 632 545; x_wconf 82' lang='eng' dir='ltr'><em>Paenibacillus</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 639 525 705 550; x_wconf 88' lang='eng' dir='ltr'><em>pueri</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 714 525 785 545; x_wconf 91' lang='eng' dir='ltr'><em>b13i-1</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 798 525 939 550; x_wconf 86' lang='eng' dir='ltr'><em>(EU391155)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 51 547 146 551">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 51 547 146 551">
+     <span class='ocr_line' id='line_1_20' title="bbox 51 547 146 551; baseline 0 2"><span class='ocrx_word' id='word_1_67' title='bbox 51 547 146 551; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002378-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002378-0-001.pbm.png
new file mode 100644
index 00000000..ae5109fa
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002378-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002378-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002378-0-001.pbm.png.hocr
new file mode 100644
index 00000000..919fb9de
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002378-0-001.pbm.png.hocr
@@ -0,0 +1,226 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002378-0-001.pbm.png"; bbox 0 0 2071 937; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 71 518 73 799">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 71 518 73 799">
+     <span class='ocr_line' id='line_1_1' title="bbox 71 518 73 799; baseline 0 138"><span class='ocrx_word' id='word_1_1' title='bbox 71 518 73 799; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 326 487 370 509">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 326 487 370 509">
+     <span class='ocr_line' id='line_1_2' title="bbox 326 487 370 509; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 326 487 370 509; x_wconf 95' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 407 309 409 485">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 407 309 409 485">
+     <span class='ocr_line' id='line_1_3' title="bbox 407 309 409 485; baseline 0 452"><span class='ocrx_word' id='word_1_3' title='bbox 407 309 409 485; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 409 467 995 504">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 409 467 995 504">
+     <span class='ocr_line' id='line_1_4' title="bbox 409 467 995 504; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 409 467 995 504; x_wconf 88' lang='eng'>—|:</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 498 454 733 545">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 498 454 733 545">
+     <span class='ocr_line' id='line_1_5' title="bbox 498 454 529 475; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 498 454 529 475; x_wconf 87' lang='eng'>83</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 702 523 733 545; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 702 523 733 545; x_wconf 86' lang='eng'>68</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 598 562 642 583">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 598 562 642 583">
+     <span class='ocr_line' id='line_1_7' title="bbox 598 562 642 583; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 598 562 642 583; x_wconf 92' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 595 766 640 788">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 595 766 640 788">
+     <span class='ocr_line' id='line_1_8' title="bbox 595 766 640 788; baseline 0.022 -1"><span class='ocrx_word' id='word_1_8' title='bbox 595 766 640 788; x_wconf 93' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 924 8 2069 559">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 924 8 2069 559">
+     <span class='ocr_line' id='line_1_9' title="bbox 1176 8 1795 36; baseline 0 -6"><span class='ocrx_word' id='word_1_9' title='bbox 1176 8 1303 30; x_wconf 84' lang='eng' dir='ltr'>Gemmata</span> <span class='ocrx_word' id='word_1_10' title='bbox 1314 8 1496 36; x_wconf 86' lang='eng' dir='ltr'>obscurig/obus</span> <span class='ocrx_word' id='word_1_11' title='bbox 1507 8 1568 30; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_12' title='bbox 1579 8 1659 33; x_wconf 73' lang='eng' dir='ltr'>5831T,</span> <span class='ocrx_word' id='word_1_13' title='bbox 1668 8 1795 30; x_wconf 88' lang='eng' dir='ltr'>AJ231191</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 1211 43 1792 68; baseline 0 -3"><span class='ocrx_word' id='word_1_14' title='bbox 1211 43 1393 65; x_wconf 85' lang='eng' dir='ltr'>Gemmata-Iike</span> <span class='ocrx_word' id='word_1_15' title='bbox 1403 43 1473 65; x_wconf 89' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_16' title='bbox 1485 43 1616 65; x_wconf 84' lang='eng' dir='ltr'>Schlesner</span> <span class='ocrx_word' id='word_1_17' title='bbox 1625 43 1680 68; x_wconf 86' lang='eng'>633,</span> <span class='ocrx_word' id='word_1_18' title='bbox 1691 43 1792 65; x_wconf 88' lang='eng' dir='ltr'>X81957</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 1157 78 1706 103; baseline 0.002 -4"><span class='ocrx_word' id='word_1_19' title='bbox 1157 78 1339 100; x_wconf 87' lang='eng' dir='ltr'>Gemmata-Iike</span> <span class='ocrx_word' id='word_1_20' title='bbox 1349 78 1419 100; x_wconf 89' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_21' title='bbox 1430 78 1561 103; x_wconf 90' lang='eng' dir='ltr'>JW11-2f5,</span> <span class='ocrx_word' id='word_1_22' title='bbox 1570 78 1706 100; x_wconf 87' lang='eng' dir='ltr'>AF239696</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 1189 112 1731 138; baseline 0.002 -4"><span class='ocrx_word' id='word_1_23' title='bbox 1189 112 1371 135; x_wconf 84' lang='eng' dir='ltr'>Gemmata—Iike</span> <span class='ocrx_word' id='word_1_24' title='bbox 1382 113 1451 135; x_wconf 86' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_25' title='bbox 1463 113 1585 138; x_wconf 87' lang='eng' dir='ltr'>JW3-8sO,</span> <span class='ocrx_word' id='word_1_26' title='bbox 1595 113 1731 135; x_wconf 84' lang='eng' dir='ltr'>AF239694</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 1189 147 1679 173; baseline 0 -4"><span class='ocrx_word' id='word_1_27' title='bbox 1189 147 1371 169; x_wconf 82' lang='eng' dir='ltr'>Gemmata—Iike</span> <span class='ocrx_word' id='word_1_28' title='bbox 1382 148 1451 169; x_wconf 80' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_29' title='bbox 1463 147 1533 173; x_wconf 75' lang='eng' dir='ltr'>Soil9,</span> <span class='ocrx_word' id='word_1_30' title='bbox 1543 148 1679 169; x_wconf 88' lang='eng' dir='ltr'>AF239698</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 1272 182 1807 208; baseline 0 -4"><span class='ocrx_word' id='word_1_31' title='bbox 1272 182 1454 204; x_wconf 86' lang='eng' dir='ltr'>Gemmata-Iike</span> <span class='ocrx_word' id='word_1_32' title='bbox 1465 182 1534 204; x_wconf 86' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_33' title='bbox 1546 182 1807 208; x_wconf 85' lang='eng' dir='ltr'>JW9—3f1,AF239697</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 1160 217 1668 245; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 1160 217 1342 239; x_wconf 86' lang='eng' dir='ltr'>Gemmata—Iike</span> <span class='ocrx_word' id='word_1_35' title='bbox 1352 217 1422 239; x_wconf 87' lang='eng' dir='ltr'>strain</span> <span class='ocrx_word' id='word_1_36' title='bbox 1434 217 1522 245; x_wconf 71' lang='eng' dir='ltr'>Cjuql4,</span> <span class='ocrx_word' id='word_1_37' title='bbox 1532 217 1668 239; x_wconf 87' lang='eng' dir='ltr'>AF239693</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 1186 252 1752 278; baseline 0 -4"><span class='ocrx_word' id='word_1_38' title='bbox 1186 252 1369 274; x_wconf 84' lang='eng' dir='ltr'>Gemmata—Iike</span> <span class='ocrx_word' id='word_1_39' title='bbox 1380 252 1463 274; x_wconf 89' lang='eng' dir='ltr'>isolate</span> <span class='ocrx_word' id='word_1_40' title='bbox 1473 252 1595 274; x_wconf 88' lang='eng' dir='ltr'>JW10—3f1</span> <span class='ocrx_word' id='word_1_41' title='bbox 1603 271 1606 278; x_wconf 86' lang='eng'>,</span> <span class='ocrx_word' id='word_1_42' title='bbox 1615 252 1752 274; x_wconf 86' lang='eng' dir='ltr'>AF239695</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 1195 277 1598 315; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 1195 281 1298 310; x_wconf 90' lang='eng' dir='ltr'>Strain</span> <span class='ocrx_word' id='word_1_44' title='bbox 1312 282 1352 309; x_wconf 94' lang='eng' dir='ltr'>A1</span> <span class='ocrx_word' id='word_1_45' title='bbox 1359 277 1404 315; x_wconf 78' lang='eng' dir='ltr'>OT,</span> <span class='ocrx_word' id='word_1_46' title='bbox 1417 282 1598 310; x_wconf 90' lang='eng' dir='ltr'>AM162406</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 1379 322 1930 350; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 1379 322 1524 350; x_wconf 87' lang='eng' dir='ltr'>Isosphaera</span> <span class='ocrx_word' id='word_1_48' title='bbox 1533 322 1619 350; x_wconf 89' lang='eng' dir='ltr'>pal/ida</span> <span class='ocrx_word' id='word_1_49' title='bbox 1630 322 1691 344; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_50' title='bbox 1702 322 1782 347; x_wconf 50' lang='eng'>96130,</span> <span class='ocrx_word' id='word_1_51' title='bbox 1800 322 1930 344; x_wconf 87' lang='eng' dir='ltr'>AJ231195</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 1386 357 1948 382; baseline 0 -3"><span class='ocrx_word' id='word_1_52' title='bbox 1386 357 1537 379; x_wconf 78' lang='eng' dir='ltr'>‘Nostocoida</span> <span class='ocrx_word' id='word_1_53' title='bbox 1548 357 1645 379; x_wconf 85' lang='eng' dir='ltr'>Iimico/a</span> <span class='ocrx_word' id='word_1_54' title='bbox 1657 357 1684 379; x_wconf 90' lang='eng'><strong><em>|||’</em></strong></span> <span class='ocrx_word' id='word_1_55' title='bbox 1695 357 1802 382; x_wconf 89' lang='eng' dir='ltr'>Ben220,</span> <span class='ocrx_word' id='word_1_56' title='bbox 1811 357 1948 379; x_wconf 92' lang='eng' dir='ltr'>AF244748</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 1360 392 1921 417; baseline 0 -3"><span class='ocrx_word' id='word_1_57' title='bbox 1360 392 1511 414; x_wconf 86' lang='eng' dir='ltr'>‘Nostocoida</span> <span class='ocrx_word' id='word_1_58' title='bbox 1521 392 1619 414; x_wconf 87' lang='eng' dir='ltr'>Iimico/a</span> <span class='ocrx_word' id='word_1_59' title='bbox 1630 392 1658 414; x_wconf 81' lang='eng'><strong><em>|||’</em></strong></span> <span class='ocrx_word' id='word_1_60' title='bbox 1669 392 1775 417; x_wconf 85' lang='eng' dir='ltr'>Ben223,</span> <span class='ocrx_word' id='word_1_61' title='bbox 1785 392 1921 414; x_wconf 87' lang='eng' dir='ltr'>AF244750</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 1148 426 2069 454; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 1148 432 1403 434; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_63' title='bbox 1417 426 1611 454; x_wconf 87' lang='eng' dir='ltr'>Singulisphaera</span> <span class='ocrx_word' id='word_1_64' title='bbox 1622 426 1744 454; x_wconf 85' lang='eng' dir='ltr'>acidiphila</span> <span class='ocrx_word' id='word_1_65' title='bbox 1755 427 1814 448; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_66' title='bbox 1826 426 1917 452; x_wconf 44' lang='eng'>186581</span> <span class='ocrx_word' id='word_1_67' title='bbox 1927 426 2069 448; x_wconf 88' lang='eng' dir='ltr'>AM850678</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 1024 461 1581 489; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 1024 462 1207 489; x_wconf 82' lang='eng' dir='ltr'>Blastopirellula</span> <span class='ocrx_word' id='word_1_69' title='bbox 1218 462 1307 483; x_wconf 87' lang='eng' dir='ltr'>marina</span> <span class='ocrx_word' id='word_1_70' title='bbox 1319 462 1379 483; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_71' title='bbox 1391 461 1470 487; x_wconf 49' lang='eng'>36451</span> <span class='ocrx_word' id='word_1_72' title='bbox 1482 462 1581 483; x_wconf 87' lang='eng' dir='ltr'>X62912</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 924 496 1397 524; baseline 0 -6"><span class='ocrx_word' id='word_1_73' title='bbox 924 496 1028 518; x_wconf 83' lang='eng' dir='ltr'>Pirel/u/a</span> <span class='ocrx_word' id='word_1_74' title='bbox 1039 496 1124 524; x_wconf 85' lang='eng' dir='ltr'>staleyi</span> <span class='ocrx_word' id='word_1_75' title='bbox 1133 497 1193 518; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_76' title='bbox 1204 496 1284 522; x_wconf 44' lang='eng'>60681</span> <span class='ocrx_word' id='word_1_77' title='bbox 1296 496 1397 518; x_wconf 86' lang='eng' dir='ltr'>X81946</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 1361 531 2049 559; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 1361 531 1513 553; x_wconf 87' lang='eng' dir='ltr'>Sch/esneria</span> <span class='ocrx_word' id='word_1_79' title='bbox 1522 531 1656 559; x_wconf 86' lang='eng' dir='ltr'>paludicola</span> <span class='ocrx_word' id='word_1_80' title='bbox 1665 531 1742 553; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_81' title='bbox 1753 531 2049 557; x_wconf 48' lang='eng' dir='ltr'>BAA-13931AM162407</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 409 9 1359 419">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 409 9 1359 419">
+     <span class='ocr_line' id='line_1_25' title="bbox 1048 9 1184 66; baseline 0 0"><span class='ocrx_word' id='word_1_82' title='bbox 1048 9 1184 66; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 911 80 1157 115; baseline 0 -29"><span class='ocrx_word' id='word_1_83' title='bbox 911 80 1157 115; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 763 115 1246 203; baseline 0 0"><span class='ocrx_word' id='word_1_84' title='bbox 763 115 1246 203; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 443 203 1160 259; baseline 0 -38"><span class='ocrx_word' id='word_1_85' title='bbox 443 203 1160 259; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 443 259 1053 291; baseline 0 646"><span class='ocrx_word' id='word_1_86' title='bbox 443 259 1053 291; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 409 291 1359 419; baseline 0 0"><span class='ocrx_word' id='word_1_87' title='bbox 409 291 1359 419; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 1087 48 1089 85">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 1087 48 1089 85">
+     <span class='ocr_line' id='line_1_31' title="bbox 1087 48 1089 85; baseline 0 852"><span class='ocrx_word' id='word_1_88' title='bbox 1087 48 1089 85; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 1000 70 1045 91">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 1000 70 1045 91">
+     <span class='ocr_line' id='line_1_32' title="bbox 1000 70 1045 91; baseline 0 0"><span class='ocrx_word' id='word_1_89' title='bbox 1000 70 1045 91; x_wconf 91' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 714 173 904 230">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 714 173 904 230">
+     <span class='ocr_line' id='line_1_33' title="bbox 874 173 904 194; baseline 0 0"><span class='ocrx_word' id='word_1_90' title='bbox 874 173 904 194; x_wconf 88' lang='eng'>98</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 714 209 759 230; baseline 0 0"><span class='ocrx_word' id='word_1_91' title='bbox 714 209 722 230; x_wconf 86' lang='eng'>1</span> <span class='ocrx_word' id='word_1_92' title='bbox 729 209 759 230; x_wconf 93' lang='eng'>00</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 1146 397 1148 434">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 1146 397 1148 434">
+     <span class='ocr_line' id='line_1_35' title="bbox 1146 397 1148 434; baseline 0 503"><span class='ocrx_word' id='word_1_93' title='bbox 1146 397 1148 434; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 649 553 742 555">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 649 553 742 555">
+     <span class='ocr_line' id='line_1_36' title="bbox 649 553 742 555; baseline 0 382"><span class='ocrx_word' id='word_1_94' title='bbox 649 553 742 555; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 740 537 742 573">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 740 537 742 573">
+     <span class='ocr_line' id='line_1_37' title="bbox 740 537 742 573; baseline 0 364"><span class='ocrx_word' id='word_1_95' title='bbox 740 537 742 573; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 741 536 1689 594">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 742 566 1689 594">
+     <span class='ocr_line' id='line_1_38' title="bbox 742 566 1689 594; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 742 571 1052 573; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_97' title='bbox 1080 566 1265 594; x_wconf 82' lang='eng' dir='ltr'>Planctomyces</span> <span class='ocrx_word' id='word_1_98' title='bbox 1274 566 1422 594; x_wconf 80' lang='eng' dir='ltr'>Iimnophilus</span> <span class='ocrx_word' id='word_1_99' title='bbox 1433 566 1494 588; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_100' title='bbox 1505 566 1585 592; x_wconf 73' lang='eng' dir='ltr'>3776T,</span> <span class='ocrx_word' id='word_1_101' title='bbox 1596 567 1689 588; x_wconf 86' lang='eng' dir='ltr'>X62911</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 649 553 651 625">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 649 553 651 625">
+     <span class='ocr_line' id='line_1_39' title="bbox 649 553 651 625; baseline 0 312"><span class='ocrx_word' id='word_1_102' title='bbox 649 553 651 625; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 651 595 1909 713">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 651 595 1909 713">
+     <span class='ocr_line' id='line_1_40' title="bbox 651 595 1909 644; baseline -0.002 -19"><span class='ocrx_word' id='word_1_103' title='bbox 651 595 1239 644; x_wconf 57' lang='eng'>—88[:</span> <span class='ocrx_word' id='word_1_104' title='bbox 1268 601 1453 629; x_wconf 80' lang='eng' dir='ltr'>Planctomyces</span> <span class='ocrx_word' id='word_1_105' title='bbox 1462 601 1609 623; x_wconf 86' lang='eng' dir='ltr'>bras/Iiensis</span> <span class='ocrx_word' id='word_1_106' title='bbox 1620 602 1680 623; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_107' title='bbox 1692 601 1771 627; x_wconf 39' lang='eng'>53053</span> <span class='ocrx_word' id='word_1_108' title='bbox 1781 602 1909 623; x_wconf 87' lang='eng' dir='ltr'>AJ231190</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 1209 635 1778 663; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 1209 635 1394 663; x_wconf 86' lang='eng' dir='ltr'>Planctomyces</span> <span class='ocrx_word' id='word_1_110' title='bbox 1403 635 1475 657; x_wconf 86' lang='eng' dir='ltr'>maris</span> <span class='ocrx_word' id='word_1_111' title='bbox 1486 635 1546 657; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_112' title='bbox 1558 635 1638 661; x_wconf 64' lang='eng' dir='ltr'>879W,</span> <span class='ocrx_word' id='word_1_113' title='bbox 1647 635 1778 657; x_wconf 89' lang='eng' dir='ltr'>AJ231184</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 767 665 1576 713; baseline -0.002 -18"><span class='ocrx_word' id='word_1_114' title='bbox 767 665 1081 713; x_wconf 49' lang='eng' dir='ltr'>iﬂandidatus</span> <span class='ocrx_word' id='word_1_115' title='bbox 1091 671 1205 693; x_wconf 87' lang='eng' dir='ltr'>Brocadia</span> <span class='ocrx_word' id='word_1_116' title='bbox 1216 671 1430 697; x_wconf 82' lang='eng' dir='ltr'>anammoxidans’,</span> <span class='ocrx_word' id='word_1_117' title='bbox 1439 671 1576 693; x_wconf 84' lang='eng' dir='ltr'>AF375994</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 730 706 1666 769">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 730 699 1666 769">
+     <span class='ocr_line' id='line_1_43' title="bbox 730 699 1518 734; baseline 0 -6"><span class='ocrx_word' id='word_1_118' title='bbox 730 699 760 720; x_wconf 82' lang='eng'>83</span> <span class='ocrx_word' id='word_1_119' title='bbox 975 706 1129 728; x_wconf 84' lang='eng' dir='ltr'>&#39;Candidatus</span> <span class='ocrx_word' id='word_1_120' title='bbox 1140 706 1254 728; x_wconf 90' lang='eng' dir='ltr'>Brocadia</span> <span class='ocrx_word' id='word_1_121' title='bbox 1264 706 1364 734; x_wconf 85' lang='eng' dir='ltr'>fulgida’,</span> <span class='ocrx_word' id='word_1_122' title='bbox 1377 706 1518 729; x_wconf 87' lang='eng' dir='ltr'>DQ459989</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 941 741 1666 769; baseline -0.001 -6"><span class='ocrx_word' id='word_1_123' title='bbox 941 741 1097 763; x_wconf 85' lang='eng' dir='ltr'>‘Candidatus</span> <span class='ocrx_word' id='word_1_124' title='bbox 1104 741 1342 769; x_wconf 88' lang='eng' dir='ltr'>Anammoxoglobus</span> <span class='ocrx_word' id='word_1_125' title='bbox 1353 741 1515 768; x_wconf 83' lang='eng' dir='ltr'>propionicus‘,</span> <span class='ocrx_word' id='word_1_126' title='bbox 1529 741 1666 764; x_wconf 88' lang='eng' dir='ltr'>DQ317601</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 767 695 769 748">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 767 695 769 748">
+     <span class='ocr_line' id='line_1_45' title="bbox 767 695 769 748; baseline 0 189"><span class='ocrx_word' id='word_1_127' title='bbox 767 695 769 748; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 71 797 651 799">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 71 797 651 799">
+     <span class='ocr_line' id='line_1_46' title="bbox 71 797 651 799; baseline 0 138"><span class='ocrx_word' id='word_1_128' title='bbox 71 797 651 799; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 374 901 429 923">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 374 901 429 923">
+     <span class='ocr_line' id='line_1_47' title="bbox 374 901 429 923; baseline 0 0"><span class='ocrx_word' id='word_1_129' title='bbox 374 901 429 923; x_wconf 89' lang='eng'>0.10</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 651 727 1593 803">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 651 733 1593 803">
+     <span class='ocr_line' id='line_1_48' title="bbox 651 733 912 754; baseline 0 0"><span class='ocrx_word' id='word_1_130' title='bbox 651 733 681 754; x_wconf 89' lang='eng'>60</span> <span class='ocrx_word' id='word_1_131' title='bbox 769 746 912 748; x_wconf 92' lang='eng'><strong>—</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 952 775 1593 803; baseline 0 -5"><span class='ocrx_word' id='word_1_132' title='bbox 952 775 1108 798; x_wconf 79' lang='eng' dir='ltr'>‘Candidatus</span> <span class='ocrx_word' id='word_1_133' title='bbox 1118 776 1241 798; x_wconf 88' lang='eng' dir='ltr'>Kuenenia</span> <span class='ocrx_word' id='word_1_134' title='bbox 1251 775 1447 803; x_wconf 74' lang='eng' dir='ltr'>stuttganiensis’,</span> <span class='ocrx_word' id='word_1_135' title='bbox 1456 776 1593 798; x_wconf 85' lang='eng' dir='ltr'>AF375995</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 649 553 651 869">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 649 553 651 869">
+     <span class='ocr_line' id='line_1_50' title="bbox 649 553 651 869; baseline 0 68"><span class='ocrx_word' id='word_1_136' title='bbox 649 553 651 869; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 651 809 1714 888">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 804 809 1714 888">
+     <span class='ocr_line' id='line_1_51' title="bbox 987 809 1689 836; baseline 0.003 -6"><span class='ocrx_word' id='word_1_137' title='bbox 987 809 1031 830; x_wconf 93' lang='eng'>100</span> <span class='ocrx_word' id='word_1_138' title='bbox 1134 810 1290 832; x_wconf 83' lang='eng' dir='ltr'>‘Candidatus</span> <span class='ocrx_word' id='word_1_139' title='bbox 1300 810 1428 832; x_wconf 86' lang='eng' dir='ltr'>Scalindua</span> <span class='ocrx_word' id='word_1_140' title='bbox 1440 810 1543 836; x_wconf 79' lang='eng' dir='ltr'>brodae’,</span> <span class='ocrx_word' id='word_1_141' title='bbox 1553 811 1689 832; x_wconf 86' lang='eng' dir='ltr'>AY254883</span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 804 816 1714 888; baseline 0 -21"><span class='ocrx_word' id='word_1_142' title='bbox 804 838 834 860; x_wconf 85' lang='eng'>99</span> <span class='ocrx_word' id='word_1_143' title='bbox 1035 816 1118 888; x_wconf 69' lang='eng' dir='ltr'>E</span> <span class='ocrx_word' id='word_1_144' title='bbox 1148 845 1304 867; x_wconf 84' lang='eng' dir='ltr'>‘Candidatus</span> <span class='ocrx_word' id='word_1_145' title='bbox 1314 845 1442 867; x_wconf 88' lang='eng' dir='ltr'>Scalindua</span> <span class='ocrx_word' id='word_1_146' title='bbox 1453 845 1573 871; x_wconf 71' lang='eng' dir='ltr'>sorokinii’,</span> <span class='ocrx_word' id='word_1_147' title='bbox 1583 845 1714 867; x_wconf 89' lang='eng' dir='ltr'>AY257181</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 1175 880 1742 909">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 1175 880 1742 909">
+     <span class='ocr_line' id='line_1_53' title="bbox 1175 880 1742 909; baseline -0.002 -6"><span class='ocrx_word' id='word_1_148' title='bbox 1175 880 1331 903; x_wconf 76' lang='eng' dir='ltr'>‘Candidatus</span> <span class='ocrx_word' id='word_1_149' title='bbox 1340 880 1469 903; x_wconf 89' lang='eng' dir='ltr'>Scalindua</span> <span class='ocrx_word' id='word_1_150' title='bbox 1479 880 1595 909; x_wconf 87' lang='eng' dir='ltr'>wagneri’,</span> <span class='ocrx_word' id='word_1_151' title='bbox 1605 880 1742 903; x_wconf 90' lang='eng' dir='ltr'>AY254882</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002394-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002394-0-000.pbm.png
new file mode 100644
index 00000000..09fec912
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002394-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002394-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002394-0-000.pbm.png.hocr
new file mode 100644
index 00000000..74df47e3
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002394-0-000.pbm.png.hocr
@@ -0,0 +1,287 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002394-0-000.pbm.png"; bbox 0 0 1302 1001; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 76 825 78 866">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 76 825 78 866">
+     <span class='ocr_line' id='line_1_1' title="bbox 76 825 78 866; baseline 0 135"><span class='ocrx_word' id='word_1_1' title='bbox 76 825 78 866; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 116 48 160 66">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 116 48 160 66">
+     <span class='ocr_line' id='line_1_2' title="bbox 116 48 160 66; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 116 48 160 66; x_wconf 87' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 111 500 147 518">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 111 500 147 518">
+     <span class='ocr_line' id='line_1_3' title="bbox 111 500 147 518; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 111 500 147 518; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 0 516 543 982">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 0 516 543 982">
+     <span class='ocr_line' id='line_1_4' title="bbox 13 516 159 673; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 13 516 159 673; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 0 673 78 719; baseline 0 -15"><span class='ocrx_word' id='word_1_5' title='bbox 0 673 78 719; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 13 719 78 859; baseline 0 -32"><span class='ocrx_word' id='word_1_6' title='bbox 13 719 78 859; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 13 859 484 919; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 13 859 484 919; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 13 919 543 982; baseline 0 -45"><span class='ocrx_word' id='word_1_8' title='bbox 13 919 543 982; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 238 93 240 169">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 238 93 240 169">
+     <span class='ocr_line' id='line_1_9' title="bbox 238 93 240 169; baseline 0 832"><span class='ocrx_word' id='word_1_9' title='bbox 238 93 240 169; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 419 0 1302 223">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 419 0 1302 106">
+     <span class='ocr_line' id='line_1_10' title="bbox 500 0 1302 30; baseline -0.001 -6"><span class='ocrx_word' id='word_1_10' title='bbox 500 1 785 24; x_wconf 85' lang='eng' dir='ltr'><em>Pseudoxanthomonas</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 794 1 1003 30; x_wconf 83' lang='eng' dir='ltr'><em>broegbernensis</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1014 0 1137 24; x_wconf 89' lang='eng' dir='ltr'><em>B1616/1T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1147 1 1302 29; x_wconf 91' lang='eng' dir='ltr'>(AJ012231)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 499 39 1275 68; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 499 40 754 68; x_wconf 82' lang='eng' dir='ltr'><em>Stenotrophomonas</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 764 40 907 68; x_wconf 82' lang='eng' dir='ltr'><em>maltophilia</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 917 40 998 62; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1011 39 1104 62; x_wconf 82' lang='eng' dir='ltr'><em>13637T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1115 40 1275 68; x_wconf 85' lang='eng' dir='ltr'><em>(ABOO8509)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 419 78 1042 106; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 419 78 608 101; x_wconf 84' lang='eng' dir='ltr'><em>Xanthomonas</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 618 78 764 106; x_wconf 84' lang='eng' dir='ltr'><em>campestris</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 774 78 836 101; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 848 78 909 101; x_wconf 80' lang='eng' dir='ltr'><em>568T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 920 78 1042 106; x_wconf 88' lang='eng' dir='ltr'><em>(X95917)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 561 117 1088 146">
+     <span class='ocr_line' id='line_1_13' title="bbox 561 117 1088 146; baseline 0 -7"><span class='ocrx_word' id='word_1_24' title='bbox 561 117 651 146; x_wconf 87' lang='eng' dir='ltr'><em>Xylella</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 662 117 788 140; x_wconf 83' lang='eng' dir='ltr'><em>fastidiosa</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 800 117 919 140; x_wconf 88' lang='eng' dir='ltr'><em>PCE-FFT</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 930 117 1088 145; x_wconf 85' lang='eng' dir='ltr'>(AF192343)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 474 155 1131 184">
+     <span class='ocr_line' id='line_1_14' title="bbox 474 155 1131 184; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 474 156 666 178; x_wconf 88' lang='eng' dir='ltr'><em>Thermomonas</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 676 156 836 184; x_wconf 77' lang='eng' dir='ltr'><em>haemolytica</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 846 155 966 178; x_wconf 91' lang='eng' dir='ltr'><em>A50-7-3T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 976 156 1131 184; x_wconf 89' lang='eng' dir='ltr'><em>(AJ300185)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 476 194 1104 223">
+     <span class='ocr_line' id='line_1_15' title="bbox 476 194 1104 223; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 476 195 632 217; x_wconf 87' lang='eng' dir='ltr'><em>Luteimonas</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 642 195 764 223; x_wconf 82' lang='eng' dir='ltr'><em>composti</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 772 194 929 217; x_wconf 83' lang='eng' dir='ltr'><em>CC—YY255T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 939 195 1104 223; x_wconf 83' lang='eng' dir='ltr'>(DQB46687)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 236 7 557 133">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 236 7 557 133">
+     <span class='ocr_line' id='line_1_16' title="bbox 236 7 495 82; baseline 0 0"><span class='ocrx_word' id='word_1_36' title='bbox 236 7 495 82; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 236 82 557 133; baseline 0 0"><span class='ocrx_word' id='word_1_37' title='bbox 236 82 557 133; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 173 239 494 245">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 173 239 494 245">
+     <span class='ocr_line' id='line_1_18' title="bbox 173 239 494 245; baseline 0 756"><span class='ocrx_word' id='word_1_38' title='bbox 173 239 494 245; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 203 177 205 300">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 203 177 205 300">
+     <span class='ocr_line' id='line_1_19' title="bbox 203 177 205 300; baseline 0 701"><span class='ocrx_word' id='word_1_39' title='bbox 203 177 205 300; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 225 130 228 322">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 225 130 228 322">
+     <span class='ocr_line' id='line_1_20' title="bbox 225 130 228 322; baseline 0 679"><span class='ocrx_word' id='word_1_40' title='bbox 225 130 228 322; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 173 240 175 444">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 173 240 175 444">
+     <span class='ocr_line' id='line_1_21' title="bbox 173 240 175 444; baseline 0 557"><span class='ocrx_word' id='word_1_41' title='bbox 173 240 175 444; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 173 442 216 444">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 173 442 216 444">
+     <span class='ocr_line' id='line_1_22' title="bbox 173 442 216 444; baseline 0 557"><span class='ocrx_word' id='word_1_42' title='bbox 173 442 216 444; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 182 453 207 470">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 182 453 207 470">
+     <span class='ocr_line' id='line_1_23' title="bbox 182 453 207 470; baseline 0 0"><span class='ocrx_word' id='word_1_43' title='bbox 182 453 207 470; x_wconf 89' lang='eng'><em>85</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 214 379 216 505">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 214 379 216 505">
+     <span class='ocr_line' id='line_1_24' title="bbox 214 379 216 505; baseline 0 496"><span class='ocrx_word' id='word_1_44' title='bbox 214 379 216 505; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 226 457 245 459">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 226 457 245 459">
+     <span class='ocr_line' id='line_1_25' title="bbox 226 457 245 459; baseline 0 542"><span class='ocrx_word' id='word_1_45' title='bbox 226 457 245 459; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 243 437 245 478">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 243 437 245 478">
+     <span class='ocr_line' id='line_1_26' title="bbox 243 437 245 478; baseline 0 523"><span class='ocrx_word' id='word_1_46' title='bbox 243 437 245 478; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 225 130 228 551">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 225 130 228 551">
+     <span class='ocr_line' id='line_1_27' title="bbox 225 130 228 551; baseline 0 450"><span class='ocrx_word' id='word_1_47' title='bbox 225 130 228 551; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 151 341 153 706">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 151 341 153 706">
+     <span class='ocr_line' id='line_1_28' title="bbox 151 341 153 706; baseline 0 295"><span class='ocrx_word' id='word_1_48' title='bbox 151 341 153 706; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 153 698 216 731">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 153 698 216 731">
+     <span class='ocr_line' id='line_1_29' title="bbox 153 698 216 712; baseline 0 0"><span class='ocrx_word' id='word_1_49' title='bbox 153 698 216 712; x_wconf 73' lang='eng' dir='ltr'><em>—o</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 177 714 198 731; baseline 0 0"><span class='ocrx_word' id='word_1_50' title='bbox 177 714 198 731; x_wconf 85' lang='eng'>91</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 209 670 211 740">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 209 670 211 740">
+     <span class='ocr_line' id='line_1_31' title="bbox 209 670 211 740; baseline 0 261"><span class='ocrx_word' id='word_1_51' title='bbox 209 670 211 740; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 226 549 260 551">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 226 549 260 551">
+     <span class='ocr_line' id='line_1_32' title="bbox 226 549 260 551; baseline 0 450"><span class='ocrx_word' id='word_1_52' title='bbox 226 549 260 551; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 258 515 260 582">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 258 515 260 582">
+     <span class='ocr_line' id='line_1_33' title="bbox 258 515 260 582; baseline 0 419"><span class='ocrx_word' id='word_1_53' title='bbox 258 515 260 582; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 227 167 466 253">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 229 236 254 253">
+     <span class='ocr_line' id='line_1_34' title="bbox 229 236 254 253; baseline 0 0"><span class='ocrx_word' id='word_1_54' title='bbox 229 236 254 253; x_wconf 88' lang='eng'><em>68</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 245 437 347 439">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 245 437 347 439">
+     <span class='ocr_line' id='line_1_35' title="bbox 245 437 347 439; baseline 0 562"><span class='ocrx_word' id='word_1_55' title='bbox 245 437 347 439; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 258 553 332 633">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 258 553 332 633">
+     <span class='ocr_line' id='line_1_36' title="bbox 258 553 332 633; baseline 0 -23"><span class='ocrx_word' id='word_1_56' title='bbox 258 553 332 633; x_wconf 34' lang='eng' dir='ltr'><em>i</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 389 233 1124 379">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 505 233 1124 262">
+     <span class='ocr_line' id='line_1_37' title="bbox 505 233 1124 262; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 505 234 661 256; x_wconf 83' lang='eng' dir='ltr'><em>Luteimonas</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 671 234 783 262; x_wconf 79' lang='eng' dir='ltr'><em>mephitis</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 794 233 959 256; x_wconf 80' lang='eng' dir='ltr'><em>B1953/27.1T</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 969 234 1124 262; x_wconf 87' lang='eng' dir='ltr'>(AJ012228)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 389 272 1070 301">
+     <span class='ocr_line' id='line_1_38' title="bbox 389 272 1070 301; baseline 0 -6"><span class='ocrx_word' id='word_1_61' title='bbox 389 273 404 295; x_wconf 93' lang='eng' dir='ltr'><strong><em>L</em></strong></span> <span class='ocrx_word' id='word_1_62' title='bbox 405 273 540 301; x_wconf 82' lang='eng' dir='ltr'><em>ysobacter</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 547 273 703 295; x_wconf 87' lang='eng' dir='ltr'><em>brunescens</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 714 272 793 295; x_wconf 89' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 806 272 899 295; x_wconf 77' lang='eng' dir='ltr'><em>12130T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 910 273 1070 301; x_wconf 85' lang='eng' dir='ltr'>(AB161360)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 402 311 1081 379">
+     <span class='ocr_line' id='line_1_39' title="bbox 402 311 1081 340; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 402 312 566 340; x_wconf 87' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 572 312 753 340; x_wconf 85' lang='eng' dir='ltr'><em>panaciterrae</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 762 312 835 334; x_wconf 87' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 847 311 908 334; x_wconf 82' lang='eng' dir='ltr'><em>068T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 919 312 1081 340; x_wconf 87' lang='eng' dir='ltr'><em>(ABZ45359)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 433 350 1020 379; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 433 351 583 379; x_wconf 83' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 590 351 718 373; x_wconf 87' lang='eng' dir='ltr'><em>niabensis</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 728 350 844 373; x_wconf 81' lang='eng' dir='ltr'><em>GH34—4T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 855 351 1020 379; x_wconf 90' lang='eng' dir='ltr'>(DQ462461)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 216 357 1112 418">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 216 357 1112 418">
+     <span class='ocr_line' id='line_1_41' title="bbox 216 357 424 401; baseline 0 0"><span class='ocrx_word' id='word_1_76' title='bbox 216 357 424 401; x_wconf 68' lang='eng'><em>—95+:</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 416 388 1112 418; baseline -0.001 -6"><span class='ocrx_word' id='word_1_77' title='bbox 416 390 430 411; x_wconf 93' lang='eng' dir='ltr'><em>L</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 432 390 566 418; x_wconf 77' lang='eng' dir='ltr'><em>ysobacter</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 572 390 809 418; x_wconf 88' lang='eng' dir='ltr'><em>yangpyeongensis</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 819 388 936 412; x_wconf 78' lang='eng' dir='ltr'><em>GH19-3T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 947 389 1046 418; x_wconf 86' lang='eng' dir='ltr'>(DQ191</span> <span class='ocrx_word' id='word_1_82' title='bbox 1055 390 1112 418; x_wconf 88' lang='eng'>179)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 343 427 1032 573">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 343 427 1032 573">
+     <span class='ocr_line' id='line_1_43' title="bbox 357 427 1032 457; baseline -0.001 -6"><span class='ocrx_word' id='word_1_83' title='bbox 357 428 508 457; x_wconf 78' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 515 434 703 457; x_wconf 86' lang='eng' dir='ltr'><em>enzymogenes</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 714 428 777 451; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 788 427 867 451; x_wconf 89' lang='eng' dir='ltr'><em>2043T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 878 428 1032 456; x_wconf 86' lang='eng' dir='ltr'>(AJ298291)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 383 466 977 495; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 383 467 533 495; x_wconf 82' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 540 467 674 489; x_wconf 78' lang='eng' dir='ltr'><em>niastensis</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 684 466 801 489; x_wconf 89' lang='eng' dir='ltr'><em>GH41-7T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 812 467 977 495; x_wconf 87' lang='eng' dir='ltr'>(DQ462462)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 429 505 996 534; baseline 0 -6"><span class='ocrx_word' id='word_1_92' title='bbox 429 506 580 534; x_wconf 79' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 587 506 716 528; x_wconf 84' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 727 505 826 528; x_wconf 78' lang='eng' dir='ltr'><em>Dae16T</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 836 506 996 534; x_wconf 88' lang='eng' dir='ltr'>(AB166878)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 343 544 891 573; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 343 545 493 573; x_wconf 80' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 501 545 593 573; x_wconf 83' lang='eng' dir='ltr'><em>capsici</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 601 544 722 567; x_wconf 81' lang='eng' dir='ltr'><em>YCS194T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 733 545 891 573; x_wconf 89' lang='eng' dir='ltr'>(EF488749)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 278 583 1003 651">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 278 583 1003 651">
+     <span class='ocr_line' id='line_1_47' title="bbox 278 583 1003 613; baseline -0.001 -6"><span class='ocrx_word' id='word_1_100' title='bbox 278 592 302 610; x_wconf 85' lang='eng' dir='ltr'><em>oo</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 331 584 481 612; x_wconf 82' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 488 590 636 613; x_wconf 88' lang='eng' dir='ltr'><em>gummosus</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 646 584 726 607; x_wconf 91' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 739 583 832 607; x_wconf 80' lang='eng' dir='ltr'><em>12132T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 843 584 1003 612; x_wconf 89' lang='eng' dir='ltr'>(AB161361)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 283 622 986 651; baseline 0 -6"><span class='ocrx_word' id='word_1_106' title='bbox 283 622 307 639; x_wconf 85' lang='eng'><em>55</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 343 623 493 651; x_wconf 80' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 501 623 651 645; x_wconf 82' lang='eng' dir='ltr'><em>ant/bioticus</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 662 623 725 645; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 737 622 815 645; x_wconf 89' lang='eng' dir='ltr'><em>2044T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 826 623 986 651; x_wconf 86' lang='eng' dir='ltr'>(ABO19582)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 246 777 271 794">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 246 777 271 794">
+     <span class='ocr_line' id='line_1_49' title="bbox 246 777 271 794; baseline 0 0"><span class='ocrx_word' id='word_1_112' title='bbox 246 777 271 794; x_wconf 86' lang='eng'><em>69</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 243 944 295 991">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 243 944 295 991">
+     <span class='ocr_line' id='line_1_50' title="bbox 243 944 279 962; baseline 0.028 -1"><span class='ocrx_word' id='word_1_113' title='bbox 243 944 279 962; x_wconf 88' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 271 973 295 991; baseline 0.042 -1"><span class='ocrx_word' id='word_1_114' title='bbox 271 973 295 991; x_wconf 85' lang='eng'><em>76</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 343 661 963 690">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 343 661 963 690">
+     <span class='ocr_line' id='line_1_52' title="bbox 343 661 963 690; baseline 0 -6"><span class='ocrx_word' id='word_1_115' title='bbox 343 662 493 690; x_wconf 87' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 500 662 678 690; x_wconf 82' lang='eng' dir='ltr'><em>daejeonensis</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 688 661 788 684; x_wconf 88' lang='eng' dir='ltr'><em>GH1—9T</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 799 662 898 690; x_wconf 89' lang='eng' dir='ltr'>(DQ191</span> <span class='ocrx_word' id='word_1_119' title='bbox 907 662 963 690; x_wconf 90' lang='eng'>178)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 211 700 1079 788">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 211 700 1079 788">
+     <span class='ocr_line' id='line_1_53' title="bbox 378 700 958 729; baseline -0.002 -6"><span class='ocrx_word' id='word_1_120' title='bbox 378 700 528 729; x_wconf 80' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 536 700 697 723; x_wconf 79' lang='eng' dir='ltr'><em>concretionis</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 707 700 788 723; x_wconf 90' lang='eng' dir='ltr'><em>K007T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 798 700 958 728; x_wconf 90' lang='eng' dir='ltr'>(AB161359)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 211 709 1079 788; baseline 0 -27"><span class='ocrx_word' id='word_1_124' title='bbox 211 709 437 788; x_wconf 27' lang='eng' dir='ltr'><em>ﬁr;—</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 448 739 598 768; x_wconf 81' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 605 739 701 762; x_wconf 81' lang='eng' dir='ltr'><em>defluvii</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 710 739 764 761; x_wconf 93' lang='eng' dir='ltr'><em>IMM</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 770 739 772 761; x_wconf 98' lang='eng'><strong><em>|</em></strong></span> <span class='ocrx_word' id='word_1_129' title='bbox 778 739 794 761; x_wconf 95' lang='eng' dir='ltr'>B</span> <span class='ocrx_word' id='word_1_130' title='bbox 804 739 904 762; x_wconf 80' lang='eng' dir='ltr'><em>APB-9T</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 915 739 1079 767; x_wconf 86' lang='eng' dir='ltr'>(AM283465)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 296 777 1271 1001">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 296 777 1271 1001">
+     <span class='ocr_line' id='line_1_55' title="bbox 379 777 1009 806; baseline 0 -6"><span class='ocrx_word' id='word_1_132' title='bbox 379 778 529 806; x_wconf 81' lang='eng' dir='ltr'><em>Lysobacter</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 537 778 687 806; x_wconf 86' lang='eng' dir='ltr'><em>spongiico/a</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 699 778 765 800; x_wconf 93' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 777 777 838 800; x_wconf 88' lang='eng' dir='ltr'><em>329T</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 849 778 1009 806; x_wconf 80' lang='eng' dir='ltr'>(A8299978)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 296 816 866 845; baseline 0 -6"><span class='ocrx_word' id='word_1_137' title='bbox 296 817 449 845; x_wconf 83' lang='eng' dir='ltr'><em>Aqu/monas</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 460 817 531 839; x_wconf 84' lang='eng' dir='ltr'><em>voraii</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 539 817 641 839; x_wconf 89' lang='eng' dir='ltr'>GPTSA</span> <span class='ocrx_word' id='word_1_140' title='bbox 651 816 696 839; x_wconf 89' lang='eng' dir='ltr'><em>20T</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 707 817 866 845; x_wconf 89' lang='eng' dir='ltr'>(AY544768)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 359 855 943 884; baseline 0 -6"><span class='ocrx_word' id='word_1_142' title='bbox 359 856 509 878; x_wconf 88' lang='eng' dir='ltr'><em>Dokdone/Ia</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 520 856 649 878; x_wconf 83' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 660 855 772 878; x_wconf 88' lang='eng' dir='ltr'><em>DS-123T</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 783 856 943 884; x_wconf 86' lang='eng' dir='ltr'>(AY987368)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 495 894 1087 923; baseline 0 -6"><span class='ocrx_word' id='word_1_146' title='bbox 495 895 614 917; x_wconf 82' lang='eng' dir='ltr'><em>Frateuria</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 625 895 732 917; x_wconf 81' lang='eng' dir='ltr'><em>aurantia</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 744 894 827 917; x_wconf 88' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 838 894 916 917; x_wconf 74' lang='eng' dir='ltr'><em>3245T</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 927 895 1087 923; x_wconf 77' lang='eng' dir='ltr'>(ABOQ1194)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 408 933 961 962; baseline 0 -6"><span class='ocrx_word' id='word_1_151' title='bbox 408 934 562 956; x_wconf 85' lang='eng' dir='ltr'><em>Fulvimonas</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 572 934 618 956; x_wconf 81' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 627 934 689 956; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 703 933 795 956; x_wconf 81' lang='eng' dir='ltr'><em>19981T</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 806 934 961 962; x_wconf 86' lang='eng' dir='ltr'>(AJ311653)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 552 972 1271 1001; baseline 0 -6"><span class='ocrx_word' id='word_1_156' title='bbox 552 973 761 995; x_wconf 82' lang='eng' dir='ltr'><em>Rhodanobacter</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 768 973 972 995; x_wconf 80' lang='eng' dir='ltr'><em>Iindanic/asticus</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 983 972 1102 995; x_wconf 89' lang='eng' dir='ltr'><em>RP5557T</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 1113 973 1271 1001; x_wconf 89' lang='eng' dir='ltr'>(AF039167)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002444-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002444-0-000.pbm.png
new file mode 100644
index 00000000..e0f9adaa
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002444-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002444-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002444-0-000.pbm.png.hocr
new file mode 100644
index 00000000..93943cd8
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002444-0-000.pbm.png.hocr
@@ -0,0 +1,146 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002444-0-000.pbm.png"; bbox 0 0 1479 1277; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 179 510 204 528">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 179 510 204 528">
+     <span class='ocr_line' id='line_1_1' title="bbox 179 510 204 528; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 179 510 204 528; x_wconf 82' lang='eng'>98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 181 686 206 704">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 181 686 206 704">
+     <span class='ocr_line' id='line_1_2' title="bbox 181 686 206 704; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 181 686 206 704; x_wconf 85' lang='eng'>76</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 153 1255 198 1273">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 153 1255 198 1273">
+     <span class='ocr_line' id='line_1_3' title="bbox 153 1255 198 1273; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 153 1255 198 1273; x_wconf 91' lang='eng'>0.02</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 209 851 235 869">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 209 851 235 869">
+     <span class='ocr_line' id='line_1_4' title="bbox 209 851 235 869; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 209 851 235 869; x_wconf 85' lang='eng'>73</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 231 998 256 1016">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 231 998 256 1016">
+     <span class='ocr_line' id='line_1_5' title="bbox 231 998 256 1016; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 231 998 256 1016; x_wconf 85' lang='eng'>86</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 222 1103 259 1121">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 222 1103 259 1121">
+     <span class='ocr_line' id='line_1_6' title="bbox 222 1103 259 1121; baseline 0.027 -1"><span class='ocrx_word' id='word_1_6' title='bbox 222 1103 259 1121; x_wconf 89' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 476 306 478 438">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 476 306 478 438">
+     <span class='ocr_line' id='line_1_7' title="bbox 476 306 478 438; baseline 0 839"><span class='ocrx_word' id='word_1_7' title='bbox 476 306 478 438; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 430 371 432 490">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 430 371 432 490">
+     <span class='ocr_line' id='line_1_8' title="bbox 430 371 432 490; baseline 0 787"><span class='ocrx_word' id='word_1_8' title='bbox 430 371 432 490; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 679 4 1220 32">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 679 4 1220 32">
+     <span class='ocr_line' id='line_1_9' title="bbox 679 4 1220 32; baseline 0 -5"><span class='ocrx_word' id='word_1_9' title='bbox 679 7 858 32; x_wconf 81' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_10' title='bbox 865 4 1062 32; x_wconf 78' lang='eng' dir='ltr'>riguiWPCB131T</span> <span class='ocrx_word' id='word_1_11' title='bbox 1071 6 1220 32; x_wconf 89' lang='eng' dir='ltr'>(DQ089669)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 474 16 755 386">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 474 16 755 386">
+     <span class='ocr_line' id='line_1_10' title="bbox 510 16 720 99; baseline -0.029 1"><span class='ocrx_word' id='word_1_12' title='bbox 510 16 720 99; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 499 99 707 203; baseline 0.024 -57"><span class='ocrx_word' id='word_1_13' title='bbox 499 99 707 203; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 474 203 755 303; baseline 0 -48"><span class='ocrx_word' id='word_1_14' title='bbox 474 203 755 303; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 474 303 688 360; baseline 0.023 -5"><span class='ocrx_word' id='word_1_15' title='bbox 474 303 688 360; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 499 360 654 386; baseline 0 891"><span class='ocrx_word' id='word_1_16' title='bbox 499 360 654 386; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 654 56 1354 502">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 654 56 1354 502">
+     <span class='ocr_line' id='line_1_15' title="bbox 727 56 1316 85; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 727 59 906 85; x_wconf 81' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_18' title='bbox 912 59 1068 85; x_wconf 84' lang='eng' dir='ltr'>Xinjiangensis</span> <span class='ocrx_word' id='word_1_19' title='bbox 1077 56 1316 85; x_wconf 78' lang='eng' dir='ltr'>X2-1gT(D0888329)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 714 109 1304 137; baseline 0 -5"><span class='ocrx_word' id='word_1_20' title='bbox 714 112 893 137; x_wconf 73' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_21' title='bbox 899 112 1107 137; x_wconf 86' lang='eng' dir='ltr'>gelipurpurascens</span> <span class='ocrx_word' id='word_1_22' title='bbox 1115 109 1304 137; x_wconf 88' lang='eng' dir='ltr'>Txg1T(Y18836)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 677 160 1322 189; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 677 163 856 189; x_wconf 80' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_24' title='bbox 863 163 1022 183; x_wconf 83' lang='eng' dir='ltr'>actinosc/erus</span> <span class='ocrx_word' id='word_1_25' title='bbox 1031 163 1108 183; x_wconf 90' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_26' title='bbox 1120 163 1190 183; x_wconf 83' lang='eng'>39621</span> <span class='ocrx_word' id='word_1_27' title='bbox 1195 160 1206 173; x_wconf 93' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_28' title='bbox 1212 163 1248 189; x_wconf 92' lang='eng' dir='ltr'>(Y1</span> <span class='ocrx_word' id='word_1_29' title='bbox 1254 163 1322 189; x_wconf 81' lang='eng'>7356)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 707 213 1297 241; baseline 0 -6"><span class='ocrx_word' id='word_1_30' title='bbox 707 215 886 241; x_wconf 85' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_31' title='bbox 893 215 1018 240; x_wconf 88' lang='eng' dir='ltr'>aerophi/us</span> <span class='ocrx_word' id='word_1_32' title='bbox 1028 215 1136 235; x_wconf 87' lang='eng' dir='ltr'>|/26-Cor1</span> <span class='ocrx_word' id='word_1_33' title='bbox 1142 213 1152 226; x_wconf 91' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_34' title='bbox 1158 215 1297 241; x_wconf 87' lang='eng' dir='ltr'>(AJ276901)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 759 264 1354 293; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 759 267 939 293; x_wconf 79' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_36' title='bbox 945 267 1126 287; x_wconf 82' lang='eng' dir='ltr'>roseosalivan‘us</span> <span class='ocrx_word' id='word_1_37' title='bbox 1134 264 1354 293; x_wconf 82' lang='eng' dir='ltr'>AA—718T(Y18833)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 688 317 1274 346; baseline 0 -6"><span class='ocrx_word' id='word_1_38' title='bbox 688 320 867 345; x_wconf 75' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_39' title='bbox 873 320 1031 340; x_wconf 87' lang='eng' dir='ltr'>norwichensis</span> <span class='ocrx_word' id='word_1_40' title='bbox 1041 317 1126 340; x_wconf 82' lang='eng' dir='ltr'>NS/SOT</span> <span class='ocrx_word' id='word_1_41' title='bbox 1135 320 1172 346; x_wconf 88' lang='eng' dir='ltr'>(AJ</span> <span class='ocrx_word' id='word_1_42' title='bbox 1176 320 1274 346; x_wconf 88' lang='eng'>549285)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 654 369 1189 398; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 654 372 833 397; x_wconf 83' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_44' title='bbox 840 372 991 392; x_wconf 76' lang='eng' dir='ltr'>chitin/vorans</span> <span class='ocrx_word' id='word_1_45' title='bbox 1000 372 1054 392; x_wconf 85' lang='eng' dir='ltr'>Txc1</span> <span class='ocrx_word' id='word_1_46' title='bbox 1059 369 1070 382; x_wconf 91' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_47' title='bbox 1079 372 1189 398; x_wconf 84' lang='eng' dir='ltr'>(Y18837)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 666 423 1332 451; baseline 0 -5"><span class='ocrx_word' id='word_1_48' title='bbox 666 425 857 451; x_wconf 85' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_49' title='bbox 865 425 1079 451; x_wconf 83' lang='eng' dir='ltr'>daecheongensis</span> <span class='ocrx_word' id='word_1_50' title='bbox 1088 423 1177 446; x_wconf 84' lang='eng' dir='ltr'>Dae14T</span> <span class='ocrx_word' id='word_1_51' title='bbox 1186 425 1332 451; x_wconf 84' lang='eng' dir='ltr'>(EU370958)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 744 473 1209 502; baseline 0 -6"><span class='ocrx_word' id='word_1_52' title='bbox 744 476 923 502; x_wconf 84' lang='eng' dir='ltr'>Hymenobacter</span> <span class='ocrx_word' id='word_1_53' title='bbox 930 476 972 496; x_wconf 90' lang='eng' dir='ltr'>soli</span> <span class='ocrx_word' id='word_1_54' title='bbox 980 473 1056 496; x_wconf 91' lang='eng' dir='ltr'>PB17T</span> <span class='ocrx_word' id='word_1_55' title='bbox 1065 476 1209 502; x_wconf 87' lang='eng' dir='ltr'>(AB251884)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 374 489 1083 553">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 374 489 1083 553">
+     <span class='ocr_line' id='line_1_24' title="bbox 374 489 1083 553; baseline 0.001 -6"><span class='ocrx_word' id='word_1_56' title='bbox 374 489 771 553; x_wconf 40' lang='eng' dir='ltr'>K—Hymenobacter</span> <span class='ocrx_word' id='word_1_57' title='bbox 777 527 884 548; x_wconf 81' lang='eng' dir='ltr'>ocel/atus</span> <span class='ocrx_word' id='word_1_58' title='bbox 893 527 947 548; x_wconf 88' lang='eng' dir='ltr'>Txo1</span> <span class='ocrx_word' id='word_1_59' title='bbox 953 525 964 538; x_wconf 90' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_60' title='bbox 973 527 1083 553; x_wconf 89' lang='eng' dir='ltr'>(Y18838)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 330 747 368 765">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 330 747 368 765">
+     <span class='ocr_line' id='line_1_25' title="bbox 330 747 368 765; baseline 0 0"><span class='ocrx_word' id='word_1_61' title='bbox 330 747 368 765; x_wconf 85' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 545 577 1474 1178">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 545 577 1474 1178">
+     <span class='ocr_line' id='line_1_26' title="bbox 545 577 1126 605; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 545 579 718 600; x_wconf 86' lang='eng' dir='ltr'>Adhaeribacter</span> <span class='ocrx_word' id='word_1_63' title='bbox 725 579 840 605; x_wconf 83' lang='eng' dir='ltr'>aquaticus</span> <span class='ocrx_word' id='word_1_64' title='bbox 850 577 1126 605; x_wconf 86' lang='eng' dir='ltr'>MBRG1.5T(AJ626894)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 618 629 1191 658; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 618 632 786 652; x_wconf 85' lang='eng' dir='ltr'>Persicobacter</span> <span class='ocrx_word' id='word_1_66' title='bbox 793 632 894 652; x_wconf 84' lang='eng' dir='ltr'>diff/uens</span> <span class='ocrx_word' id='word_1_67' title='bbox 905 632 989 652; x_wconf 90' lang='eng' dir='ltr'>NCIMB</span> <span class='ocrx_word' id='word_1_68' title='bbox 1001 629 1071 652; x_wconf 91' lang='eng' dir='ltr'>1402T</span> <span class='ocrx_word' id='word_1_69' title='bbox 1079 632 1191 658; x_wconf 86' lang='eng' dir='ltr'>(D12660)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 649 681 1345 710; baseline 0 -6"><span class='ocrx_word' id='word_1_70' title='bbox 649 684 855 704; x_wconf 87' lang='eng' dir='ltr'>Reichenbachie/Ia</span> <span class='ocrx_word' id='word_1_71' title='bbox 865 684 1041 710; x_wconf 83' lang='eng' dir='ltr'>agariperforans</span> <span class='ocrx_word' id='word_1_72' title='bbox 1051 684 1110 704; x_wconf 94' lang='eng' dir='ltr'>KMM</span> <span class='ocrx_word' id='word_1_73' title='bbox 1121 681 1192 704; x_wconf 86' lang='eng' dir='ltr'>3525T</span> <span class='ocrx_word' id='word_1_74' title='bbox 1201 684 1345 710; x_wconf 83' lang='eng' dir='ltr'>(AB058919)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 703 733 1253 762; baseline 0 -6"><span class='ocrx_word' id='word_1_75' title='bbox 703 736 859 762; x_wconf 86' lang='eng' dir='ltr'>Dyadobacter</span> <span class='ocrx_word' id='word_1_76' title='bbox 866 736 1003 756; x_wconf 84' lang='eng' dir='ltr'>fermentans</span> <span class='ocrx_word' id='word_1_77' title='bbox 1013 733 1253 762; x_wconf 86' lang='eng' dir='ltr'>NS114T(AF137029)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 883 786 1421 814; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 883 788 973 808; x_wconf 89' lang='eng' dir='ltr'>Rune/la</span> <span class='ocrx_word' id='word_1_79' title='bbox 983 788 1119 814; x_wconf 82' lang='eng' dir='ltr'>slithyformis</span> <span class='ocrx_word' id='word_1_80' title='bbox 1127 788 1201 808; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_81' title='bbox 1211 786 1297 808; x_wconf 79' lang='eng' dir='ltr'>2593GT</span> <span class='ocrx_word' id='word_1_82' title='bbox 1306 788 1421 814; x_wconf 88' lang='eng' dir='ltr'>(M62786)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 735 838 1278 866; baseline -0.002 -5"><span class='ocrx_word' id='word_1_83' title='bbox 735 840 900 861; x_wconf 83' lang='eng' dir='ltr'>Flectobacil/us</span> <span class='ocrx_word' id='word_1_84' title='bbox 909 840 979 866; x_wconf 84' lang='eng' dir='ltr'><em>major</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 985 840 1057 861; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_86' title='bbox 1067 838 1154 861; x_wconf 81' lang='eng' dir='ltr'>29496T</span> <span class='ocrx_word' id='word_1_87' title='bbox 1162 840 1278 866; x_wconf 84' lang='eng' dir='ltr'>(M62787)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 777 890 1293 918; baseline 0 -5"><span class='ocrx_word' id='word_1_88' title='bbox 777 892 912 913; x_wconf 82' lang='eng' dir='ltr'>Flexibacter</span> <span class='ocrx_word' id='word_1_89' title='bbox 919 892 991 913; x_wconf 80' lang='eng' dir='ltr'>ﬂex/[is</span> <span class='ocrx_word' id='word_1_90' title='bbox 999 892 1073 913; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_91' title='bbox 1082 890 1169 913; x_wconf 86' lang='eng' dir='ltr'>23079T</span> <span class='ocrx_word' id='word_1_92' title='bbox 1178 892 1293 918; x_wconf 86' lang='eng' dir='ltr'>(M62794)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 717 942 1269 971; baseline 0 -6"><span class='ocrx_word' id='word_1_93' title='bbox 717 945 846 971; x_wconf 79' lang='eng' dir='ltr'><em>Cytophaga</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 856 945 1001 965; x_wconf 75' lang='eng' dir='ltr'>hutchinsonii</span> <span class='ocrx_word' id='word_1_95' title='bbox 1009 945 1066 965; x_wconf 94' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_96' title='bbox 1078 945 1132 965; x_wconf 92' lang='eng'>1761</span> <span class='ocrx_word' id='word_1_97' title='bbox 1137 942 1148 955; x_wconf 96' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_98' title='bbox 1157 945 1269 971; x_wconf 89' lang='eng' dir='ltr'>(D12663)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 656 994 1361 1023; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 656 997 853 1023; x_wconf 82' lang='eng' dir='ltr'>Sporocytophaga</span> <span class='ocrx_word' id='word_1_100' title='bbox 863 997 1048 1023; x_wconf 84' lang='eng' dir='ltr'>myxococcoides</span> <span class='ocrx_word' id='word_1_101' title='bbox 1058 997 1116 1017; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_102' title='bbox 1128 994 1212 1017; x_wconf 86' lang='eng' dir='ltr'>11118T</span> <span class='ocrx_word' id='word_1_103' title='bbox 1221 997 1361 1023; x_wconf 88' lang='eng' dir='ltr'>(AJ310654)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 625 1046 1189 1075; baseline 0 -6"><span class='ocrx_word' id='word_1_104' title='bbox 625 1049 766 1069; x_wconf 84' lang='eng' dir='ltr'>Pedobacter</span> <span class='ocrx_word' id='word_1_105' title='bbox 773 1049 891 1074; x_wconf 85' lang='eng' dir='ltr'>heparinus</span> <span class='ocrx_word' id='word_1_106' title='bbox 902 1049 959 1069; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_107' title='bbox 969 1046 1040 1069; x_wconf 83' lang='eng' dir='ltr'>2366T</span> <span class='ocrx_word' id='word_1_108' title='bbox 1049 1049 1189 1075; x_wconf 86' lang='eng' dir='ltr'>(AJ438172)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 654 1100 1307 1126; baseline -0.002 -5"><span class='ocrx_word' id='word_1_109' title='bbox 654 1100 872 1126; x_wconf 81' lang='eng' dir='ltr'>Sphingobacterium</span> <span class='ocrx_word' id='word_1_110' title='bbox 881 1100 1020 1126; x_wconf 85' lang='eng' dir='ltr'><em>spiritivorum</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 1030 1100 1087 1121; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_112' title='bbox 1097 1100 1156 1121; x_wconf 86' lang='eng'>2582</span> <span class='ocrx_word' id='word_1_113' title='bbox 1167 1100 1307 1126; x_wconf 90' lang='eng' dir='ltr'>(AJ459411)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 883 1150 1474 1178; baseline -0.002 -5"><span class='ocrx_word' id='word_1_114' title='bbox 883 1152 1068 1173; x_wconf 85' lang='eng' dir='ltr'><em>Flavobacterium</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1078 1152 1172 1178; x_wconf 82' lang='eng' dir='ltr'>aquatile</span> <span class='ocrx_word' id='word_1_116' title='bbox 1181 1152 1254 1173; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_117' title='bbox 1266 1150 1351 1173; x_wconf 85' lang='eng' dir='ltr'>11947T</span> <span class='ocrx_word' id='word_1_118' title='bbox 1360 1152 1474 1178; x_wconf 88' lang='eng' dir='ltr'>(M62797)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002451-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002451-0-000.pbm.png
new file mode 100644
index 00000000..a90342eb
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002451-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002451-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002451-0-000.pbm.png.hocr
new file mode 100644
index 00000000..d009b9df
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002451-0-000.pbm.png.hocr
@@ -0,0 +1,160 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002451-0-000.pbm.png"; bbox 0 0 994 1056; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 198 4 883 332">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 202 4 883 245">
+     <span class='ocr_line' id='line_1_1' title="bbox 202 4 850 33; baseline -0.003 -4"><span class='ocrx_word' id='word_1_1' title='bbox 202 12 233 29; x_wconf 73' lang='eng'><em>98*</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 331 6 484 27; x_wconf 85' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 493 7 605 27; x_wconf 86' lang='eng' dir='ltr'><em>iranensis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 614 4 688 28; x_wconf 88' lang='eng' dir='ltr'>QW6T</span> <span class='ocrx_word' id='word_1_5' title='bbox 698 6 850 33; x_wconf 86' lang='eng' dir='ltr'>(DQ767692)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 329 46 883 75; baseline 0 -5"><span class='ocrx_word' id='word_1_6' title='bbox 329 49 483 70; x_wconf 86' lang='eng' dir='ltr'><em>Saliniooccus</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 492 49 566 70; x_wconf 88' lang='eng' dir='ltr'><em>luteus</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 574 49 622 69; x_wconf 94' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 633 46 721 70; x_wconf 90' lang='eng' dir='ltr'><em>70202T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 731 49 883 75; x_wconf 79' lang='eng' dir='ltr'>(D0352839)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 249 91 770 120; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 249 93 403 114; x_wconf 86' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 411 99 495 114; x_wconf 86' lang='eng' dir='ltr'><em>roseus</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 505 93 564 114; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 575 91 647 114; x_wconf 85' lang='eng' dir='ltr'>5351T</span> <span class='ocrx_word' id='word_1_15' title='bbox 657 93 770 120; x_wconf 85' lang='eng' dir='ltr'>(X94559)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 257 133 861 162; baseline 0 -6"><span class='ocrx_word' id='word_1_16' title='bbox 257 135 411 156; x_wconf 81' lang='eng' dir='ltr'><em>Sal/nicoccus</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 419 135 551 161; x_wconf 88' lang='eng' dir='ltr'><em>hispanicus</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 562 135 620 156; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 631 133 703 156; x_wconf 88' lang='eng' dir='ltr'>5352T</span> <span class='ocrx_word' id='word_1_20' title='bbox 713 135 861 162; x_wconf 87' lang='eng' dir='ltr'>(AY028927)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 268 174 811 203; baseline 0 -6"><span class='ocrx_word' id='word_1_21' title='bbox 268 176 422 197; x_wconf 88' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 431 177 555 197; x_wconf 88' lang='eng' dir='ltr'><em>siamensis</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 565 174 654 197; x_wconf 90' lang='eng' dir='ltr'><em>PN1-2T</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 664 176 811 203; x_wconf 85' lang='eng' dir='ltr'>(AB258358)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 258 216 776 245; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 258 218 412 239; x_wconf 84' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 421 219 538 239; x_wconf 85' lang='eng' dir='ltr'><em>salsiraiae</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 549 219 585 239; x_wconf 94' lang='eng' dir='ltr'>RH</span> <span class='ocrx_word' id='word_1_28' title='bbox 590 219 598 239; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 603 216 614 230; x_wconf 99' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 624 218 776 245; x_wconf 77' lang='eng'>(00333949)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 198 254 799 332">
+     <span class='ocr_line' id='line_1_7' title="bbox 198 254 799 288; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 198 254 240 270; x_wconf 68' lang='eng'><em>100&#39;</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 256 261 410 282; x_wconf 88' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 415 261 508 288; x_wconf 85' lang='eng' dir='ltr'><em>jeotgali</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 516 259 637 282; x_wconf 83' lang='eng' dir='ltr'>82R53-5T</span> <span class='ocrx_word' id='word_1_35' title='bbox 647 261 799 288; x_wconf 84' lang='eng' dir='ltr'>(DQ471329)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 256 303 763 332; baseline -0.002 -5"><span class='ocrx_word' id='word_1_36' title='bbox 256 306 409 327; x_wconf 80' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 419 306 555 332; x_wconf 88' lang='eng' dir='ltr'><em>alkaliphilus</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 564 303 607 327; x_wconf 88' lang='eng' dir='ltr'><em>T8T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 617 306 763 332; x_wconf 90' lang='eng' dir='ltr'>(AF275710)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 195 345 865 415">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 195 345 865 415">
+     <span class='ocr_line' id='line_1_9' title="bbox 196 345 865 374; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 196 359 235 361; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_41' title='bbox 242 347 396 368; x_wconf 88' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 405 348 576 374; x_wconf 85' lang='eng' dir='ltr'><em>kunmingensis</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 584 348 632 368; x_wconf 94' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 643 345 703 368; x_wconf 93' lang='eng' dir='ltr'><em>Y15T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 713 347 865 374; x_wconf 87' lang='eng' dir='ltr'>(DQ837380)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 195 386 853 415; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 195 401 248 404; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_47' title='bbox 256 388 417 409; x_wconf 77' lang='eng' dir='ltr'><em>‘Sa/inicoccus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 426 388 553 409; x_wconf 76' lang='eng' dir='ltr'><em>salitudinis‘</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 563 386 853 415; x_wconf 86' lang='eng' dir='ltr'><em>YIM-C678T(EF590121)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 240 428 992 972">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 240 428 992 754">
+     <span class='ocr_line' id='line_1_11' title="bbox 264 428 801 457; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 264 430 418 452; x_wconf 86' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 427 431 565 452; x_wconf 89' lang='eng' dir='ltr'><em>halodurans</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 573 428 642 451; x_wconf 91' lang='eng' dir='ltr'>W24T</span> <span class='ocrx_word' id='word_1_53' title='bbox 649 430 801 457; x_wconf 78' lang='eng' dir='ltr'>(D0989633)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 313 470 823 499; baseline -0.002 -5"><span class='ocrx_word' id='word_1_54' title='bbox 313 473 466 494; x_wconf 87' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 475 473 542 494; x_wconf 87' lang='eng' dir='ltr'><em>albus</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 550 470 823 499; x_wconf 86' lang='eng' dir='ltr'><em>YIM—Y21T(EF177692)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 326 513 920 542; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 326 516 544 536; x_wconf 86' lang='eng' dir='ltr'><em>Nosocomiicoccus</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 553 516 665 541; x_wconf 79' lang='eng' dir='ltr'><em>ampullae</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 674 515 748 536; x_wconf 91' lang='eng' dir='ltr'>TRF-1</span> <span class='ocrx_word' id='word_1_60' title='bbox 754 513 764 527; x_wconf 96' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 772 515 920 542; x_wconf 86' lang='eng' dir='ltr'>(EU240886)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 309 555 992 584; baseline -0.001 -5"><span class='ocrx_word' id='word_1_62' title='bbox 309 558 492 584; x_wconf 86' lang='eng' dir='ltr'><em>Jeotgalicoccus</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 500 558 655 584; x_wconf 84' lang='eng' dir='ltr'><em>pinnipedialis</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 664 558 744 579; x_wconf 88' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_65' title='bbox 754 555 843 578; x_wconf 88' lang='eng' dir='ltr'><em>42722T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 850 558 992 584; x_wconf 86' lang='eng' dir='ltr'>(AJ251530)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 304 598 957 627; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 304 601 506 627; x_wconf 79' lang='eng' dir='ltr'><em>Jeotgalicoccus</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 515 601 623 622; x_wconf 88' lang='eng' dir='ltr'><em>marinus</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 631 601 687 622; x_wconf 91' lang='eng' dir='ltr'><em>JSM</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 697 598 957 627; x_wconf 86' lang='eng' dir='ltr'>076033T(EU583727)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 285 644 911 673; baseline 0 -6"><span class='ocrx_word' id='word_1_71' title='bbox 285 647 468 673; x_wconf 84' lang='eng' dir='ltr'><em>Jeotgalicoccus</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 477 647 629 667; x_wconf 81' lang='eng' dir='ltr'><em>halotolerans</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 638 644 756 667; x_wconf 91' lang='eng' dir='ltr'>YKJ-101T</span> <span class='ocrx_word' id='word_1_74' title='bbox 764 646 911 673; x_wconf 86' lang='eng' dir='ltr'><em>(AY028925)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 310 686 955 715; baseline 0 -6"><span class='ocrx_word' id='word_1_75' title='bbox 310 688 493 715; x_wconf 82' lang='eng' dir='ltr'><em>Jeotgalicoccus</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 502 688 673 715; x_wconf 83' lang='eng' dir='ltr'><em>psychrophilus</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 681 688 753 709; x_wconf 91' lang='eng' dir='ltr'>YKJ-1</span> <span class='ocrx_word' id='word_1_78' title='bbox 761 686 800 709; x_wconf 91' lang='eng' dir='ltr'><em>15T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 808 688 955 715; x_wconf 87' lang='eng' dir='ltr'>(AY028926)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 240 725 711 754; baseline 0 -5"><span class='ocrx_word' id='word_1_80' title='bbox 240 728 404 749; x_wconf 83' lang='eng' dir='ltr'><em>Macrococcus</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 413 728 508 749; x_wconf 88' lang='eng' dir='ltr'><em>bovicus</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 518 725 591 749; x_wconf 94' lang='eng' dir='ltr'>L2T4T</span> <span class='ocrx_word' id='word_1_83' title='bbox 598 728 711 754; x_wconf 95' lang='eng' dir='ltr'>(Y15714)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 245 768 902 972">
+     <span class='ocr_line' id='line_1_19' title="bbox 245 768 796 797; baseline 0 -6"><span class='ocrx_word' id='word_1_84' title='bbox 245 771 409 791; x_wconf 80' lang='eng' dir='ltr'><em>Macrococcus</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 418 771 573 791; x_wconf 84' lang='eng' dir='ltr'><em>carouselicus</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 583 768 796 797; x_wconf 87' lang='eng' dir='ltr'><em>H8b16T(Y15713)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 288 813 856 842; baseline 0 -6"><span class='ocrx_word' id='word_1_87' title='bbox 288 815 483 842; x_wconf 79' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 492 816 625 841; x_wconf 84' lang='eng' dir='ltr'><em>nepalensis</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 634 815 690 836; x_wconf 90' lang='eng' dir='ltr'><em>CW1</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 696 813 706 827; x_wconf 96' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 714 815 856 842; x_wconf 91' lang='eng' dir='ltr'><em>(AJ517414)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 291 855 900 884; baseline 0 -6"><span class='ocrx_word' id='word_1_92' title='bbox 291 857 485 884; x_wconf 83' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 493 857 690 884; x_wconf 80' lang='eng' dir='ltr'><em>piscifermentans</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 699 855 778 878; x_wconf 82' lang='eng' dir='ltr'>SK03T</span> <span class='ocrx_word' id='word_1_95' title='bbox 788 857 900 884; x_wconf 91' lang='eng' dir='ltr'>(Y15754)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 276 899 895 928; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 276 901 473 922; x_wconf 82' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 481 902 653 928; x_wconf 83' lang='eng' dir='ltr'><em>pleistocenium</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 663 899 742 922; x_wconf 92' lang='eng' dir='ltr'>FTR1T</span> <span class='ocrx_word' id='word_1_99' title='bbox 750 901 895 928; x_wconf 89' lang='eng' dir='ltr'>(AF450136)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 284 943 902 972; baseline 0 -6"><span class='ocrx_word' id='word_1_100' title='bbox 284 946 452 967; x_wconf 82' lang='eng' dir='ltr'><em>Enterococcus</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 462 945 559 967; x_wconf 87' lang='eng' dir='ltr'><em>faecium</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 567 945 642 967; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 654 943 740 967; x_wconf 84' lang='eng' dir='ltr'>19434T</span> <span class='ocrx_word' id='word_1_104' title='bbox 751 945 902 972; x_wconf 89' lang='eng' dir='ltr'><em>(DQ411813)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 294 985 930 1054">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 294 985 930 1054">
+     <span class='ocr_line' id='line_1_24' title="bbox 294 985 898 1014; baseline 0 -6"><span class='ocrx_word' id='word_1_105' title='bbox 294 988 462 1008; x_wconf 86' lang='eng' dir='ltr'><em>Enterococcus</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 472 987 562 1008; x_wconf 83' lang='eng' dir='ltr'><em>mundti/</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 569 987 645 1008; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 654 985 743 1008; x_wconf 79' lang='eng' dir='ltr'><em>4318GT</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 753 987 898 1014; x_wconf 86' lang='eng' dir='ltr'>(AF061013)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 337 1025 930 1054; baseline 0 -6"><span class='ocrx_word' id='word_1_110' title='bbox 337 1027 508 1048; x_wconf 86' lang='eng' dir='ltr'><em>Marinococcus</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 517 1027 643 1053; x_wconf 89' lang='eng' dir='ltr'><em>halophi/us</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 653 1027 711 1048; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 722 1025 810 1048; x_wconf 89' lang='eng' dir='ltr'>20408T</span> <span class='ocrx_word' id='word_1_114' title='bbox 818 1027 930 1054; x_wconf 86' lang='eng' dir='ltr'>(X90835)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 0 19 327 1044">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 0 19 327 1044">
+     <span class='ocr_line' id='line_1_26' title="bbox 167 19 323 134; baseline 0 -57"><span class='ocrx_word' id='word_1_115' title='bbox 167 19 323 134; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 158 134 253 237; baseline 0 -61"><span class='ocrx_word' id='word_1_116' title='bbox 158 134 253 237; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 150 237 198 259; baseline 0 797"><span class='ocrx_word' id='word_1_117' title='bbox 150 237 198 259; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 145 259 251 346; baseline 0 -15"><span class='ocrx_word' id='word_1_118' title='bbox 145 259 251 346; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 121 346 194 388; baseline 0 668"><span class='ocrx_word' id='word_1_119' title='bbox 121 346 194 388; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 84 388 264 471; baseline 0 -42"><span class='ocrx_word' id='word_1_120' title='bbox 84 388 264 471; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 84 471 322 556; baseline 0 -15"><span class='ocrx_word' id='word_1_121' title='bbox 84 471 322 556; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 84 556 307 598; baseline 0 0"><span class='ocrx_word' id='word_1_122' title='bbox 84 556 307 598; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 45 598 301 641; baseline 0 -11"><span class='ocrx_word' id='word_1_123' title='bbox 45 598 301 641; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 45 641 307 729; baseline 0 -18"><span class='ocrx_word' id='word_1_124' title='bbox 45 641 307 729; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 0 729 240 768; baseline 0 288"><span class='ocrx_word' id='word_1_125' title='bbox 0 729 240 768; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 0 768 283 856; baseline 0 0"><span class='ocrx_word' id='word_1_126' title='bbox 0 768 283 856; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 0 856 283 942; baseline 0 -57"><span class='ocrx_word' id='word_1_127' title='bbox 0 856 283 942; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 0 942 284 986; baseline 0 70"><span class='ocrx_word' id='word_1_128' title='bbox 0 942 284 986; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 0 986 327 1044; baseline 0 0"><span class='ocrx_word' id='word_1_129' title='bbox 0 986 327 1044; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 53 114 93 130">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 53 114 93 130">
+     <span class='ocr_line' id='line_1_41' title="bbox 53 114 93 130; baseline 0 0"><span class='ocrx_word' id='word_1_130' title='bbox 53 114 93 130; x_wconf 62' lang='eng'>0,02</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 37 145 109 149">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 37 145 109 149">
+     <span class='ocr_line' id='line_1_42' title="bbox 37 145 109 149; baseline 0 907"><span class='ocrx_word' id='word_1_131' title='bbox 37 145 109 149; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 241 176 261 208">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 241 176 261 208">
+     <span class='ocr_line' id='line_1_43' title="bbox 241 176 261 208; baseline 0 0"><span class='ocrx_word' id='word_1_132' title='bbox 241 176 261 208; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 135 184 241 231">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 135 184 241 231">
+     <span class='ocr_line' id='line_1_44' title="bbox 209 184 241 200; baseline 0 0"><span class='ocrx_word' id='word_1_133' title='bbox 209 184 241 200; x_wconf 70' lang='eng'>53*</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 135 214 167 231; baseline 0 0"><span class='ocrx_word' id='word_1_134' title='bbox 135 214 167 231; x_wconf 70' lang='eng'>67*</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 194 359 196 403">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 194 359 196 403">
+     <span class='ocr_line' id='line_1_46' title="bbox 194 359 196 403; baseline 0 653"><span class='ocrx_word' id='word_1_135' title='bbox 194 359 196 403; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 50 615 85 635">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 50 615 85 635">
+     <span class='ocr_line' id='line_1_47' title="bbox 50 615 85 635; baseline 0 -4"><span class='ocrx_word' id='word_1_136' title='bbox 50 615 85 635; x_wconf 85' lang='eng' dir='ltr'><em>95p</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002469-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002469-0-000.pbm.png
new file mode 100644
index 00000000..8c6fc5d6
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002469-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002469-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002469-0-000.pbm.png.hocr
new file mode 100644
index 00000000..aced66d7
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002469-0-000.pbm.png.hocr
@@ -0,0 +1,246 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002469-0-000.pbm.png"; bbox 0 0 1302 1005; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 235 4 270 22">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 235 4 270 22">
+     <span class='ocr_line' id='line_1_1' title="bbox 235 4 270 22; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 235 4 270 22; x_wconf 80' lang='eng'><em>98*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 150 10 608 436">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 150 10 608 436">
+     <span class='ocr_line' id='line_1_2' title="bbox 226 10 540 47; baseline 0 -22"><span class='ocrx_word' id='word_1_2' title='bbox 226 10 540 47; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 200 47 490 94; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 200 47 490 94; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 200 94 485 114; baseline 0 891"><span class='ocrx_word' id='word_1_4' title='bbox 200 94 485 114; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 200 114 481 150; baseline 0 -21"><span class='ocrx_word' id='word_1_5' title='bbox 200 114 481 150; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 164 150 608 198; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 164 150 608 198; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 150 198 438 289; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 150 198 438 289; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 164 289 419 323; baseline 0 682"><span class='ocrx_word' id='word_1_8' title='bbox 164 289 419 323; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 164 323 514 371; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 164 323 514 371; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 164 371 413 407; baseline 0.004 -1"><span class='ocrx_word' id='word_1_10' title='bbox 164 371 413 407; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 164 407 391 436; baseline 0 -9"><span class='ocrx_word' id='word_1_11' title='bbox 164 407 168 427; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> <span class='ocrx_word' id='word_1_12' title='bbox 206 407 391 436; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 168 5 1300 1002">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 168 5 1119 517">
+     <span class='ocr_line' id='line_1_12' title="bbox 545 5 1064 33; baseline 0 -6"><span class='ocrx_word' id='word_1_13' title='bbox 545 7 708 27; x_wconf 72' lang='eng' dir='ltr'><em>Grad/[bacillus</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 716 7 861 27; x_wconf 81' lang='eng' dir='ltr'><em>ha/oto/erans</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 871 5 919 27; x_wconf 87' lang='eng' dir='ltr'><em>NNT</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 926 7 1064 33; x_wconf 88' lang='eng' dir='ltr'><em>(AF036922)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 490 39 1051 67; baseline 0.002 -6"><span class='ocrx_word' id='word_1_17' title='bbox 490 42 662 62; x_wconf 87' lang='eng' dir='ltr'><em>Paraliobacillus</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 671 42 811 67; x_wconf 85' lang='eng' dir='ltr'><em>ryukyuensis</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 820 39 904 62; x_wconf 90' lang='eng' dir='ltr'><em>015-7T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 911 41 1051 67; x_wconf 86' lang='eng' dir='ltr'><em>(AB087828)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 492 74 1014 101; baseline 0 -5"><span class='ocrx_word' id='word_1_21' title='bbox 492 76 635 96; x_wconf 86' lang='eng' dir='ltr'><em>Halobacillus</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 643 76 737 96; x_wconf 87' lang='eng' dir='ltr'><em>Iocisa/is</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 746 74 867 96; x_wconf 86' lang='eng' dir='ltr'><em>MSS-155T</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 874 76 1014 101; x_wconf 84' lang='eng' dir='ltr'><em>(AY190534)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 485 108 909 136; baseline 0 -5"><span class='ocrx_word' id='word_1_25' title='bbox 485 111 629 131; x_wconf 85' lang='eng' dir='ltr'><em>Ha/obaci/Ius</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 637 111 720 131; x_wconf 84' lang='eng' dir='ltr'><em>Iitora/is</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 728 108 795 131; x_wconf 90' lang='eng' dir='ltr'><em>SL-4T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 801 111 909 136; x_wconf 84' lang='eng' dir='ltr'>(X94558)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 476 143 1031 171; baseline 0 -6"><span class='ocrx_word' id='word_1_29' title='bbox 476 146 671 165; x_wconf 86' lang='eng' dir='ltr'><em>ThalassobaciI/us</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 679 146 789 165; x_wconf 86' lang='eng' dir='ltr'><em>devorans</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 797 143 888 165; x_wconf 80' lang='eng' dir='ltr'><em>G—19.1T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 896 145 1031 171; x_wconf 85' lang='eng' dir='ltr'><em>(AJ717299)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 614 178 1119 206; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 614 180 761 200; x_wconf 77' lang='eng' dir='ltr'><em>Lent/bacillus</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 769 180 881 205; x_wconf 73' lang='eng' dir='ltr'><em>salicampi</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 889 178 971 200; x_wconf 90' lang='eng' dir='ltr'><em>SF-20T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 978 180 1119 206; x_wconf 82' lang='eng' dir='ltr'><em>(AY057394)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 438 212 1002 240; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 438 215 577 240; x_wconf 83' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 585 215 735 235; x_wconf 83' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 745 212 1002 240; x_wconf 73' lang='eng' dir='ltr'><em>DSW-1OT(AY822043)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 423 247 1025 275; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 423 249 563 274; x_wconf 84' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 570 249 745 274; x_wconf 80' lang='eng' dir='ltr'><em>pantathenticus</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 754 249 830 269; x_wconf 92' lang='eng' dir='ltr'><em>NCDO</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 842 247 909 269; x_wconf 89' lang='eng' dir='ltr'><em>1765T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 916 249 1025 275; x_wconf 86' lang='eng' dir='ltr'><em>(D78477)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 426 281 919 309; baseline 0 -5"><span class='ocrx_word' id='word_1_45' title='bbox 426 284 566 309; x_wconf 85' lang='eng' dir='ltr'><em>Virgibaci/Ius</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 574 284 715 304; x_wconf 82' lang='eng' dir='ltr'><em>marismortui</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 724 281 776 304; x_wconf 92' lang='eng' dir='ltr'><em>123T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 783 283 919 309; x_wconf 84' lang='eng' dir='ltr'><em>(AJ009793)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 420 316 1081 344; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 420 319 559 344; x_wconf 87' lang='eng' dir='ltr'><em>VirgibaciI/us</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 568 318 761 338; x_wconf 82' lang='eng' dir='ltr'><em>halodenitriﬂcans</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 768 318 841 338; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 849 316 1081 344; x_wconf 79' lang='eng' dir='ltr'><em>49067T(AB021186)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 519 351 1083 379; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 519 353 700 373; x_wconf 86' lang='eng' dir='ltr'><em>Oceanobacil/us</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 708 353 819 378; x_wconf 87' lang='eng' dir='ltr'><em>iheyensis</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 829 351 936 373; x_wconf 78' lang='eng' dir='ltr'><em>HTE831T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 943 353 1083 379; x_wconf 86' lang='eng' dir='ltr'><em>(ABO10863)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 413 385 934 413; baseline 0 -5"><span class='ocrx_word' id='word_1_57' title='bbox 413 388 608 408; x_wconf 83' lang='eng' dir='ltr'><em>Paucisa/ibacillus</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 616 388 716 413; x_wconf 86' lang='eng' dir='ltr'><em>globu/us</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 725 385 934 413; x_wconf 72' lang='eng' dir='ltr'><em>BZZT(AM114102)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 168 418 969 448; baseline 0.002 -7"><span class='ocrx_word' id='word_1_60' title='bbox 168 418 206 441; x_wconf 75' lang='eng' dir='ltr'><em>70p</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 391 422 579 443; x_wconf 88' lang='eng' dir='ltr'><em>Ornithinibacillus</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 587 422 741 443; x_wconf 85' lang='eng' dir='ltr'><em>californiensis</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 750 420 823 443; x_wconf 85' lang='eng' dir='ltr'><em>MB-9T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 830 422 969 448; x_wconf 85' lang='eng' dir='ltr'><em>(AF326365)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 175 455 858 501; baseline 0 -24"><span class='ocrx_word' id='word_1_65' title='bbox 175 455 383 501; x_wconf 37' lang='eng'><em>£1:</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 392 457 545 477; x_wconf 86' lang='eng' dir='ltr'><em>Salinibacillus</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 553 457 655 477; x_wconf 83' lang='eng' dir='ltr'><em>kushneri</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 662 455 711 477; x_wconf 80' lang='eng' dir='ltr'><em>8-2T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 718 457 858 482; x_wconf 84' lang='eng' dir='ltr'><em>(AY321434)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 379 489 894 517; baseline 0 -5"><span class='ocrx_word' id='word_1_70' title='bbox 379 492 533 512; x_wconf 84' lang='eng' dir='ltr'><em>Salinibaci/lus</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 541 492 674 517; x_wconf 84' lang='eng' dir='ltr'><em>aidingensis</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 683 489 746 512; x_wconf 89' lang='eng' dir='ltr'><em>25-7T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 753 492 894 517; x_wconf 85' lang='eng' dir='ltr'><em>(AY321436)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 174 524 1100 621">
+     <span class='ocr_line' id='line_1_27' title="bbox 174 524 868 552; baseline 0 -6"><span class='ocrx_word' id='word_1_74' title='bbox 174 533 365 535; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_75' title='bbox 373 526 513 546; x_wconf 76' lang='eng' dir='ltr'><em>Sal/rhabdus</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 521 526 613 551; x_wconf 74' lang='eng' dir='ltr'><em>euzebyi</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 621 524 715 546; x_wconf 91' lang='eng' dir='ltr'><em>CVS14T</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 722 526 868 552; x_wconf 83' lang='eng' dir='ltr'><em>(AM292417)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 473 558 1100 586; baseline 0 -5"><span class='ocrx_word' id='word_1_79' title='bbox 473 561 639 581; x_wconf 86' lang='eng' dir='ltr'><em>Pontibacillus</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 648 561 781 586; x_wconf 86' lang='eng' dir='ltr'><em>halophilus</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 789 561 842 581; x_wconf 90' lang='eng' dir='ltr'><em>JSM</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 852 558 951 581; x_wconf 55' lang='eng' dir='ltr'><em>0763056T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 958 561 1100 586; x_wconf 87' lang='eng' dir='ltr'><em>(EU583728)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 477 593 1022 621; baseline 0 -5"><span class='ocrx_word' id='word_1_84' title='bbox 477 595 627 616; x_wconf 85' lang='eng' dir='ltr'><em>Pontibacil/us</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 635 595 730 616; x_wconf 80' lang='eng' dir='ltr'><em>marinus</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 739 593 874 616; x_wconf 89' lang='eng' dir='ltr'><em>BH030004T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 882 595 1022 621; x_wconf 84' lang='eng' dir='ltr'><em>(AY603977)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 291 628 1300 1002">
+     <span class='ocr_line' id='line_1_30' title="bbox 341 628 1118 656; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 341 633 375 650; x_wconf 76' lang='eng'><em>99’</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 499 631 648 650; x_wconf 85' lang='eng' dir='ltr'><em>Pontibacillus</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 657 631 826 656; x_wconf 78' lang='eng' dir='ltr'><em>chungwhensis</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 835 628 971 650; x_wconf 78' lang='eng' dir='ltr'><em>BH030062T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 978 630 1118 656; x_wconf 87' lang='eng' dir='ltr'><em>(AY553296)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 291 663 900 690; baseline 0 -5"><span class='ocrx_word' id='word_1_93' title='bbox 291 664 338 682; x_wconf 72' lang='eng'>100‘</span> <span class='ocrx_word' id='word_1_94' title='bbox 357 665 565 685; x_wconf 79' lang='eng' dir='ltr'><em>—P/anococcus</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 574 665 701 685; x_wconf 80' lang='eng' dir='ltr'><em>rifietoensis</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 711 663 757 685; x_wconf 72' lang='eng' dir='ltr'><em>MST</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 763 665 900 690; x_wconf 82' lang='eng' dir='ltr'><em>(AJ493659)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 355 697 915 725; baseline 0.002 -6"><span class='ocrx_word' id='word_1_98' title='bbox 355 706 412 709; x_wconf 93' lang='eng'>—</span> <span class='ocrx_word' id='word_1_99' title='bbox 419 700 570 720; x_wconf 86' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 579 700 694 720; x_wconf 75' lang='eng' dir='ltr'><em>maritimus</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 702 697 769 720; x_wconf 75' lang='eng' dir='ltr'><em>TF-QT</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 776 700 915 725; x_wconf 90' lang='eng' dir='ltr'><em>(AF500007)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 339 732 983 760; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 339 734 535 754; x_wconf 79' lang='eng' dir='ltr'><em>Saccharococcus</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 543 734 696 759; x_wconf 81' lang='eng' dir='ltr'><em>thermophilus</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 703 734 775 754; x_wconf 94' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 784 732 869 754; x_wconf 83' lang='eng' dir='ltr'><em>43125T</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 876 734 983 760; x_wconf 85' lang='eng' dir='ltr'><em>(X70430)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 442 766 1095 794; baseline -0.002 -5"><span class='ocrx_word' id='word_1_108' title='bbox 442 768 637 789; x_wconf 84' lang='eng' dir='ltr'><em>Saccharococcus</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 645 769 850 794; x_wconf 85' lang='eng' dir='ltr'><em>caldoxylosilyticus</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 859 766 946 789; x_wconf 80' lang='eng' dir='ltr'><em>S1812T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 955 768 1095 794; x_wconf 90' lang='eng' dir='ltr'><em>(AF067651)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 567 801 1063 829; baseline 0 -6"><span class='ocrx_word' id='word_1_112' title='bbox 567 803 705 823; x_wconf 86' lang='eng' dir='ltr'><em>Geobaci/lus</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 714 803 869 823; x_wconf 82' lang='eng' dir='ltr'><em>subterraneus</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 878 801 917 823; x_wconf 79' lang='eng' dir='ltr'><em>34T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 924 803 1063 829; x_wconf 87' lang='eng' dir='ltr'><em>(AF276306)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 438 832 1300 863; baseline 0 -5"><span class='ocrx_word' id='word_1_116' title='bbox 438 832 484 850; x_wconf 80' lang='eng'>100*</span> <span class='ocrx_word' id='word_1_117' title='bbox 602 838 740 858; x_wconf 86' lang='eng' dir='ltr'><em>Geabaci/lus</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 749 838 976 863; x_wconf 80' lang='eng' dir='ltr'><em>stearothermophi/us</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 986 838 1058 858; x_wconf 88' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 1070 836 1300 863; x_wconf 76' lang='eng' dir='ltr'><em>12550T(ABZ71757)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 358 870 936 898; baseline 0 -6"><span class='ocrx_word' id='word_1_121' title='bbox 358 873 522 898; x_wconf 86' lang='eng' dir='ltr'><em>Anoxybacillus</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 531 873 702 892; x_wconf 84' lang='eng' dir='ltr'><em>voinovskiensis</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 710 870 786 892; x_wconf 89' lang='eng' dir='ltr'><em>TH13T</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 795 872 936 898; x_wconf 87' lang='eng' dir='ltr'><em>(AB110008)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 506 905 1091 933; baseline 0.002 -6"><span class='ocrx_word' id='word_1_125' title='bbox 506 908 711 933; x_wconf 86' lang='eng' dir='ltr'><em>—Anoxybacillus</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 719 908 861 933; x_wconf 84' lang='eng' dir='ltr'><em>sayderensis</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 869 905 945 928; x_wconf 92' lang='eng' dir='ltr'><em>ABO4T</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 952 908 1091 933; x_wconf 86' lang='eng' dir='ltr'><em>(AF001963)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 587 940 1194 968; baseline 0 -6"><span class='ocrx_word' id='word_1_129' title='bbox 587 942 751 967; x_wconf 84' lang='eng' dir='ltr'><em>Anoxybaci/lus</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 760 942 903 962; x_wconf 88' lang='eng' dir='ltr'><em>ﬂavithermus</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 913 942 969 962; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 979 940 1048 962; x_wconf 85' lang='eng' dir='ltr'><em>2641T</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 1055 942 1194 968; x_wconf 86' lang='eng' dir='ltr'><em>(AF004589)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 613 975 1087 1002; baseline 0 -5"><span class='ocrx_word' id='word_1_134' title='bbox 613 977 811 1002; x_wconf 81' lang='eng' dir='ltr'><em>Exiguobacterium</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 820 977 893 997; x_wconf 87' lang='eng' dir='ltr'><em>undae</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 903 975 942 997; x_wconf 90' lang='eng' dir='ltr'><em>L2T</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 951 977 1087 1002; x_wconf 87' lang='eng' dir='ltr'><em>(AJ344151)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 36 54 207 83">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 36 54 207 83">
+     <span class='ocr_line' id='line_1_41' title="bbox 36 54 207 83; baseline -0.006 0"><span class='ocrx_word' id='word_1_138' title='bbox 36 65 78 83; x_wconf 87' lang='eng'><em>0.01</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 172 54 207 72; x_wconf 56' lang='eng'><em>65*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 15 94 102 97">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 15 94 102 97">
+     <span class='ocr_line' id='line_1_42' title="bbox 15 94 102 97; baseline 0 908"><span class='ocrx_word' id='word_1_140' title='bbox 15 94 102 97; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 146 129 191 147">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 146 129 191 147">
+     <span class='ocr_line' id='line_1_43' title="bbox 146 129 191 147; baseline -0.022 0"><span class='ocrx_word' id='word_1_141' title='bbox 146 129 191 147; x_wconf 85' lang='eng' dir='ltr'><em>68m</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 128 247 153 265">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 128 247 153 265">
+     <span class='ocr_line' id='line_1_44' title="bbox 128 247 153 265; baseline 0 0"><span class='ocrx_word' id='word_1_142' title='bbox 128 247 153 265; x_wconf 91' lang='eng'>50</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 109 360 134 377">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 109 360 134 377">
+     <span class='ocr_line' id='line_1_45' title="bbox 109 360 134 377; baseline 0 0"><span class='ocrx_word' id='word_1_143' title='bbox 109 360 134 377; x_wconf 87' lang='eng'><em>55</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 1 384 567 859">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 1 384 567 859">
+     <span class='ocr_line' id='line_1_46' title="bbox 31 384 154 462; baseline 0 0"><span class='ocrx_word' id='word_1_144' title='bbox 31 384 154 462; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 31 462 133 531; baseline 0 -4"><span class='ocrx_word' id='word_1_145' title='bbox 31 462 133 531; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 31 531 133 566; baseline 0 439"><span class='ocrx_word' id='word_1_146' title='bbox 31 531 133 566; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 31 566 469 600; baseline 0 405"><span class='ocrx_word' id='word_1_147' title='bbox 31 566 469 600; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 1 600 469 635; baseline 0 0"><span class='ocrx_word' id='word_1_148' title='bbox 1 600 469 635; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 1 635 100 703; baseline 0 -33"><span class='ocrx_word' id='word_1_149' title='bbox 1 635 100 703; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 1 703 338 739; baseline 0 266"><span class='ocrx_word' id='word_1_150' title='bbox 1 703 338 739; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 1 739 339 774; baseline 0 231"><span class='ocrx_word' id='word_1_151' title='bbox 1 739 339 774; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 1 774 442 808; baseline 0 197"><span class='ocrx_word' id='word_1_152' title='bbox 1 774 442 808; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 1 808 567 859; baseline 0 -16"><span class='ocrx_word' id='word_1_153' title='bbox 1 808 562 859; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> <span class='ocrx_word' id='word_1_154' title='bbox 484 823 567 843; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 148 270 150 509">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 148 270 150 509">
+     <span class='ocr_line' id='line_1_56' title="bbox 148 270 150 509; baseline 0 496"><span class='ocrx_word' id='word_1_155' title='bbox 148 270 150 509; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 148 507 174 509">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 148 507 174 509">
+     <span class='ocr_line' id='line_1_57' title="bbox 148 507 174 509; baseline 0 496"><span class='ocrx_word' id='word_1_156' title='bbox 148 507 174 509; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 172 484 174 535">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 172 484 174 535">
+     <span class='ocr_line' id='line_1_58' title="bbox 172 484 174 535; baseline 0 470"><span class='ocrx_word' id='word_1_157' title='bbox 172 484 174 535; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 137 513 162 531">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 137 513 162 531">
+     <span class='ocr_line' id='line_1_59' title="bbox 137 513 162 531; baseline 0.04 -1"><span class='ocrx_word' id='word_1_158' title='bbox 137 513 162 531; x_wconf 89' lang='eng'><em>76</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 390 603 392 639">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 390 603 392 639">
+     <span class='ocr_line' id='line_1_60' title="bbox 390 603 392 639; baseline 0 366"><span class='ocrx_word' id='word_1_159' title='bbox 390 603 392 639; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 392 637 494 639">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 392 637 494 639">
+     <span class='ocr_line' id='line_1_61' title="bbox 392 637 494 639; baseline 0 366"><span class='ocrx_word' id='word_1_160' title='bbox 392 637 494 639; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 96 689 357 691">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 96 689 357 691">
+     <span class='ocr_line' id='line_1_62' title="bbox 96 689 357 691; baseline 0 314"><span class='ocrx_word' id='word_1_161' title='bbox 96 689 357 691; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 355 672 357 706">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 355 672 357 706">
+     <span class='ocr_line' id='line_1_63' title="bbox 355 672 357 706; baseline 0 299"><span class='ocrx_word' id='word_1_162' title='bbox 355 672 357 706; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 96 689 98 840">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 96 689 98 840">
+     <span class='ocr_line' id='line_1_64' title="bbox 96 689 98 840; baseline 0 165"><span class='ocrx_word' id='word_1_163' title='bbox 96 689 98 840; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 1 843 597 987">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 1 859 504 987">
+     <span class='ocr_line' id='line_1_65' title="bbox 1 859 504 987; baseline 0 0"><span class='ocrx_word' id='word_1_164' title='bbox 1 859 504 987; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 504 914 506 950">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 504 914 506 950">
+     <span class='ocr_line' id='line_1_66' title="bbox 504 914 506 950; baseline 0 55"><span class='ocrx_word' id='word_1_165' title='bbox 504 914 506 950; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 505 948 587 951">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 505 948 587 951">
+     <span class='ocr_line' id='line_1_67' title="bbox 505 948 587 951; baseline 0 54"><span class='ocrx_word' id='word_1_166' title='bbox 505 948 587 951; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 5 983 605 985">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 5 983 605 985">
+     <span class='ocr_line' id='line_1_68' title="bbox 5 983 605 985; baseline 0 20"><span class='ocrx_word' id='word_1_167' title='bbox 5 983 605 985; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002477-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002477-0-000.pbm.png
new file mode 100644
index 00000000..8f2753f4
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002477-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002477-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002477-0-000.pbm.png.hocr
new file mode 100644
index 00000000..6c521181
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002477-0-000.pbm.png.hocr
@@ -0,0 +1,94 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002477-0-000.pbm.png"; bbox 0 0 1657 1252; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 4 547 45">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 0 4 547 45">
+     <span class='ocr_line' id='line_1_1' title="bbox 247 4 308 26; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 247 4 308 26; x_wconf 90' lang='eng'><em>0.05</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 0 25 547 45; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 0 25 547 45; x_wconf 94' lang='eng' dir='ltr'><em>I—l</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 56 97 1656 1211">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 56 97 1656 1211">
+     <span class='ocr_line' id='line_1_3' title="bbox 88 97 1123 126; baseline 0.001 -8"><span class='ocrx_word' id='word_1_3' title='bbox 88 100 110 118; x_wconf 82' lang='eng'>9</span> <span class='ocrx_word' id='word_1_4' title='bbox 442 98 857 120; x_wconf 85' lang='eng' dir='ltr'><em>Antarctobacterheliothermus</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 868 97 982 120; x_wconf 73' lang='eng' dir='ltr'><em>EL-219T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 993 97 1123 126; x_wconf 89' lang='eng' dir='ltr'>(Y11552)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 419 134 894 163; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 419 135 545 163; x_wconf 83' lang='eng' dir='ltr'><em>Sagittula</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 556 135 660 157; x_wconf 84' lang='eng' dir='ltr'><em>stellata</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 672 134 749 157; x_wconf 82' lang='eng' dir='ltr'><em>E—37T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 760 135 894 163; x_wconf 88' lang='eng' dir='ltr'><em>(U58356)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 97 172 1172 202; baseline 0.001 -8"><span class='ocrx_word' id='word_1_11' title='bbox 97 184 120 202; x_wconf 71' lang='eng'>31</span> <span class='ocrx_word' id='word_1_12' title='bbox 482 173 769 200; x_wconf 78' lang='eng' dir='ltr'><em>Ketogulonicigenium</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 779 173 914 195; x_wconf 86' lang='eng' dir='ltr'><em>robustum</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 924 172 992 195; x_wconf 81' lang='eng' dir='ltr'><em>X6LT</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1002 172 1172 200; x_wconf 86' lang='eng' dir='ltr'><em>(AF136850)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 443 209 1137 238; baseline -0.001 -6"><span class='ocrx_word' id='word_1_16' title='bbox 443 209 605 232; x_wconf 89' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 615 210 775 238; x_wconf 88' lang='eng' dir='ltr'><em>granulosus</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 786 209 957 232; x_wconf 90' lang='eng' dir='ltr'><em>HTCC2516T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 968 209 1137 238; x_wconf 86' lang='eng' dir='ltr'><em>(AY424896)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 56 246 1118 275; baseline 0.002 -8"><span class='ocrx_word' id='word_1_20' title='bbox 56 249 80 267; x_wconf 89' lang='eng'>9</span> <span class='ocrx_word' id='word_1_21' title='bbox 183 246 220 263; x_wconf 91' lang='eng'>10</span> <span class='ocrx_word' id='word_1_22' title='bbox 478 247 664 269; x_wconf 85' lang='eng' dir='ltr'><em>Roseisalinus</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 674 247 834 269; x_wconf 82' lang='eng' dir='ltr'><em>antarcticus</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 845 246 941 269; x_wconf 91' lang='eng' dir='ltr'><em>EL—88T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 952 247 1118 275; x_wconf 88' lang='eng' dir='ltr'><em>(AJ605747)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 380 283 1207 312; baseline 0.002 -7"><span class='ocrx_word' id='word_1_26' title='bbox 380 287 417 305; x_wconf 91' lang='eng'>10</span> <span class='ocrx_word' id='word_1_27' title='bbox 529 284 675 307; x_wconf 82' lang='eng' dir='ltr'><em>Loktane/la</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 686 284 848 312; x_wconf 87' lang='eng' dir='ltr'><em>fryxel/ensis</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 859 284 922 307; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 933 283 1032 307; x_wconf 90' lang='eng' dir='ltr'><em>22007T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1042 284 1207 312; x_wconf 88' lang='eng' dir='ltr'><em>(AJ582225)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 511 321 1179 350; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 511 322 660 344; x_wconf 83' lang='eng' dir='ltr'><em>Loktanella</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 671 322 815 344; x_wconf 88' lang='eng' dir='ltr'><em>salsilacus</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 825 322 889 344; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 900 321 1001 344; x_wconf 84' lang='eng' dir='ltr'><em>21507T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1012 322 1179 350; x_wconf 85' lang='eng' dir='ltr'><em>(AJ440997)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 190 349 1171 388; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 190 349 228 367; x_wconf 67' lang='eng'>1&quot;</span> <span class='ocrx_word' id='word_1_38' title='bbox 455 360 604 382; x_wconf 86' lang='eng' dir='ltr'><em>Loktanella</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 616 359 807 382; x_wconf 85' lang='eng' dir='ltr'><em>vestfoldensis</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 817 359 882 382; x_wconf 94' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 893 359 994 382; x_wconf 81' lang='eng' dir='ltr'><em>22003T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1004 359 1171 388; x_wconf 87' lang='eng' dir='ltr'><em>(AJ582226)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 262 396 1185 425; baseline 0.002 -8"><span class='ocrx_word' id='word_1_43' title='bbox 262 399 286 417; x_wconf 83' lang='eng'>9</span> <span class='ocrx_word' id='word_1_44' title='bbox 464 397 615 425; x_wconf 86' lang='eng' dir='ltr'><em>Leisingera</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 626 397 919 425; x_wconf 86' lang='eng' dir='ltr'><em>methylohalidivorans</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 930 396 1005 419; x_wconf 81' lang='eng' dir='ltr'><em>MBZT</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1015 397 1185 425; x_wconf 87' lang='eng' dir='ltr'><em>(AY005463)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 189 427 1071 462; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 189 427 212 445; x_wconf 72' lang='eng'>91</span> <span class='ocrx_word' id='word_1_49' title='bbox 427 434 812 462; x_wconf 83' lang='eng' dir='ltr'><em>Phaeobactergallaeciensis</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 823 433 929 456; x_wconf 73' lang='eng' dir='ltr'><em>133107T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 939 434 1071 462; x_wconf 90' lang='eng' dir='ltr'><em>(Y13244)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 399 471 1022 500; baseline 0.002 -7"><span class='ocrx_word' id='word_1_52' title='bbox 399 472 559 494; x_wconf 89' lang='eng' dir='ltr'><em>Marinovum</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 569 472 680 500; x_wconf 85' lang='eng' dir='ltr'><em>algico/a</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 689 472 772 494; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 783 471 1022 500; x_wconf 70' lang='eng' dir='ltr'><em>51440T(X78315)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 208 508 1238 537; baseline 0.002 -8"><span class='ocrx_word' id='word_1_56' title='bbox 208 511 231 529; x_wconf 86' lang='eng'>8</span> <span class='ocrx_word' id='word_1_57' title='bbox 495 509 676 531; x_wconf 83' lang='eng' dir='ltr'><em>Roseovar/us</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 686 510 874 531; x_wconf 88' lang='eng' dir='ltr'><em>crassostreae</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 884 508 1238 537; x_wconf 51' lang='eng' dir='ltr'><em>CV919—3127(AF114484)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 133 540 1061 574; baseline 0.001 -6"><span class='ocrx_word' id='word_1_60' title='bbox 133 540 157 557; x_wconf 81' lang='eng'>5</span> <span class='ocrx_word' id='word_1_61' title='bbox 435 547 616 569; x_wconf 84' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 626 547 803 569; x_wconf 87' lang='eng' dir='ltr'><em>nubinhibens</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 814 546 880 569; x_wconf 73' lang='eng' dir='ltr'><em>ISMT</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 890 546 1061 574; x_wconf 87' lang='eng' dir='ltr'><em>(AF098495)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 416 583 1162 612; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 416 584 611 606; x_wconf 86' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 619 584 762 612; x_wconf 84' lang='eng' dir='ltr'><em>pacificus</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 771 590 815 612; x_wconf 88' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 828 590 888 606; x_wconf 94' lang='eng' dir='ltr'><em>nov.</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 899 584 928 606; x_wconf 92' lang='eng'><em>81</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 936 583 976 606; x_wconf 90' lang='eng' dir='ltr'><em>-2T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 985 584 1162 612; x_wconf 89' lang='eng' dir='ltr'><em>(DQ120726)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 69 615 1133 650; baseline -0.002 -5"><span class='ocrx_word' id='word_1_72' title='bbox 69 615 95 632; x_wconf 72' lang='eng'>6</span> <span class='ocrx_word' id='word_1_73' title='bbox 508 622 689 644; x_wconf 84' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 699 627 828 644; x_wconf 86' lang='eng' dir='ltr'><em>mucosus</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 838 621 956 643; x_wconf 92' lang='eng' dir='ltr'><em>DFL-24T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 967 621 1133 650; x_wconf 86' lang='eng' dir='ltr'><em>(AJ534215)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 247 658 1042 687; baseline 0 -6"><span class='ocrx_word' id='word_1_77' title='bbox 247 658 273 675; x_wconf 76' lang='eng'><strong>=‘</strong></span> <span class='ocrx_word' id='word_1_78' title='bbox 468 659 650 681; x_wconf 87' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 660 659 777 681; x_wconf 83' lang='eng' dir='ltr'><em>tolerans</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 787 658 902 681; x_wconf 89' lang='eng' dir='ltr'><em>EL—172T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 912 659 1042 687; x_wconf 91' lang='eng' dir='ltr'>(Y11551)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 290 696 1243 724; baseline 0.002 -8"><span class='ocrx_word' id='word_1_82' title='bbox 290 699 314 716; x_wconf 90' lang='eng'>9</span> <span class='ocrx_word' id='word_1_83' title='bbox 622 696 781 718; x_wconf 86' lang='eng' dir='ltr'><em>Rose/vivax</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 790 696 952 718; x_wconf 87' lang='eng' dir='ltr'><em>halodurans</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 962 696 1023 718; x_wconf 91' lang='eng' dir='ltr'><em>OCh</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1034 696 1099 718; x_wconf 77' lang='eng' dir='ltr'><em>239T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 1109 696 1243 724; x_wconf 87' lang='eng' dir='ltr'><em>(D85829)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 532 733 1171 762; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 532 734 691 756; x_wconf 88' lang='eng' dir='ltr'><em>Roseivivax</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 700 734 880 756; x_wconf 84' lang='eng' dir='ltr'><em>haloto/erans</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 890 734 952 756; x_wconf 90' lang='eng' dir='ltr'><em>OCh</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 963 733 1027 756; x_wconf 93' lang='eng' dir='ltr'><em>210T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1037 734 1171 762; x_wconf 87' lang='eng' dir='ltr'><em>(D85831)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 563 770 1067 799; baseline 0 -6"><span class='ocrx_word' id='word_1_93' title='bbox 563 771 693 799; x_wconf 90' lang='eng' dir='ltr'><em>Salipiger</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 700 777 829 793; x_wconf 87' lang='eng' dir='ltr'><em>mucosus</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 837 770 887 793; x_wconf 84' lang='eng' dir='ltr'><em>A3T</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 897 771 1067 799; x_wconf 92' lang='eng' dir='ltr'>(AY527274)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 185 808 1284 836; baseline 0.001 -7"><span class='ocrx_word' id='word_1_97' title='bbox 185 811 211 829; x_wconf 88' lang='eng'><em>87</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 581 809 751 830; x_wconf 86' lang='eng' dir='ltr'><em>Paracoccus</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 761 808 939 830; x_wconf 84' lang='eng' dir='ltr'><em>denitrificans</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 947 808 1030 830; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 1043 808 1142 830; x_wconf 76' lang='eng' dir='ltr'><em>17741T</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 1152 808 1284 836; x_wconf 88' lang='eng' dir='ltr'>(Y16927)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 127 839 1656 874; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 127 839 153 856; x_wconf 71' lang='eng'><em>&quot;</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 1017 846 1169 868; x_wconf 86' lang='eng' dir='ltr'><em>Roseibium</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1179 846 1364 868; x_wconf 87' lang='eng' dir='ltr'><em>hamelinense</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 1375 846 1437 868; x_wconf 89' lang='eng' dir='ltr'><em>OCh</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 1448 845 1512 868; x_wconf 82' lang='eng' dir='ltr'><em>368T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1522 846 1656 874; x_wconf 87' lang='eng' dir='ltr'><em>(D85836)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 549 882 1248 912; baseline -0.001 -6"><span class='ocrx_word' id='word_1_109' title='bbox 549 883 738 906; x_wconf 85' lang='eng' dir='ltr'><em>Rhodobacter</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 747 883 992 911; x_wconf 84' lang='eng' dir='ltr'><em>ve/dkampiiATCC</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 1003 882 1103 906; x_wconf 82' lang='eng' dir='ltr'><em>35703T</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 1114 883 1248 912; x_wconf 82' lang='eng' dir='ltr'><em>(D16421)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 363 920 1064 949; baseline 0 -6"><span class='ocrx_word' id='word_1_113' title='bbox 363 921 778 943; x_wconf 84' lang='eng' dir='ltr'><em>SilicibacterIacuscaeru/ensis</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 789 920 919 943; x_wconf 91' lang='eng' dir='ltr'><em>|T|—1157T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 930 921 1064 949; x_wconf 90' lang='eng' dir='ltr'><em>(U77644)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 469 958 1177 986; baseline 0.003 -8"><span class='ocrx_word' id='word_1_116' title='bbox 469 961 507 978; x_wconf 84' lang='eng'>10</span> <span class='ocrx_word' id='word_1_117' title='bbox 559 958 1177 986; x_wconf 73' lang='eng' dir='ltr'><em>Octadecabacterantarcticus307T(U14583)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 213 989 1176 1024; baseline 0 -6"><span class='ocrx_word' id='word_1_118' title='bbox 213 989 251 1006; x_wconf 66' lang='eng'>1°</span> <span class='ocrx_word' id='word_1_119' title='bbox 604 996 958 1018; x_wconf 83' lang='eng' dir='ltr'><em>Octadecabacterarcticus</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 967 995 1032 1018; x_wconf 77' lang='eng' dir='ltr'><em>238T</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 1042 996 1176 1024; x_wconf 87' lang='eng' dir='ltr'>(U73725)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 435 1032 1152 1061; baseline 0 -6"><span class='ocrx_word' id='word_1_122' title='bbox 435 1033 626 1055; x_wconf 86' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 635 1033 833 1061; x_wconf 86' lang='eng' dir='ltr'><em>gelatinovorus</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 844 1033 895 1055; x_wconf 95' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 909 1032 1007 1055; x_wconf 88' lang='eng' dir='ltr'><em>12617T</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 1018 1033 1152 1061; x_wconf 80' lang='eng'><em>(088523)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 297 1070 1093 1098; baseline 0 -6"><span class='ocrx_word' id='word_1_127' title='bbox 297 1073 335 1091; x_wconf 89' lang='eng'>10</span> <span class='ocrx_word' id='word_1_128' title='bbox 436 1070 810 1092; x_wconf 81' lang='eng' dir='ltr'><em>Roseobacterdenitrificans</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 819 1070 881 1092; x_wconf 90' lang='eng' dir='ltr'><em>OCh</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 894 1070 954 1092; x_wconf 73' lang='eng' dir='ltr'><em>114T</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 965 1070 1093 1098; x_wconf 93' lang='eng' dir='ltr'><em>(LO1784)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 443 1108 1089 1137; baseline 0 -6"><span class='ocrx_word' id='word_1_132' title='bbox 443 1109 743 1131; x_wconf 83' lang='eng' dir='ltr'><em>Roseobacterlitoralis</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 752 1109 835 1131; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 844 1108 946 1131; x_wconf 80' lang='eng' dir='ltr'><em>49566T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 957 1109 1089 1137; x_wconf 84' lang='eng' dir='ltr'>(X78312)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 137 1144 951 1175; baseline 0.002 -10"><span class='ocrx_word' id='word_1_136' title='bbox 137 1157 160 1175; x_wconf 72' lang='eng'><strong>9</strong></span> <span class='ocrx_word' id='word_1_137' title='bbox 221 1148 247 1165; x_wconf 39' lang='eng'><em>:4</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 402 1145 682 1167; x_wconf 80' lang='eng' dir='ltr'><em>Sulﬁtobacterbrevis</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 693 1144 808 1167; x_wconf 80' lang='eng' dir='ltr'><em>EL—162T</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 818 1145 951 1173; x_wconf 88' lang='eng' dir='ltr'><em>(Y16425)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 376 1182 1075 1211; baseline 0 -6"><span class='ocrx_word' id='word_1_141' title='bbox 376 1182 562 1205; x_wconf 82' lang='eng' dir='ltr'><em>Sulfitobacter</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 569 1183 780 1205; x_wconf 86' lang='eng' dir='ltr'><em>mediterraneus</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 789 1182 933 1205; x_wconf 89' lang='eng' dir='ltr'><em>CH-B427T</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 943 1182 1075 1211; x_wconf 90' lang='eng' dir='ltr'>(Y17387)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 206 1210 967 1248">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 206 1210 967 1248">
+     <span class='ocr_line' id='line_1_33' title="bbox 206 1210 967 1248; baseline 0 -6"><span class='ocrx_word' id='word_1_145' title='bbox 206 1210 230 1227; x_wconf 70' lang='eng'>8</span> <span class='ocrx_word' id='word_1_146' title='bbox 344 1219 967 1248; x_wconf 72' lang='eng' dir='ltr'><em>SulﬁtobacterpontiacusChLG1OT(Y13155)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002519-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002519-0-000.pbm.png
new file mode 100644
index 00000000..1624e39b
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002519-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002519-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002519-0-000.pbm.png.hocr
new file mode 100644
index 00000000..e4510773
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002519-0-000.pbm.png.hocr
@@ -0,0 +1,332 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002519-0-000.pbm.png"; bbox 0 0 1160 939; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 7 11 554 13">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 7 11 554 13">
+     <span class='ocr_line' id='line_1_1' title="bbox 7 11 554 13; baseline 0 926"><span class='ocrx_word' id='word_1_1' title='bbox 7 11 554 13; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 270 0 1125 68">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 270 0 1125 68">
+     <span class='ocr_line' id='line_1_2' title="bbox 570 0 1125 32; baseline 0 -4"><span class='ocrx_word' id='word_1_2' title='bbox 570 5 725 28; x_wconf 63' lang='eng' dir='ltr'><em>Escher/ma</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 735 5 873 28; x_wconf 81' lang='eng' dir='ltr'><em>col/ATCC</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 887 6 894 28; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 906 6 913 28; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 923 0 985 28; x_wconf 78' lang='eng' dir='ltr'><em>775T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 995 2 1125 32; x_wconf 86' lang='eng' dir='ltr'>(X80725)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 270 34 907 68; baseline 0 -7"><span class='ocrx_word' id='word_1_8' title='bbox 270 38 439 61; x_wconf 77' lang='eng' dir='ltr'><em>Comamanas</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 449 38 567 68; x_wconf 68' lang='eng' dir='ltr'><em>{err/gene</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 577 38 642 61; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 656 34 735 61; x_wconf 77' lang='eng' dir='ltr'><em>7099T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 745 36 907 66; x_wconf 88' lang='eng' dir='ltr'>(AJ420326)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 91 67 849 114">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 91 67 849 102">
+     <span class='ocr_line' id='line_1_4' title="bbox 91 67 849 102; baseline 0 -8"><span class='ocrx_word' id='word_1_13' title='bbox 91 79 221 102; x_wconf 62' lang='eng'><em>100—</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 236 71 363 94; x_wconf 69' lang='eng' dir='ltr'><em>SuffereI/a</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 370 71 506 101; x_wconf 82' lang='eng' dir='ltr'><em>parV/rubra</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 514 71 557 94; x_wconf 94' lang='eng' dir='ltr'><em>YIT</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 570 73 577 94; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 589 67 667 94; x_wconf 77' lang='eng' dir='ltr'><em>1816T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 677 69 849 99; x_wconf 84' lang='eng' dir='ltr'><em>(AB300989)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 73 104 130 106">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 73 104 130 106">
+     <span class='ocr_line' id='line_1_5' title="bbox 73 104 130 106; baseline 0 833"><span class='ocrx_word' id='word_1_20' title='bbox 73 104 130 106; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 26 158 75 160">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 26 158 75 160">
+     <span class='ocr_line' id='line_1_6' title="bbox 26 158 75 160; baseline 0 779"><span class='ocrx_word' id='word_1_21' title='bbox 26 158 75 160; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 73 104 75 213">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 73 104 75 213">
+     <span class='ocr_line' id='line_1_7' title="bbox 73 104 75 213; baseline 0 726"><span class='ocrx_word' id='word_1_22' title='bbox 73 104 75 213; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 128 79 130 130">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 128 79 130 130">
+     <span class='ocr_line' id='line_1_8' title="bbox 128 79 130 130; baseline 0 809"><span class='ocrx_word' id='word_1_23' title='bbox 128 79 130 130; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 259 102 1003 198">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 259 102 1003 198">
+     <span class='ocr_line' id='line_1_9' title="bbox 289 102 940 132; baseline 0 -5"><span class='ocrx_word' id='word_1_24' title='bbox 289 104 416 127; x_wconf 72' lang='eng' dir='ltr'><em>Sufferel/a</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 428 105 644 127; x_wconf 81' lang='eng' dir='ltr'><em>wadsworthens/s</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 651 105 720 127; x_wconf 93' lang='eng' dir='ltr'><em>WAL</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 732 105 801 127; x_wconf 90' lang='eng'>7877</span> <span class='ocrx_word' id='word_1_28' title='bbox 813 102 940 132; x_wconf 83' lang='eng' dir='ltr'>(L37785)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 259 133 952 165; baseline 0 -4"><span class='ocrx_word' id='word_1_29' title='bbox 259 138 385 161; x_wconf 73' lang='eng' dir='ltr'><em>Sufferel/a</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 395 138 567 161; x_wconf 78' lang='eng' dir='ltr'><em>sfercor/can/s</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 575 138 668 161; x_wconf 86' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_32' title='bbox 680 133 780 161; x_wconf 71' lang='eng' dir='ltr'><em>47620T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 790 135 952 165; x_wconf 86' lang='eng' dir='ltr'><em>(AJ566849)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 296 168 1003 198; baseline 0 -4"><span class='ocrx_word' id='word_1_34' title='bbox 296 179 355 181; x_wconf 90' lang='eng'>—</span> <span class='ocrx_word' id='word_1_35' title='bbox 365 171 510 194; x_wconf 76' lang='eng' dir='ltr'><em>Uncultured</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 522 171 652 194; x_wconf 86' lang='eng' dir='ltr'><em>bacterium</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 664 171 735 194; x_wconf 88' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_38' title='bbox 748 171 822 194; x_wconf 86' lang='eng' dir='ltr'><em>D093</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 833 168 1003 198; x_wconf 88' lang='eng' dir='ltr'><em>(AY916355)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 128 129 147 130">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 128 129 147 130">
+     <span class='ocr_line' id='line_1_12' title="bbox 128 129 147 130; baseline 0 809"><span class='ocrx_word' id='word_1_40' title='bbox 128 129 147 130; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 145 112 147 147">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 145 112 147 147">
+     <span class='ocr_line' id='line_1_13' title="bbox 145 112 147 147; baseline 0 792"><span class='ocrx_word' id='word_1_41' title='bbox 145 112 147 147; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 119 135 140 150">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 119 135 140 150">
+     <span class='ocr_line' id='line_1_14' title="bbox 119 135 140 150; baseline 0 0"><span class='ocrx_word' id='word_1_42' title='bbox 119 135 140 150; x_wconf 93' lang='eng'><em>77</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 147 146 244 147">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 147 146 244 147">
+     <span class='ocr_line' id='line_1_15' title="bbox 147 146 244 147; baseline 0 792"><span class='ocrx_word' id='word_1_43' title='bbox 147 146 244 147; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 73 211 331 214">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 73 211 331 214">
+     <span class='ocr_line' id='line_1_16' title="bbox 73 211 331 214; baseline 0 725"><span class='ocrx_word' id='word_1_44' title='bbox 73 211 331 214; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 7 11 9 307">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 7 11 9 307">
+     <span class='ocr_line' id='line_1_17' title="bbox 7 11 9 307; baseline 0 632"><span class='ocrx_word' id='word_1_45' title='bbox 7 11 9 307; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 7 305 28 307">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 7 305 28 307">
+     <span class='ocr_line' id='line_1_18' title="bbox 7 305 28 307; baseline 0 632"><span class='ocrx_word' id='word_1_46' title='bbox 7 305 28 307; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 257 202 1160 298">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 257 202 1160 298">
+     <span class='ocr_line' id='line_1_19' title="bbox 257 202 995 232; baseline 0 -5"><span class='ocrx_word' id='word_1_47' title='bbox 257 215 290 230; x_wconf 74' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 340 204 484 227; x_wconf 87' lang='eng' dir='ltr'><em>Uncultured</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 497 204 627 227; x_wconf 84' lang='eng' dir='ltr'><em>bacterium</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 639 204 710 227; x_wconf 88' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_51' title='bbox 722 204 822 227; x_wconf 89' lang='eng' dir='ltr'>HuCA4</span> <span class='ocrx_word' id='word_1_52' title='bbox 833 202 995 232; x_wconf 84' lang='eng' dir='ltr'><em>(AJ408960)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 283 233 1160 266; baseline -0.002 -3"><span class='ocrx_word' id='word_1_53' title='bbox 283 249 304 263; x_wconf 78' lang='eng'><em>72</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 329 237 525 261; x_wconf 82' lang='eng' dir='ltr'><em>Parasuttere/la</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 536 237 799 261; x_wconf 69' lang='eng' dir='ltr'><em>excrement/hominis</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 807 237 852 261; x_wconf 98' lang='eng' dir='ltr'><em>YIT</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 866 239 875 261; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 886 233 969 261; x_wconf 78' lang='eng' dir='ltr'><em>1859T</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 980 235 1160 266; x_wconf 89' lang='eng' dir='ltr'>(AB370250)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 288 269 1031 298; baseline -0.001 -3"><span class='ocrx_word' id='word_1_60' title='bbox 288 280 310 295; x_wconf 74' lang='eng' dir='ltr'><em>es</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 334 271 479 294; x_wconf 86' lang='eng' dir='ltr'><em>Uncultured</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 491 271 621 294; x_wconf 83' lang='eng' dir='ltr'><em>bacterium</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 633 271 704 294; x_wconf 90' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_64' title='bbox 716 270 842 294; x_wconf 87' lang='eng' dir='ltr'><em>014C-E5</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 853 269 1031 298; x_wconf 81' lang='eng' dir='ltr'><em>(D0905669)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 295 179 296 245">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 295 179 296 245">
+     <span class='ocr_line' id='line_1_22' title="bbox 295 179 296 245; baseline 0 694"><span class='ocrx_word' id='word_1_66' title='bbox 295 179 296 245; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 0 313 23 327">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 0 313 23 327">
+     <span class='ocr_line' id='line_1_23' title="bbox 0 313 23 327; baseline 0 0"><span class='ocrx_word' id='word_1_67' title='bbox 0 313 23 327; x_wconf 79' lang='eng'><em>59</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 52 378 54 413">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 52 378 54 413">
+     <span class='ocr_line' id='line_1_24' title="bbox 52 378 54 413; baseline 0 526"><span class='ocrx_word' id='word_1_68' title='bbox 52 378 54 413; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 26 158 28 455">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 26 158 28 455">
+     <span class='ocr_line' id='line_1_25' title="bbox 26 158 28 455; baseline 0 484"><span class='ocrx_word' id='word_1_69' title='bbox 26 158 28 455; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 47 445 49 582">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 47 445 49 582">
+     <span class='ocr_line' id='line_1_26' title="bbox 47 445 49 582; baseline 0 357"><span class='ocrx_word' id='word_1_70' title='bbox 47 445 49 582; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 109 478 131 492">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 109 478 131 492">
+     <span class='ocr_line' id='line_1_27' title="bbox 109 478 131 492; baseline 0 0"><span class='ocrx_word' id='word_1_71' title='bbox 109 478 131 492; x_wconf 88' lang='eng'>87</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 295 302 1134 332">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 295 302 1134 332">
+     <span class='ocr_line' id='line_1_28' title="bbox 295 302 1134 332; baseline 0 -4"><span class='ocrx_word' id='word_1_72' title='bbox 295 308 317 323; x_wconf 75' lang='eng'>80</span> <span class='ocrx_word' id='word_1_73' title='bbox 335 305 479 328; x_wconf 88' lang='eng' dir='ltr'><em>Uncultured</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 492 305 622 328; x_wconf 86' lang='eng' dir='ltr'><em>bacterium</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 634 305 706 328; x_wconf 89' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_76' title='bbox 718 305 807 328; x_wconf 86' lang='eng' dir='ltr'><em>RL304</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 818 305 945 328; x_wconf 86' lang='eng' dir='ltr'><em>aal73c05</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 957 302 1134 332; x_wconf 82' lang='eng' dir='ltr'>(D0824230)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 232 333 970 500">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 232 333 970 500">
+     <span class='ocr_line' id='line_1_29' title="bbox 284 333 970 365; baseline 0 -4"><span class='ocrx_word' id='word_1_79' title='bbox 284 333 318 348; x_wconf 38' lang='eng'><em>10°</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 332 338 476 361; x_wconf 87' lang='eng' dir='ltr'><em>Uncultured</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 489 338 619 361; x_wconf 86' lang='eng' dir='ltr'><em>bacterium</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 631 338 702 361; x_wconf 90' lang='eng' dir='ltr'>clone</span> <span class='ocrx_word' id='word_1_83' title='bbox 715 338 788 361; x_wconf 87' lang='eng' dir='ltr'><em>D769</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 800 335 970 365; x_wconf 83' lang='eng' dir='ltr'><em>(AY986364)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 260 366 798 400; baseline 0 -7"><span class='ocrx_word' id='word_1_85' title='bbox 260 370 424 393; x_wconf 69' lang='eng' dir='ltr'><em>Oxa/obacter</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 431 370 580 400; x_wconf 70' lang='eng' dir='ltr'><em>form/genes</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 588 366 655 393; x_wconf 80' lang='eng' dir='ltr'><em>OxBT</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 665 368 694 397; x_wconf 91' lang='eng' dir='ltr'><em>(U</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 698 372 732 393; x_wconf 83' lang='eng'><em>49</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 737 372 750 393; x_wconf 94' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 754 372 769 393; x_wconf 88' lang='eng'>5</span> <span class='ocrx_word' id='word_1_92' title='bbox 774 368 798 398; x_wconf 90' lang='eng'>7)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 268 399 898 434; baseline 0 -7"><span class='ocrx_word' id='word_1_93' title='bbox 268 404 437 427; x_wconf 61' lang='eng' dir='ltr'><em>Burkho/der/Qa</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 447 404 552 434; x_wconf 60' lang='eng' dir='ltr'><em>cepaC/a</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 559 404 644 427; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 656 399 755 427; x_wconf 75' lang='eng' dir='ltr'><em>25416T</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 766 402 868 431; x_wconf 88' lang='eng' dir='ltr'><em>(U9692</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 874 402 898 431; x_wconf 92' lang='eng'><em>7)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 232 432 808 467; baseline 0 -7"><span class='ocrx_word' id='word_1_99' title='bbox 232 437 315 460; x_wconf 79' lang='eng' dir='ltr'><em>DerX/a</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 323 445 455 467; x_wconf 80' lang='eng' dir='ltr'><em>gummosa</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 465 437 515 460; x_wconf 92' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 529 432 626 460; x_wconf 84' lang='eng' dir='ltr'><em>13946T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 636 435 808 465; x_wconf 87' lang='eng' dir='ltr'>(AB089482)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 290 466 919 500; baseline 0 -7"><span class='ocrx_word' id='word_1_104' title='bbox 290 471 420 493; x_wconf 80' lang='eng' dir='ltr'><em>Brack/e/la</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 430 471 563 500; x_wconf 71' lang='eng' dir='ltr'><em>oed/pod/s</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 571 470 635 494; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 650 472 732 493; x_wconf 89' lang='eng'>19451</span> <span class='ocrx_word' id='word_1_108' title='bbox 740 466 747 477; x_wconf 49' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_109' title='bbox 757 468 919 498; x_wconf 87' lang='eng' dir='ltr'>(AJ277742)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 106 494 138 496">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 106 494 138 496">
+     <span class='ocr_line' id='line_1_34' title="bbox 106 494 138 496; baseline 0 443"><span class='ocrx_word' id='word_1_110' title='bbox 106 494 138 496; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 139 499 953 600">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 139 499 953 600">
+     <span class='ocr_line' id='line_1_35' title="bbox 341 499 953 534; baseline 0 -7"><span class='ocrx_word' id='word_1_111' title='bbox 341 504 440 534; x_wconf 69' lang='eng' dir='ltr'><em>O/I&#39;ge/Aa</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 451 504 573 527; x_wconf 74' lang='eng' dir='ltr'><em>urethra/is</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 580 504 665 527; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 679 505 686 527; x_wconf 94' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 697 499 776 527; x_wconf 77' lang='eng' dir='ltr'><em>7960T</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 786 501 953 532; x_wconf 89' lang='eng' dir='ltr'>(AF227163)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 139 532 855 577; baseline 0 -17"><span class='ocrx_word' id='word_1_117' title='bbox 139 544 256 577; x_wconf 41' lang='eng'><em>£17</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 270 537 393 566; x_wconf 77' lang='eng' dir='ltr'><em>Pe/fslega</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 404 544 529 566; x_wconf 81' lang='eng' dir='ltr'><em>europaea</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 538 536 602 560; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 617 532 715 560; x_wconf 88' lang='eng' dir='ltr'><em>10982T</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 725 534 764 564; x_wconf 93' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 776 534 855 564; x_wconf 88' lang='eng'><em>1890)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 285 565 930 600; baseline 0.002 -8"><span class='ocrx_word' id='word_1_124' title='bbox 285 570 406 600; x_wconf 77' lang='eng' dir='ltr'><em>Tay/ore/la</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 416 570 585 599; x_wconf 62' lang='eng' dir='ltr'><em>eqw&#39;gem&#39;fa/Ils</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 594 569 678 593; x_wconf 91' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 692 571 700 592; x_wconf 93' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 711 571 718 592; x_wconf 93' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 729 571 737 592; x_wconf 90' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 746 565 789 593; x_wconf 73' lang='eng' dir='ltr'><em>84T</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 800 567 930 597; x_wconf 88' lang='eng' dir='ltr'><em>(X68645)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 47 576 267 581">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 47 576 267 581">
+     <span class='ocr_line' id='line_1_38' title="bbox 47 576 267 581; baseline 0 358"><span class='ocrx_word' id='word_1_132' title='bbox 47 576 267 581; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 81 586 138 601">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 81 586 138 601">
+     <span class='ocr_line' id='line_1_39' title="bbox 81 586 138 601; baseline 0 0"><span class='ocrx_word' id='word_1_133' title='bbox 81 586 138 601; x_wconf 80' lang='eng'><em>99—</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 106 494 108 668">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 106 494 108 668">
+     <span class='ocr_line' id='line_1_40' title="bbox 106 494 108 668; baseline 0 271"><span class='ocrx_word' id='word_1_134' title='bbox 106 494 108 668; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 112 863 134 878">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 112 863 134 878">
+     <span class='ocr_line' id='line_1_41' title="bbox 112 863 134 878; baseline 0 0"><span class='ocrx_word' id='word_1_135' title='bbox 112 863 134 878; x_wconf 83' lang='eng'>26</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 194 599 898 664">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 194 599 898 664">
+     <span class='ocr_line' id='line_1_42' title="bbox 194 599 898 631; baseline 0 -4"><span class='ocrx_word' id='word_1_136' title='bbox 194 611 200 613; x_wconf 82' lang='eng'>&#39;</span> <span class='ocrx_word' id='word_1_137' title='bbox 224 604 426 627; x_wconf 77' lang='eng' dir='ltr'><em>Tetrath/bbacler</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 432 604 606 627; x_wconf 75' lang='eng' dir='ltr'><em>kashm/rens/s</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 614 604 711 627; x_wconf 93' lang='eng' dir='ltr'>WT001</span> <span class='ocrx_word' id='word_1_140' title='bbox 719 599 727 611; x_wconf 51' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_141' title='bbox 737 601 851 631; x_wconf 87' lang='eng' dir='ltr'><em>(AJ8644</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 856 601 898 631; x_wconf 91' lang='eng'><em>70)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 194 632 887 664; baseline 0 -4"><span class='ocrx_word' id='word_1_143' title='bbox 194 644 217 646; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_144' title='bbox 233 637 365 660; x_wconf 66' lang='eng' dir='ltr'><em>Advene/Aa</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 375 637 488 660; x_wconf 75' lang='eng' dir='ltr'><em>mcenata</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 497 637 589 660; x_wconf 89' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_147' title='bbox 601 632 701 660; x_wconf 84' lang='eng' dir='ltr'><em>45225T</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 712 634 887 664; x_wconf 81' lang='eng' dir='ltr'><em>(AM944734)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 138 627 194 629">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 138 627 194 629">
+     <span class='ocr_line' id='line_1_44' title="bbox 138 627 194 629; baseline 0 310"><span class='ocrx_word' id='word_1_149' title='bbox 138 627 194 629; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 192 611 194 646">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 192 611 194 646">
+     <span class='ocr_line' id='line_1_45' title="bbox 192 611 194 646; baseline 0 293"><span class='ocrx_word' id='word_1_150' title='bbox 192 611 194 646; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 154 634 188 648">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 154 634 188 648">
+     <span class='ocr_line' id='line_1_46' title="bbox 154 634 188 648; baseline 0 0"><span class='ocrx_word' id='word_1_151' title='bbox 154 634 188 648; x_wconf 85' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 133 666 865 700">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 133 666 865 700">
+     <span class='ocr_line' id='line_1_47' title="bbox 133 666 865 700; baseline 0 -7"><span class='ocrx_word' id='word_1_152' title='bbox 133 677 254 679; x_wconf 90' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_153' title='bbox 267 670 424 700; x_wconf 70' lang='eng' dir='ltr'><em>Aloe/lgenes</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 433 670 535 693; x_wconf 64' lang='eng' dir='ltr'><em>faeca/Ils</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 542 670 627 693; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 638 666 719 693; x_wconf 72' lang='eng' dir='ltr'><em>8750T</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 729 668 865 698; x_wconf 87' lang='eng' dir='ltr'>(M22508)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 145 710 225 712">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 145 710 225 712">
+     <span class='ocr_line' id='line_1_48' title="bbox 145 710 225 712; baseline 0 227"><span class='ocrx_word' id='word_1_158' title='bbox 145 710 225 712; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 136 699 958 898">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 235 699 772 733">
+     <span class='ocr_line' id='line_1_49' title="bbox 235 699 772 733; baseline 0 -7"><span class='ocrx_word' id='word_1_159' title='bbox 235 704 436 733; x_wconf 61' lang='eng' dir='ltr'><em>H&#39;gmem‘whaga</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 446 704 522 727; x_wconf 79' lang='eng' dir='ltr'><em>kul/ae</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 531 699 594 726; x_wconf 76' lang='eng' dir='ltr'><em>K24T</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 605 701 737 731; x_wconf 87' lang='eng' dir='ltr'><em>(AF28291</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 746 701 772 731; x_wconf 90' lang='eng'>6)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 246 732 842 766">
+     <span class='ocr_line' id='line_1_50' title="bbox 246 732 842 766; baseline 0 -7"><span class='ocrx_word' id='word_1_164' title='bbox 246 737 380 759; x_wconf 80' lang='eng' dir='ltr'><em>Kersters/a</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 389 737 496 766; x_wconf 77' lang='eng' dir='ltr'><em>gy/orum</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 505 736 569 760; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 581 732 662 759; x_wconf 76' lang='eng' dir='ltr'><em>5906T</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 673 734 770 764; x_wconf 87' lang='eng' dir='ltr'>(AY131</span> <span class='ocrx_word' id='word_1_169' title='bbox 780 734 842 764; x_wconf 90' lang='eng'>213)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 136 765 951 833">
+     <span class='ocr_line' id='line_1_51' title="bbox 136 765 951 800; baseline -0.002 -6"><span class='ocrx_word' id='word_1_170' title='bbox 136 774 145 789; x_wconf 82' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 148 774 229 795; x_wconf 62' lang='eng' dir='ltr'><em>L—</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 237 770 450 793; x_wconf 77' lang='eng' dir='ltr'><em>Achromobacfer</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 456 770 624 800; x_wconf 73' lang='eng' dir='ltr'><em>xylosoxzdans</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 633 770 699 793; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 713 765 810 793; x_wconf 74' lang='eng' dir='ltr'><em>10346T</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 820 767 860 797; x_wconf 94' lang='eng' dir='ltr'>(Y1</span> <span class='ocrx_word' id='word_1_177' title='bbox 869 767 951 797; x_wconf 89' lang='eng'>4908)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 154 799 827 833; baseline 0.001 -7"><span class='ocrx_word' id='word_1_178' title='bbox 154 799 176 813; x_wconf 72' lang='eng'>97</span> <span class='ocrx_word' id='word_1_179' title='bbox 184 810 219 812; x_wconf 84' lang='eng'>—</span> <span class='ocrx_word' id='word_1_180' title='bbox 230 804 368 827; x_wconf 78' lang='eng' dir='ltr'><em>Bordefel/a</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 375 804 500 833; x_wconf 67' lang='eng' dir='ltr'><em>peﬁuss/s</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 507 803 592 827; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 603 799 684 827; x_wconf 82' lang='eng' dir='ltr'><em>9797T</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 694 801 827 831; x_wconf 88' lang='eng' dir='ltr'><em>(U04950)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 139 832 838 866">
+     <span class='ocr_line' id='line_1_53' title="bbox 139 832 838 866; baseline -0.001 -6"><span class='ocrx_word' id='word_1_185' title='bbox 139 844 228 845; x_wconf 42' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 241 836 417 860; x_wconf 74' lang='eng' dir='ltr'><em>Caste//an/e//a</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 427 837 571 866; x_wconf 80' lang='eng' dir='ltr'><em>defragrans</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 579 832 666 860; x_wconf 87' lang='eng' dir='ltr'><em>54PinT</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 676 834 809 864; x_wconf 87' lang='eng' dir='ltr'><em>(AJ00544</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 814 834 838 864; x_wconf 93' lang='eng'><em>7)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 139 865 958 898">
+     <span class='ocr_line' id='line_1_54' title="bbox 139 865 958 898; baseline 0 -5"><span class='ocrx_word' id='word_1_191' title='bbox 139 876 198 878; x_wconf 88' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_192' title='bbox 210 870 378 893; x_wconf 69' lang='eng' dir='ltr'><em>Pusﬂ/I&#39;nvonas</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 386 870 563 893; x_wconf 75' lang='eng' dir='ltr'><em>noertemann/i</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 569 870 667 893; x_wconf 92' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 680 871 688 893; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 697 865 778 893; x_wconf 88' lang='eng' dir='ltr'><em>4020T</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 788 868 958 898; x_wconf 82' lang='eng' dir='ltr'>(AY695828)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 205 917 228 931">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 205 917 228 931">
+     <span class='ocr_line' id='line_1_55' title="bbox 205 917 228 931; baseline 0 0"><span class='ocrx_word' id='word_1_198' title='bbox 205 917 228 931; x_wconf 89' lang='eng'><em>0.1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 146 726 169 740">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 146 726 169 740">
+     <span class='ocr_line' id='line_1_56' title="bbox 146 726 169 740; baseline 0 0"><span class='ocrx_word' id='word_1_199' title='bbox 146 726 169 740; x_wconf 79' lang='eng'><em>33</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 143 710 145 770">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 143 710 145 770">
+     <span class='ocr_line' id='line_1_57' title="bbox 143 710 145 770; baseline 0 169"><span class='ocrx_word' id='word_1_200' title='bbox 143 710 145 770; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 160 744 237 745">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 160 744 237 745">
+     <span class='ocr_line' id='line_1_58' title="bbox 160 744 237 745; baseline 0 194"><span class='ocrx_word' id='word_1_201' title='bbox 160 744 237 745; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 143 768 160 770">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 143 768 160 770">
+     <span class='ocr_line' id='line_1_59' title="bbox 143 768 160 770; baseline 0 169"><span class='ocrx_word' id='word_1_202' title='bbox 143 768 160 770; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 158 744 160 777">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 158 744 160 777">
+     <span class='ocr_line' id='line_1_60' title="bbox 158 744 160 777; baseline 0 162"><span class='ocrx_word' id='word_1_203' title='bbox 158 744 160 777; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 183 777 184 812">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 183 777 184 812">
+     <span class='ocr_line' id='line_1_61' title="bbox 183 777 184 812; baseline 0 127"><span class='ocrx_word' id='word_1_204' title='bbox 183 777 184 812; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 137 478 140 878">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 137 478 140 878">
+     <span class='ocr_line' id='line_1_62' title="bbox 137 478 140 878; baseline 0 61"><span class='ocrx_word' id='word_1_205' title='bbox 137 478 140 878; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002576-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002576-0-001.pbm.png
new file mode 100644
index 00000000..44c65b1e
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002576-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002576-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002576-0-001.pbm.png.hocr
new file mode 100644
index 00000000..6b7afbb4
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002576-0-001.pbm.png.hocr
@@ -0,0 +1,98 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002576-0-001.pbm.png"; bbox 0 0 994 659; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 118 1 993 620">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 118 1 993 620">
+     <span class='ocr_line' id='line_1_1' title="bbox 298 1 823 30; baseline 0 -4"><span class='ocrx_word' id='word_1_1' title='bbox 298 4 457 26; x_wconf 81' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 468 4 570 26; x_wconf 84' lang='eng' dir='ltr'><em>tolerans</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 581 4 636 26; x_wconf 93' lang='eng' dir='ltr'><em>EL-1</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 645 2 688 26; x_wconf 54' lang='eng'><em>7?</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 697 1 735 30; x_wconf 93' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 746 1 823 30; x_wconf 88' lang='eng'><em>1551)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 309 37 881 67; baseline -0.002 -4"><span class='ocrx_word' id='word_1_7' title='bbox 309 41 468 63; x_wconf 84' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 478 48 595 63; x_wconf 84' lang='eng' dir='ltr'><em>mucosus</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 607 39 716 62; x_wconf 85' lang='eng' dir='ltr'><em>DFL—24T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 725 37 881 67; x_wconf 89' lang='eng' dir='ltr'><em>(AJ534215)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 253 75 853 104; baseline -0.002 -4"><span class='ocrx_word' id='word_1_11' title='bbox 253 77 412 100; x_wconf 84' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 422 75 853 104; x_wconf 72' lang='eng' dir='ltr'><em>aestuariiSMK—122T(EU156066)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 272 112 844 141; baseline 0 -5"><span class='ocrx_word' id='word_1_13' title='bbox 272 114 431 136; x_wconf 82' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 442 114 602 136; x_wconf 85' lang='eng' dir='ltr'><em>nubinhibens</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 613 113 673 136; x_wconf 91' lang='eng' dir='ltr'><em>ISMT</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 682 112 844 141; x_wconf 85' lang='eng' dir='ltr'><em>(AF098495)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 309 148 993 178; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 309 151 468 173; x_wconf 84' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 479 154 643 173; x_wconf 85' lang='eng' dir='ltr'><em>crassostreae</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 653 151 788 173; x_wconf 88' lang='eng' dir='ltr'><em>CV919-31</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 797 149 822 173; x_wconf 68' lang='eng' dir='ltr'><em>QT</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 832 148 888 178; x_wconf 88' lang='eng' dir='ltr'>(AF1</span> <span class='ocrx_word' id='word_1_22' title='bbox 898 148 993 178; x_wconf 88' lang='eng'><em>14484)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 261 185 870 214; baseline 0 -4"><span class='ocrx_word' id='word_1_23' title='bbox 261 188 428 210; x_wconf 84' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 438 188 608 210; x_wconf 85' lang='eng' dir='ltr'><em>halotolerans</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 620 186 697 210; x_wconf 88' lang='eng' dir='ltr'><em>HJ50T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 707 185 870 214; x_wconf 89' lang='eng' dir='ltr'><em>(EU431217)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 280 222 920 251; baseline -0.002 -4"><span class='ocrx_word' id='word_1_27' title='bbox 280 224 426 247; x_wconf 84' lang='eng' dir='ltr'><em>Silicibacter</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 434 225 651 247; x_wconf 85' lang='eng' dir='ltr'><em>lacuscaerulensis</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 661 225 712 246; x_wconf 97' lang='eng' dir='ltr'><em>|T|—1</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 723 226 730 246; x_wconf 97' lang='eng'>1</span> <span class='ocrx_word' id='word_1_31' title='bbox 739 223 783 246; x_wconf 89' lang='eng' dir='ltr'><em>57T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 792 222 920 251; x_wconf 89' lang='eng' dir='ltr'><em>(U77644)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 272 259 827 290; baseline -0.002 -6"><span class='ocrx_word' id='word_1_33' title='bbox 272 261 418 284; x_wconf 78' lang='eng' dir='ltr'><em>Si/icibacter</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 424 261 547 290; x_wconf 79' lang='eng' dir='ltr'><em>pomeroyi</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 556 260 655 284; x_wconf 86' lang='eng' dir='ltr'><em>DSS-3T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 665 259 827 288; x_wconf 87' lang='eng' dir='ltr'>(AF098491)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 241 296 699 327; baseline 0 -7"><span class='ocrx_word' id='word_1_37' title='bbox 241 298 384 321; x_wconf 83' lang='eng' dir='ltr'><em>Marinovum</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 395 298 494 327; x_wconf 84' lang='eng' dir='ltr'><em>a/gico/a</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 505 296 699 325; x_wconf 68' lang='eng' dir='ltr'><em>FF3T(X78315)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 260 333 917 364; baseline 0 -7"><span class='ocrx_word' id='word_1_40' title='bbox 260 335 393 364; x_wconf 84' lang='eng' dir='ltr'><em>Leisingera</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 403 335 662 364; x_wconf 83' lang='eng' dir='ltr'><em>methy/ohalidivorans</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 673 334 744 357; x_wconf 77' lang='eng' dir='ltr'><em>MBQT</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 754 333 917 362; x_wconf 88' lang='eng' dir='ltr'><em>(AY005463)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 239 369 830 401; baseline 0 -7"><span class='ocrx_word' id='word_1_44' title='bbox 239 372 405 394; x_wconf 81' lang='eng' dir='ltr'><em>Phaeobacter</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 412 372 581 401; x_wconf 83' lang='eng' dir='ltr'><em>gallaeciensis</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 592 372 642 394; x_wconf 92' lang='eng' dir='ltr'><em>BS1</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 651 371 694 394; x_wconf 87' lang='eng' dir='ltr'><em>07T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 704 370 742 399; x_wconf 91' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 751 369 830 399; x_wconf 87' lang='eng'>3244)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 313 406 784 437; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 313 409 428 437; x_wconf 85' lang='eng' dir='ltr'><em>Salipiger</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 436 416 553 431; x_wconf 85' lang='eng' dir='ltr'><em>mucosus</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 563 407 610 431; x_wconf 88' lang='eng' dir='ltr'><em>A3T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 620 406 784 435; x_wconf 86' lang='eng' dir='ltr'><em>(AY527274)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 161 443 833 474; baseline 0 -6"><span class='ocrx_word' id='word_1_54' title='bbox 161 457 229 459; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_55' title='bbox 237 446 385 474; x_wconf 84' lang='eng' dir='ltr'><em>Donghicola</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 396 446 517 468; x_wconf 88' lang='eng' dir='ltr'><em>eburneus</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 527 444 651 468; x_wconf 83' lang='eng' dir='ltr'><em>SW-277T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 661 443 833 472; x_wconf 83' lang='eng' dir='ltr'><em>(D0667965)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 246 480 785 509; baseline -0.002 -4"><span class='ocrx_word' id='word_1_59' title='bbox 246 483 412 505; x_wconf 83' lang='eng' dir='ltr'><em>Roseobacter</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 421 483 512 505; x_wconf 83' lang='eng' dir='ltr'><em>Iitoralis</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 523 482 576 505; x_wconf 88' lang='eng' dir='ltr'><em>Och</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 589 481 649 504; x_wconf 80' lang='eng' dir='ltr'><em>149T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 659 480 785 509; x_wconf 85' lang='eng' dir='ltr'><em>(X78312)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 118 494 816 569; baseline 0 -28"><span class='ocrx_word' id='word_1_64' title='bbox 118 494 404 569; x_wconf 56' lang='eng' dir='ltr'><em>EESu/fitobacter</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 411 519 538 548; x_wconf 84' lang='eng' dir='ltr'><em>pontiacus</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 548 519 625 542; x_wconf 88' lang='eng' dir='ltr'><em>ChLG</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 639 518 680 541; x_wconf 90' lang='eng' dir='ltr'><em>10T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 690 517 728 546; x_wconf 94' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 737 517 816 546; x_wconf 89' lang='eng'><em>3155)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 131 554 823 583; baseline 0 -5"><span class='ocrx_word' id='word_1_70' title='bbox 131 555 154 570; x_wconf 76' lang='eng'>59</span> <span class='ocrx_word' id='word_1_71' title='bbox 219 556 386 578; x_wconf 80' lang='eng' dir='ltr'><em>Sulfitobacter</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 395 556 482 578; x_wconf 87' lang='eng' dir='ltr'><em>dubius</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 493 556 558 578; x_wconf 94' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 570 554 649 578; x_wconf 87' lang='eng' dir='ltr'><em>3554T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 659 554 717 583; x_wconf 90' lang='eng' dir='ltr'>(AY1</span> <span class='ocrx_word' id='word_1_76' title='bbox 726 557 771 578; x_wconf 91' lang='eng'>801</span> <span class='ocrx_word' id='word_1_77' title='bbox 780 554 823 583; x_wconf 84' lang='eng'><em>02)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 242 591 901 620; baseline 0 -5"><span class='ocrx_word' id='word_1_78' title='bbox 242 593 373 615; x_wconf 81' lang='eng' dir='ltr'><em>Loktane/la</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 386 593 553 615; x_wconf 82' lang='eng' dir='ltr'><em>vestfoldensis</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 564 593 625 616; x_wconf 85' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 638 591 735 615; x_wconf 85' lang='eng' dir='ltr'><em>22003T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 745 591 901 620; x_wconf 83' lang='eng' dir='ltr'><em>(AJ582226)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 40 622 925 659">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 40 622 925 659">
+     <span class='ocr_line' id='line_1_18' title="bbox 40 622 925 659; baseline 0 -7"><span class='ocrx_word' id='word_1_83' title='bbox 40 622 304 659; x_wconf 88' lang='eng'><em>\—</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 311 630 477 652; x_wconf 85' lang='eng' dir='ltr'><em>Burkholderia</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 488 630 588 659; x_wconf 86' lang='eng' dir='ltr'><em>cepacia</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 597 630 679 652; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 690 631 753 652; x_wconf 87' lang='eng'><em>2541</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 762 629 787 652; x_wconf 89' lang='eng' dir='ltr'><em>6T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 797 628 925 657; x_wconf 85' lang='eng' dir='ltr'><em>(U96927)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 117 12 307 440">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 117 12 307 440">
+     <span class='ocr_line' id='line_1_19' title="bbox 156 12 307 61; baseline 0 -17"><span class='ocrx_word' id='word_1_90' title='bbox 156 12 307 61; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 126 61 306 228; baseline 0 -110"><span class='ocrx_word' id='word_1_91' title='bbox 126 61 306 228; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 117 228 270 281; baseline 0 378"><span class='ocrx_word' id='word_1_92' title='bbox 117 228 270 281; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 126 281 258 366; baseline 0 0"><span class='ocrx_word' id='word_1_93' title='bbox 126 281 258 366; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 126 366 233 440; baseline 0 -45"><span class='ocrx_word' id='word_1_94' title='bbox 126 366 164 440; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_95' title='bbox 187 366 233 395; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 36 97 78 112">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 36 97 78 112">
+     <span class='ocr_line' id='line_1_24' title="bbox 36 97 78 112; baseline 0 0"><span class='ocrx_word' id='word_1_96' title='bbox 36 97 78 112; x_wconf 64' lang='eng'><em>0,02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 88 369 187 388">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 88 369 187 388">
+     <span class='ocr_line' id='line_1_25' title="bbox 88 369 187 388; baseline 0 0"><span class='ocrx_word' id='word_1_97' title='bbox 88 369 111 384; x_wconf 83' lang='eng'><em>57</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 164 373 187 388; x_wconf 86' lang='eng'><strong>96</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 159 423 161 459">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 159 423 161 459">
+     <span class='ocr_line' id='line_1_26' title="bbox 159 423 161 459; baseline 0 200"><span class='ocrx_word' id='word_1_99' title='bbox 159 423 161 459; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 116 254 118 523">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 116 254 118 523">
+     <span class='ocr_line' id='line_1_27' title="bbox 116 254 118 523; baseline 0 136"><span class='ocrx_word' id='word_1_100' title='bbox 116 254 118 523; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002592-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002592-0-000.pbm.png
new file mode 100644
index 00000000..2b8ac480
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002592-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002592-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002592-0-000.pbm.png.hocr
new file mode 100644
index 00000000..3ef82852
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002592-0-000.pbm.png.hocr
@@ -0,0 +1,183 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002592-0-000.pbm.png"; bbox 0 0 1302 794; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 415 0 1302 794">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 593 0 1139 29">
+     <span class='ocr_line' id='line_1_1' title="bbox 593 0 1139 29; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 593 3 809 23; x_wconf 88' lang='eng' dir='ltr'><em>Planomicrobium</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 817 3 904 29; x_wconf 86' lang='eng' dir='ltr'><em>glaciei</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 912 0 983 23; x_wconf 77' lang='eng' dir='ltr'><em>0423T</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 993 3 1139 28; x_wconf 82' lang='eng' dir='ltr'><em>(EU036220)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 547 38 1123 66">
+     <span class='ocr_line' id='line_1_2' title="bbox 547 38 1123 66; baseline 0 -5"><span class='ocrx_word' id='word_1_5' title='bbox 547 41 743 61; x_wconf 83' lang='eng' dir='ltr'><em>Planomicrobium</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 752 41 861 61; x_wconf 82' lang='eng' dir='ltr'><em>chinense</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 872 38 974 61; x_wconf 81' lang='eng' dir='ltr'><em>DX3-12T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 983 41 1123 66; x_wconf 86' lang='eng' dir='ltr'><em>(AJ697862)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 508 77 1167 105">
+     <span class='ocr_line' id='line_1_3' title="bbox 508 77 1167 105; baseline 0 -6"><span class='ocrx_word' id='word_1_9' title='bbox 508 79 704 100; x_wconf 88' lang='eng' dir='ltr'><em>Planomicrobium</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 713 79 851 100; x_wconf 83' lang='eng' dir='ltr'><em>mcmeekinii</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 860 79 917 100; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 930 77 1014 100; x_wconf 78' lang='eng' dir='ltr'><em>13963T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1024 79 1167 105; x_wconf 87' lang='eng' dir='ltr'>(AF041791)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 548 115 1293 143">
+     <span class='ocr_line' id='line_1_4' title="bbox 548 115 1293 143; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 548 117 745 137; x_wconf 85' lang='eng' dir='ltr'><em>Planomicrobium</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 754 117 949 137; x_wconf 85' lang='eng' dir='ltr'><em>alkanoc/asticum</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 959 117 1045 137; x_wconf 91' lang='eng' dir='ltr'><strong>NCIMB</strong></span> <span class='ocrx_word' id='word_1_17' title='bbox 1057 115 1142 137; x_wconf 75' lang='eng' dir='ltr'><em>13489T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1151 117 1293 143; x_wconf 81' lang='eng' dir='ltr'><em>(AF029364)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 484 153 1039 181">
+     <span class='ocr_line' id='line_1_5' title="bbox 484 153 1039 181; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 484 156 680 176; x_wconf 82' lang='eng' dir='ltr'><em>Planomicrobium</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 689 156 802 176; x_wconf 88' lang='eng' dir='ltr'><em>koreense</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 810 153 887 176; x_wconf 70' lang='eng' dir='ltr'>JGO7T</span> <span class='ocrx_word' id='word_1_22' title='bbox 897 156 1039 181; x_wconf 89' lang='eng' dir='ltr'><em>(AF144750)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 499 191 1173 220">
+     <span class='ocr_line' id='line_1_6' title="bbox 499 191 1173 220; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 499 194 695 214; x_wconf 84' lang='eng' dir='ltr'><em>Planomicrobium</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 703 194 881 220; x_wconf 86' lang='eng' dir='ltr'><em>psychrophilum</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 890 194 949 214; x_wconf 88' lang='eng' dir='ltr'><em>CMS</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 960 191 1024 214; x_wconf 83' lang='eng' dir='ltr'><em>530rT</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1034 194 1173 219; x_wconf 87' lang='eng' dir='ltr'><em>(AJ314746)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 415 229 1114 257">
+     <span class='ocr_line' id='line_1_7' title="bbox 415 229 1114 257; baseline 0 -5"><span class='ocrx_word' id='word_1_28' title='bbox 415 241 467 243; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_29' title='bbox 476 232 672 252; x_wconf 72' lang='eng' dir='ltr'><em>Planomicroblum</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 682 232 843 252; x_wconf 81' lang='eng' dir='ltr'><em>okeanokoites</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 853 232 896 252; x_wconf 91' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 908 229 993 252; x_wconf 77' lang='eng' dir='ltr'><em>12536T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 1002 232 1114 257; x_wconf 84' lang='eng' dir='ltr'><em>(D55729)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 630 268 1225 296">
+     <span class='ocr_line' id='line_1_8' title="bbox 630 268 1225 296; baseline -0.002 -5"><span class='ocrx_word' id='word_1_34' title='bbox 630 270 785 291; x_wconf 84' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 794 270 964 291; x_wconf 77' lang='eng' dir='ltr'><em>stackebrandtii</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 974 268 1071 291; x_wconf 79' lang='eng' dir='ltr'><em>K22-03T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1081 270 1225 296; x_wconf 87' lang='eng' dir='ltr'><em>(AY437845)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 522 307 1111 335">
+     <span class='ocr_line' id='line_1_9' title="bbox 522 307 1111 335; baseline 0 -6"><span class='ocrx_word' id='word_1_38' title='bbox 522 309 678 329; x_wconf 85' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 687 309 819 329; x_wconf 81' lang='eng' dir='ltr'><em>antarct/cus</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 828 309 888 329; x_wconf 89' lang='eng' dir='ltr'><em>CMS</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 897 307 962 329; x_wconf 88' lang='eng' dir='ltr'><em>260rT</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 972 309 1111 335; x_wconf 86' lang='eng' dir='ltr'><em>(AJ314745)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 601 344 1128 373">
+     <span class='ocr_line' id='line_1_10' title="bbox 601 344 1128 373; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 601 347 756 367; x_wconf 78' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 765 347 845 367; x_wconf 84' lang='eng' dir='ltr'><em>kocurii</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 854 347 911 367; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 922 344 1008 367; x_wconf 90' lang='eng' dir='ltr'><em>20747T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1018 347 1128 373; x_wconf 85' lang='eng' dir='ltr'>(X62173)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 489 383 1002 411">
+     <span class='ocr_line' id='line_1_11' title="bbox 489 383 1002 411; baseline 0 -5"><span class='ocrx_word' id='word_1_48' title='bbox 489 385 645 406; x_wconf 84' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 654 385 772 406; x_wconf 81' lang='eng' dir='ltr'><em>maritimus</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 781 383 849 406; x_wconf 84' lang='eng' dir='ltr'><em>TF-9T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 859 385 1002 411; x_wconf 90' lang='eng' dir='ltr'><em>(AF500007)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 521 421 1017 449">
+     <span class='ocr_line' id='line_1_12' title="bbox 521 421 1017 449; baseline 0 -5"><span class='ocrx_word' id='word_1_52' title='bbox 521 424 676 444; x_wconf 84' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 685 424 816 444; x_wconf 76' lang='eng' dir='ltr'><em>maitriensis</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 825 421 868 444; x_wconf 91' lang='eng' dir='ltr'><em>S1T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 878 424 1017 449; x_wconf 86' lang='eng' dir='ltr'><em>(AJ544622)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 621 459 1168 487">
+     <span class='ocr_line' id='line_1_13' title="bbox 621 459 1168 487; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 621 462 776 482; x_wconf 84' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 785 462 904 482; x_wconf 78' lang='eng' dir='ltr'><em>columbae</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 914 462 943 487; x_wconf 88' lang='eng' dir='ltr'>Pg</span> <span class='ocrx_word' id='word_1_59' title='bbox 948 462 988 482; x_wconf 89' lang='eng' dir='ltr'><em>EX1</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 996 459 1019 482; x_wconf 94' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1029 462 1168 487; x_wconf 87' lang='eng' dir='ltr'>(AJ966515)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 450 497 1007 528">
+     <span class='ocr_line' id='line_1_14' title="bbox 450 497 1007 528; baseline 0 -8"><span class='ocrx_word' id='word_1_62' title='bbox 450 511 474 528; x_wconf 77' lang='eng'><em>77</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 506 500 662 520; x_wconf 83' lang='eng' dir='ltr'><em>Planococous</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 671 500 801 520; x_wconf 82' lang='eng' dir='ltr'><em>riﬁetoensis</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 811 497 858 520; x_wconf 89' lang='eng' dir='ltr'><em>M8T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 868 500 1007 526; x_wconf 86' lang='eng' dir='ltr'><em>(AJ493659)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 533 536 1074 564">
+     <span class='ocr_line' id='line_1_15' title="bbox 533 536 1074 564; baseline -0.002 -5"><span class='ocrx_word' id='word_1_67' title='bbox 533 538 689 559; x_wconf 83' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 698 538 778 559; x_wconf 84' lang='eng' dir='ltr'><em>citreus</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 787 538 873 559; x_wconf 89' lang='eng' dir='ltr'><strong>NCIMB</strong></span> <span class='ocrx_word' id='word_1_70' title='bbox 886 536 955 559; x_wconf 73' lang='eng' dir='ltr'><em>1493T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 964 538 1074 564; x_wconf 89' lang='eng' dir='ltr'><em>(X62172)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 557 574 1108 602">
+     <span class='ocr_line' id='line_1_16' title="bbox 557 574 1108 602; baseline -0.002 -5"><span class='ocrx_word' id='word_1_72' title='bbox 557 576 718 602; x_wconf 85' lang='eng' dir='ltr'><em>Sporosarcina</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 727 576 861 602; x_wconf 75' lang='eng' dir='ltr'><em>aquimarina</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 872 574 956 597; x_wconf 86' lang='eng' dir='ltr'><em>SW28T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 966 576 1108 602; x_wconf 89' lang='eng' dir='ltr'><em>(AF202056)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 645 613 1101 641">
+     <span class='ocr_line' id='line_1_17' title="bbox 645 613 1101 641; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 645 615 731 635; x_wconf 78' lang='eng' dir='ltr'><em>Kurth/a</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 740 615 805 641; x_wconf 84' lang='eng' dir='ltr'><em>zopﬁi</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 813 615 899 635; x_wconf 91' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 910 613 980 635; x_wconf 74' lang='eng' dir='ltr'><em>9878T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 990 615 1101 641; x_wconf 87' lang='eng' dir='ltr'><em>(X70321)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 557 651 1182 717">
+     <span class='ocr_line' id='line_1_18' title="bbox 557 651 1133 679; baseline 0.002 -6"><span class='ocrx_word' id='word_1_81' title='bbox 557 654 719 679; x_wconf 83' lang='eng' dir='ltr'><em>Lysinibacillus</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 727 654 859 679; x_wconf 81' lang='eng' dir='ltr'><em>sphaericus</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 870 654 915 673; x_wconf 94' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 928 651 1012 674; x_wconf 82' lang='eng' dir='ltr'><em>13420T</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1022 654 1133 679; x_wconf 87' lang='eng' dir='ltr'><em>(D16280)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 647 689 1182 717; baseline -0.002 -5"><span class='ocrx_word' id='word_1_86' title='bbox 647 691 810 717; x_wconf 82' lang='eng' dir='ltr'><em>Caryophanon</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 819 691 885 712; x_wconf 83' lang='eng' dir='ltr'><em>latum</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 895 691 981 712; x_wconf 90' lang='eng' dir='ltr'><strong>NCIMB</strong></span> <span class='ocrx_word' id='word_1_89' title='bbox 991 689 1062 712; x_wconf 78' lang='eng' dir='ltr'><em>9533T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1072 691 1182 717; x_wconf 89' lang='eng' dir='ltr'><em>(X70314)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 516 727 991 755">
+     <span class='ocr_line' id='line_1_20' title="bbox 516 727 991 755; baseline 0 -5"><span class='ocrx_word' id='word_1_91' title='bbox 516 730 610 750; x_wconf 84' lang='eng' dir='ltr'><em>Bacillus</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 618 730 702 750; x_wconf 81' lang='eng' dir='ltr'><em>subti/is</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 712 730 789 750; x_wconf 92' lang='eng' dir='ltr'><em>NCDO</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 802 727 870 750; x_wconf 79' lang='eng' dir='ltr'><em>1769T</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 881 730 991 755; x_wconf 88' lang='eng' dir='ltr'>(X60646)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 649 766 1302 794">
+     <span class='ocr_line' id='line_1_21' title="bbox 649 766 1302 794; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 649 768 852 794; x_wconf 84' lang='eng' dir='ltr'><em>Exiguobacterium</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 862 768 1012 788; x_wconf 80' lang='eng' dir='ltr'><em>aurantiacum</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1022 768 1101 788; x_wconf 90' lang='eng' dir='ltr'><em>NCDO</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1111 766 1182 788; x_wconf 77' lang='eng' dir='ltr'><em>2321T</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 1192 768 1302 794; x_wconf 84' lang='eng' dir='ltr'><em>(X70316)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 165 7 616 501">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 165 7 616 501">
+     <span class='ocr_line' id='line_1_22' title="bbox 392 7 588 80; baseline 0 0"><span class='ocrx_word' id='word_1_101' title='bbox 392 7 588 80; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 385 80 542 157; baseline 0 -18"><span class='ocrx_word' id='word_1_102' title='bbox 385 80 542 157; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 365 157 484 195; baseline 0 599"><span class='ocrx_word' id='word_1_103' title='bbox 365 157 484 195; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 252 195 495 271; baseline 0 0"><span class='ocrx_word' id='word_1_104' title='bbox 252 195 495 271; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 252 271 516 310; baseline 0 484"><span class='ocrx_word' id='word_1_105' title='bbox 252 271 516 310; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 252 310 597 369; baseline 0 0"><span class='ocrx_word' id='word_1_106' title='bbox 252 310 597 369; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 165 369 489 425; baseline 0 -38"><span class='ocrx_word' id='word_1_107' title='bbox 165 369 489 425; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 165 425 516 463; baseline 0 331"><span class='ocrx_word' id='word_1_108' title='bbox 165 425 516 463; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 165 463 616 501; baseline 0 -31"><span class='ocrx_word' id='word_1_109' title='bbox 165 463 616 501; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 153 233 192 250">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 153 233 192 250">
+     <span class='ocr_line' id='line_1_31' title="bbox 153 233 192 250; baseline 0 0"><span class='ocrx_word' id='word_1_110' title='bbox 153 233 192 250; x_wconf 88' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 412 244 414 281">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 412 244 414 281">
+     <span class='ocr_line' id='line_1_32' title="bbox 412 244 414 281; baseline 0 513"><span class='ocrx_word' id='word_1_111' title='bbox 412 244 414 281; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 0 470 644 783">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 0 470 644 769">
+     <span class='ocr_line' id='line_1_33' title="bbox 95 470 616 543; baseline 0 -61"><span class='ocrx_word' id='word_1_112' title='bbox 95 501 450 543; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_113' title='bbox 445 470 616 482; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 95 543 533 578; baseline 0 216"><span class='ocrx_word' id='word_1_114' title='bbox 95 543 533 578; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 95 578 557 616; baseline 0 178"><span class='ocrx_word' id='word_1_115' title='bbox 95 578 557 616; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 0 616 644 637; baseline 0 157"><span class='ocrx_word' id='word_1_116' title='bbox 0 616 644 637; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 0 637 557 693; baseline 0 101"><span class='ocrx_word' id='word_1_117' title='bbox 0 637 557 693; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 0 693 511 713; baseline 0 81"><span class='ocrx_word' id='word_1_118' title='bbox 0 693 511 713; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 0 713 516 769; baseline 0 25"><span class='ocrx_word' id='word_1_119' title='bbox 0 713 516 769; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 421 478 445 495">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 421 478 445 495">
+     <span class='ocr_line' id='line_1_40' title="bbox 421 478 445 495; baseline 0 0"><span class='ocrx_word' id='word_1_120' title='bbox 421 478 445 495; x_wconf 87' lang='eng'><em>80</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 307 662 309 702">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 307 662 309 702">
+     <span class='ocr_line' id='line_1_41' title="bbox 307 662 309 702; baseline 0 92"><span class='ocrx_word' id='word_1_121' title='bbox 307 662 309 702; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002618-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002618-0-001.pbm.png
new file mode 100644
index 00000000..30994263
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002618-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002618-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002618-0-001.pbm.png.hocr
new file mode 100644
index 00000000..6cbd995b
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002618-0-001.pbm.png.hocr
@@ -0,0 +1,174 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002618-0-001.pbm.png"; bbox 0 0 1300 697; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 82 161 84 515">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 82 161 84 515">
+     <span class='ocr_line' id='line_1_1' title="bbox 82 161 84 515; baseline 0 182"><span class='ocrx_word' id='word_1_1' title='bbox 82 161 84 515; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 28 338 30 609">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 28 338 30 609">
+     <span class='ocr_line' id='line_1_2' title="bbox 28 338 30 609; baseline 0 88"><span class='ocrx_word' id='word_1_2' title='bbox 28 338 30 609; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 1 472 3 682">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 1 472 3 682">
+     <span class='ocr_line' id='line_1_3' title="bbox 1 472 3 682; baseline 0 15"><span class='ocrx_word' id='word_1_3' title='bbox 1 472 3 682; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 395 42 686 47">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 395 42 686 47">
+     <span class='ocr_line' id='line_1_4' title="bbox 395 42 686 47; baseline 0 650"><span class='ocrx_word' id='word_1_4' title='bbox 395 42 686 47; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 68 1 1238 89">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 103 1 1238 89">
+     <span class='ocr_line' id='line_1_5' title="bbox 684 1 1142 26; baseline 0 -6"><span class='ocrx_word' id='word_1_5' title='bbox 684 1 806 21; x_wconf 85' lang='eng' dir='ltr'><strong><em>Filimonas</em></strong></span> <span class='ocrx_word' id='word_1_6' title='bbox 814 1 912 21; x_wconf 85' lang='eng' dir='ltr'><em>lacunae</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 919 1 992 20; x_wconf 91' lang='eng' dir='ltr'><em>YT21T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 1001 1 1142 26; x_wconf 86' lang='eng' dir='ltr'>(AB362776)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 103 10 1238 85; baseline 0.001 -33"><span class='ocrx_word' id='word_1_9' title='bbox 103 29 141 44; x_wconf 71' lang='eng'><em>0-02</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 422 10 429 85; x_wconf 45' lang='eng' dir='ltr'>E</span> <span class='ocrx_word' id='word_1_11' title='bbox 695 33 843 58; x_wconf 76' lang='eng' dir='ltr'><em>Segetibacter</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 849 34 961 53; x_wconf 85' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 970 33 1027 53; x_wconf 83' lang='eng' dir='ltr'>Gsoil</span> <span class='ocrx_word' id='word_1_14' title='bbox 1037 32 1090 53; x_wconf 78' lang='eng' dir='ltr'><em>664T</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1099 34 1238 58; x_wconf 77' lang='eng' dir='ltr'>(A3267478)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 664 64 1060 89; baseline 0 -5"><span class='ocrx_word' id='word_1_16' title='bbox 664 65 794 84; x_wconf 83' lang='eng' dir='ltr'><em>Terrimonas</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 802 65 858 84; x_wconf 80' lang='eng' dir='ltr'><em>lutea</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 868 64 912 84; x_wconf 76' lang='eng' dir='ltr'><em>DYT</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 922 65 1060 89; x_wconf 86' lang='eng' dir='ltr'>(AB192292)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 468 74 1242 122">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 468 74 1242 122">
+     <span class='ocr_line' id='line_1_8' title="bbox 468 74 1242 122; baseline 0 -6"><span class='ocrx_word' id='word_1_20' title='bbox 468 74 686 109; x_wconf 56' lang='eng' dir='ltr'>C</span> <span class='ocrx_word' id='word_1_21' title='bbox 696 97 826 116; x_wconf 85' lang='eng' dir='ltr'><em>Terrimonas</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 835 97 952 122; x_wconf 86' lang='eng' dir='ltr'><em>ferruginea</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 960 97 1030 116; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 1042 96 1122 116; x_wconf 70' lang='eng' dir='ltr'><em>13524T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1132 97 1242 121; x_wconf 84' lang='eng' dir='ltr'>(M62798)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 470 128 1190 185">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 613 128 1190 185">
+     <span class='ocr_line' id='line_1_9' title="bbox 613 128 1190 172; baseline 0 -24"><span class='ocrx_word' id='word_1_26' title='bbox 613 138 644 172; x_wconf 64' lang='eng' dir='ltr'>E</span> <span class='ocrx_word' id='word_1_27' title='bbox 652 129 751 149; x_wconf 82' lang='eng' dir='ltr'><em>Niaste/la</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 759 129 913 154; x_wconf 86' lang='eng' dir='ltr'><em>yeongjuensis</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 922 128 1038 149; x_wconf 79' lang='eng' dir='ltr'><em>GR20—13T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1047 129 1190 153; x_wconf 84' lang='eng' dir='ltr'>(DQ244076)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 651 160 1148 185; baseline 0 -5"><span class='ocrx_word' id='word_1_31' title='bbox 651 161 751 180; x_wconf 80' lang='eng' dir='ltr'><em>Niaste/la</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 760 161 872 180; x_wconf 85' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 881 160 996 180; x_wconf 84' lang='eng' dir='ltr'><em>GR20-1OT</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1006 161 1148 185; x_wconf 84' lang='eng' dir='ltr'>(DQ244077)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 470 192 1234 281">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 515 192 1234 281">
+     <span class='ocr_line' id='line_1_11' title="bbox 631 192 1090 218; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 631 193 783 218; x_wconf 80' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 793 194 859 212; x_wconf 84' lang='eng' dir='ltr'><em>terrae</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 870 192 942 212; x_wconf 72' lang='eng' dir='ltr'><em>KP01T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 952 193 1090 217; x_wconf 89' lang='eng' dir='ltr'>(AB278570)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 515 202 1234 269; baseline 0 -25"><span class='ocrx_word' id='word_1_39' title='bbox 515 202 526 251; x_wconf 55' lang='eng' dir='ltr'><em>‘E</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 576 202 768 269; x_wconf 65' lang='eng' dir='ltr'><em>EChitinophaga</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 777 225 957 249; x_wconf 74' lang='eng' dir='ltr'><em>ginsengisegetis</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 966 225 1024 244; x_wconf 87' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1034 224 1087 244; x_wconf 82' lang='eng' dir='ltr'><em>040T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1096 225 1234 249; x_wconf 80' lang='eng' dir='ltr'>(A8264798)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 627 256 1183 281; baseline 0 -5"><span class='ocrx_word' id='word_1_45' title='bbox 627 257 780 281; x_wconf 81' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 789 257 920 276; x_wconf 84' lang='eng' dir='ltr'><em>arvensico/a</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 931 257 973 276; x_wconf 94' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 986 256 1066 276; x_wconf 74' lang='eng' dir='ltr'><em>12650T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1075 257 1183 281; x_wconf 86' lang='eng' dir='ltr'>(D12657)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 487 288 1256 396">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 636 288 1256 345">
+     <span class='ocr_line' id='line_1_14' title="bbox 636 288 1212 313; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 636 289 788 313; x_wconf 80' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 793 289 922 313; x_wconf 84' lang='eng' dir='ltr'><em>japonensis</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 932 289 972 308; x_wconf 93' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 984 288 1064 308; x_wconf 73' lang='eng' dir='ltr'><em>16041T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 1074 289 1212 313; x_wconf 87' lang='eng' dir='ltr'>(ABO78055)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 695 320 1256 345; baseline 0 -5"><span class='ocrx_word' id='word_1_55' title='bbox 695 320 848 345; x_wconf 80' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 857 321 970 340; x_wconf 82' lang='eng' dir='ltr'><em>skermanii</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 977 320 1104 340; x_wconf 69' lang='eng' dir='ltr'><em>CC-SG1BT</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1113 320 1256 345; x_wconf 85' lang='eng' dir='ltr'>(DQ062743)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 437 44 439 124">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 437 44 439 124">
+     <span class='ocr_line' id='line_1_16' title="bbox 437 44 439 124; baseline 0 573"><span class='ocrx_word' id='word_1_59' title='bbox 437 44 439 124; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 395 46 398 279">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 395 46 398 279">
+     <span class='ocr_line' id='line_1_17' title="bbox 395 46 398 279; baseline 0 418"><span class='ocrx_word' id='word_1_60' title='bbox 395 46 398 279; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 469 92 471 330">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 469 92 471 330">
+     <span class='ocr_line' id='line_1_18' title="bbox 469 92 471 330; baseline 0 367"><span class='ocrx_word' id='word_1_61' title='bbox 469 92 471 330; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 468 328 690 331">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 468 328 690 331">
+     <span class='ocr_line' id='line_1_19' title="bbox 468 328 690 331; baseline 0 366"><span class='ocrx_word' id='word_1_62' title='bbox 468 328 690 331; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 485 297 488 360">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 485 297 488 360">
+     <span class='ocr_line' id='line_1_20' title="bbox 485 297 488 360; baseline 0 337"><span class='ocrx_word' id='word_1_63' title='bbox 485 297 488 360; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 84 352 1248 536">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 84 352 1248 536">
+     <span class='ocr_line' id='line_1_21' title="bbox 671 352 1190 377; baseline 0.002 -6"><span class='ocrx_word' id='word_1_64' title='bbox 671 352 824 377; x_wconf 80' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 833 353 902 372; x_wconf 78' lang='eng' dir='ltr'><em>sancti</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 911 352 951 372; x_wconf 93' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 962 352 1043 372; x_wconf 84' lang='eng' dir='ltr'><em>15057T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1052 353 1190 377; x_wconf 84' lang='eng' dir='ltr'>(ABO78066)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 702 383 1248 409; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 702 384 855 409; x_wconf 83' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 863 385 959 409; x_wconf 82' lang='eng' dir='ltr'><em>pinensis</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 967 384 1023 404; x_wconf 87' lang='eng' dir='ltr'><em>ACM</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1034 383 1102 404; x_wconf 77' lang='eng' dir='ltr'><em>2034T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1111 385 1248 409; x_wconf 89' lang='eng' dir='ltr'>(AFO78775)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 578 392 1223 459; baseline 0 -24"><span class='ocrx_word' id='word_1_74' title='bbox 578 392 589 444; x_wconf 59' lang='eng' dir='ltr'><em>‘E</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 630 392 639 459; x_wconf 45' lang='eng'><strong>%</strong></span> <span class='ocrx_word' id='word_1_76' title='bbox 648 416 800 441; x_wconf 80' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 809 416 947 441; x_wconf 75' lang='eng' dir='ltr'><em>ginsengisoli</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 955 416 1012 436; x_wconf 80' lang='eng' dir='ltr'><strong>Gsoil</strong></span> <span class='ocrx_word' id='word_1_79' title='bbox 1022 415 1075 436; x_wconf 87' lang='eng' dir='ltr'><em>052T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1084 416 1223 440; x_wconf 85' lang='eng' dir='ltr'>(AB245374)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 651 447 1198 473; baseline 0 -6"><span class='ocrx_word' id='word_1_81' title='bbox 651 448 804 473; x_wconf 80' lang='eng' dir='ltr'><em>Chitinophaga</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 813 448 908 467; x_wconf 85' lang='eng' dir='ltr'><em>ﬁliformis</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 918 448 958 467; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 970 447 1050 467; x_wconf 71' lang='eng' dir='ltr'><em>15056T</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1060 448 1198 472; x_wconf 81' lang='eng' dir='ltr'>(AB078049)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 183 479 1151 505; baseline 0 -6"><span class='ocrx_word' id='word_1_86' title='bbox 183 490 632 491; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_87' title='bbox 642 480 767 504; x_wconf 84' lang='eng' dir='ltr'><em>Saprospira</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 776 480 862 505; x_wconf 78' lang='eng' dir='ltr'><em>grand/&#39;5</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 869 480 939 499; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 949 479 1031 499; x_wconf 88' lang='eng' dir='ltr'><em>23119T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1041 480 1151 504; x_wconf 88' lang='eng' dir='ltr'>(M58795)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 84 511 1172 536; baseline 0 -5"><span class='ocrx_word' id='word_1_92' title='bbox 84 513 177 515; x_wconf 89' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_93' title='bbox 539 512 766 531; x_wconf 83' lang='eng' dir='ltr'><em>Haliscomenobacter</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 772 512 785 531; x_wconf 92' lang='eng' dir='ltr'><em>h</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 786 512 883 536; x_wconf 82' lang='eng' dir='ltr'><em>ydrossis</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 890 512 961 531; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 970 511 1053 531; x_wconf 90' lang='eng' dir='ltr'><em>27775T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1062 512 1172 536; x_wconf 85' lang='eng' dir='ltr'>(M58790)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 582 543 1299 600">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 582 543 1299 600">
+     <span class='ocr_line' id='line_1_27' title="bbox 744 543 1299 568; baseline 0 -5"><span class='ocrx_word' id='word_1_99' title='bbox 744 544 852 563; x_wconf 87' lang='eng' dir='ltr'><em>Lewine/Ia</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 861 544 983 563; x_wconf 81' lang='eng' dir='ltr'><em>cohaerens</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 991 544 1061 563; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 1071 543 1153 563; x_wconf 67' lang='eng' dir='ltr'><em>23123T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 1163 544 1299 568; x_wconf 87' lang='eng' dir='ltr'>(AF039292)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 582 575 1106 600; baseline 0 -5"><span class='ocrx_word' id='word_1_104' title='bbox 582 576 712 595; x_wconf 80' lang='eng' dir='ltr'><em>Flexibacter</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 718 576 817 595; x_wconf 86' lang='eng' dir='ltr'><em>roseo/us</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 826 576 867 595; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 878 575 959 595; x_wconf 85' lang='eng' dir='ltr'><em>16707T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 968 576 1106 600; x_wconf 82' lang='eng' dir='ltr'><em>(ABO78063)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 101 585 1186 664">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 101 607 1186 664">
+     <span class='ocr_line' id='line_1_29' title="bbox 101 607 1087 650; baseline 0 0"><span class='ocrx_word' id='word_1_109' title='bbox 101 608 800 650; x_wconf 53' lang='eng' dir='ltr'><em>—¢:W&#39;°’e””ber</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 807 608 847 627; x_wconf 68' lang='eng' dir='ltr'><em>&#39;FO</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 859 607 939 627; x_wconf 57' lang='eng' dir='ltr'><em>166W</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 949 608 1087 632; x_wconf 57' lang='eng'><em>(“3078065)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 689 639 1186 664; baseline 0 -5"><span class='ocrx_word' id='word_1_113' title='bbox 689 640 819 659; x_wconf 78' lang='eng' dir='ltr'><em>Flexibacter</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 826 640 896 659; x_wconf 84' lang='eng' dir='ltr'><em>erXi/is</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 906 640 946 659; x_wconf 90' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 958 639 1038 659; x_wconf 72' lang='eng' dir='ltr'><em>15060T</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1048 640 1186 664; x_wconf 87' lang='eng' dir='ltr'>(ABO78050)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 535 362 537 420">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 535 362 537 420">
+     <span class='ocr_line' id='line_1_31' title="bbox 535 362 537 420; baseline 0 277"><span class='ocrx_word' id='word_1_118' title='bbox 535 362 537 420; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 181 490 183 537">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 181 490 183 537">
+     <span class='ocr_line' id='line_1_32' title="bbox 181 490 183 537; baseline 0 160"><span class='ocrx_word' id='word_1_119' title='bbox 181 490 183 537; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 99 585 101 634">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 99 585 101 634">
+     <span class='ocr_line' id='line_1_33' title="bbox 99 585 101 634; baseline 0 63"><span class='ocrx_word' id='word_1_120' title='bbox 99 585 101 634; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 1 680 554 682">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 1 680 554 682">
+     <span class='ocr_line' id='line_1_34' title="bbox 1 680 554 682; baseline 0 15"><span class='ocrx_word' id='word_1_121' title='bbox 1 680 554 682; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 562 671 1130 696">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 562 671 1130 696">
+     <span class='ocr_line' id='line_1_35' title="bbox 562 671 1130 696; baseline 0 -5"><span class='ocrx_word' id='word_1_122' title='bbox 562 672 740 691; x_wconf 70' lang='eng' dir='ltr'><em>Flavobacterium</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 749 672 840 696; x_wconf 81' lang='eng' dir='ltr'><em>aquatile</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 848 672 918 691; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 930 671 1010 691; x_wconf 74' lang='eng' dir='ltr'><em>11947T</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 1020 672 1130 696; x_wconf 88' lang='eng' dir='ltr'>(M62797)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002626-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002626-0-000.pbm.png
new file mode 100644
index 00000000..cc9ce677
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002626-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002626-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002626-0-000.pbm.png.hocr
new file mode 100644
index 00000000..2995b7c7
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002626-0-000.pbm.png.hocr
@@ -0,0 +1,114 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002626-0-000.pbm.png"; bbox 0 0 1562 1216; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 554 0 1246 29">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 554 0 1246 29">
+     <span class='ocr_line' id='line_1_1' title="bbox 554 0 1246 29; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 554 1 580 20; x_wconf 78' lang='eng'><em>64</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 841 3 863 23; x_wconf 89' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 873 3 962 29; x_wconf 84' lang='eng' dir='ltr'><em>pal/ens</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 970 3 1026 23; x_wconf 91' lang='eng' dir='ltr'><em>AHN</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 1039 0 1125 23; x_wconf 78' lang='eng' dir='ltr'><em>10371T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1135 3 1246 29; x_wconf 83' lang='eng' dir='ltr'><em>(Y13105)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 42 31 1346 125">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 42 31 1346 125">
+     <span class='ocr_line' id='line_1_2' title="bbox 98 31 1346 69; baseline 0.002 -16"><span class='ocrx_word' id='word_1_7' title='bbox 98 51 109 69; x_wconf 74' lang='eng'>0</span> <span class='ocrx_word' id='word_1_8' title='bbox 119 51 144 69; x_wconf 76' lang='eng'><em>02</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 525 31 551 49; x_wconf 83' lang='eng'><em>94</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 843 34 865 54; x_wconf 92' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 877 34 1011 60; x_wconf 87' lang='eng' dir='ltr'><em>nigrescens</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1019 34 1093 55; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1104 31 1192 55; x_wconf 84' lang='eng' dir='ltr'><em>33563T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 1202 34 1346 60; x_wconf 82' lang='eng' dir='ltr'><em>(AF414833)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 42 62 1270 92; baseline 0.002 -9"><span class='ocrx_word' id='word_1_15' title='bbox 42 67 201 88; x_wconf 64' lang='eng'><em>|&#39;—[</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 466 74 491 92; x_wconf 72' lang='eng'><em>69</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 773 65 794 85; x_wconf 88' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 806 65 935 86; x_wconf 85' lang='eng' dir='ltr'><em>intermedia</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 944 65 1018 86; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1028 62 1116 86; x_wconf 79' lang='eng' dir='ltr'>25611T</span> <span class='ocrx_word' id='word_1_21' title='bbox 1127 65 1270 91; x_wconf 82' lang='eng' dir='ltr'><em>(AF414821)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 102 94 1277 125; baseline -0.003 -5"><span class='ocrx_word' id='word_1_22' title='bbox 102 96 141 120; x_wconf 77' lang='eng' dir='ltr'><em>Knuc</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 410 106 435 125; x_wconf 75' lang='eng'><em>34</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 593 94 631 113; x_wconf 70' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 893 97 916 117; x_wconf 90' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 927 96 1023 117; x_wconf 87' lang='eng' dir='ltr'><em>falsenii</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1031 94 1119 117; x_wconf 78' lang='eng' dir='ltr'><em>04052T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1128 97 1277 122; x_wconf 87' lang='eng' dir='ltr'><em>(AB429504)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 528 125 1281 341">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 528 125 1281 341">
+     <span class='ocr_line' id='line_1_5' title="bbox 823 125 1241 153; baseline 0 -5"><span class='ocrx_word' id='word_1_29' title='bbox 823 128 845 148; x_wconf 97' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 857 128 943 148; x_wconf 88' lang='eng' dir='ltr'><em>disiens</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 950 127 1025 148; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1035 125 1123 148; x_wconf 76' lang='eng' dir='ltr'><em>29426T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 1133 128 1241 153; x_wconf 88' lang='eng' dir='ltr'><em>(L16483)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 793 156 1223 185; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 793 159 815 179; x_wconf 80' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 827 159 925 185; x_wconf 80' lang='eng' dir='ltr'><em>corporis</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 933 158 1007 179; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1017 156 1105 179; x_wconf 81' lang='eng' dir='ltr'><em>33547T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1115 159 1223 185; x_wconf 86' lang='eng' dir='ltr'><em>(L16465)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 742 187 1245 216; baseline 0 -6"><span class='ocrx_word' id='word_1_39' title='bbox 742 190 764 210; x_wconf 87' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 775 190 928 216; x_wconf 87' lang='eng' dir='ltr'><em>pa/udivivens</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 937 190 991 211; x_wconf 86' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1004 187 1090 211; x_wconf 82' lang='eng' dir='ltr'><em>13650T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1100 190 1245 216; x_wconf 87' lang='eng' dir='ltr'><em>(ABO78827)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 780 219 1169 247; baseline 0.003 -6"><span class='ocrx_word' id='word_1_44' title='bbox 780 221 802 241; x_wconf 87' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 815 221 870 242; x_wconf 84' lang='eng' dir='ltr'><em>bivia</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 879 221 953 242; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 963 219 1051 242; x_wconf 76' lang='eng' dir='ltr'><em>29303T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 1061 221 1169 247; x_wconf 89' lang='eng' dir='ltr'><em>(L16475)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 528 250 1281 278; baseline -0.001 -5"><span class='ocrx_word' id='word_1_49' title='bbox 528 255 566 273; x_wconf 77' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 835 252 857 272; x_wconf 89' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_51' title='bbox 870 252 936 273; x_wconf 83' lang='eng' dir='ltr'><em>amnii</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 944 252 1023 273; x_wconf 91' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_53' title='bbox 1034 250 1121 273; x_wconf 74' lang='eng' dir='ltr'><em>53648T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 1131 252 1281 278; x_wconf 88' lang='eng' dir='ltr'><em>(AM422125)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 673 281 1105 310; baseline -0.002 -5"><span class='ocrx_word' id='word_1_55' title='bbox 673 284 695 304; x_wconf 89' lang='eng' dir='ltr'>P.</span> <span class='ocrx_word' id='word_1_56' title='bbox 708 284 807 305; x_wconf 89' lang='eng' dir='ltr'><em>oulorum</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 815 283 889 305; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 899 281 987 305; x_wconf 81' lang='eng' dir='ltr'><em>43324T</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 997 284 1105 310; x_wconf 87' lang='eng' dir='ltr'><em>(L16472)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 719 313 1156 341; baseline 0.002 -6"><span class='ocrx_word' id='word_1_60' title='bbox 719 315 741 335; x_wconf 89' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 753 315 838 336; x_wconf 89' lang='eng' dir='ltr'><em>salivae</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 847 315 901 336; x_wconf 84' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 915 313 1000 336; x_wconf 84' lang='eng' dir='ltr'><em>12084T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1010 315 1156 341; x_wconf 85' lang='eng' dir='ltr'><em>(AB108826)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 444 344 1300 466">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 444 344 1300 466">
+     <span class='ocr_line' id='line_1_12' title="bbox 444 344 1116 376; baseline 0 -10"><span class='ocrx_word' id='word_1_65' title='bbox 444 358 470 376; x_wconf 70' lang='eng'>96</span> <span class='ocrx_word' id='word_1_66' title='bbox 739 346 762 366; x_wconf 90' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 774 346 818 367; x_wconf 88' lang='eng' dir='ltr'><em>on&#39;s</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 826 346 900 367; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 911 344 998 367; x_wconf 77' lang='eng' dir='ltr'><em>33573T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1008 346 1116 372; x_wconf 87' lang='eng' dir='ltr'><em>(L16474)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 493 375 1211 403; baseline 0.003 -7"><span class='ocrx_word' id='word_1_71' title='bbox 493 377 518 396; x_wconf 85' lang='eng'><em>58</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 798 378 820 398; x_wconf 91' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 832 378 949 398; x_wconf 84' lang='eng' dir='ltr'><em>macu/osa</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 959 375 1057 398; x_wconf 82' lang='eng' dir='ltr'><em>W1609T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 1068 378 1211 403; x_wconf 84' lang='eng' dir='ltr'><em>(EF534314)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 728 406 1164 434; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 728 409 749 429; x_wconf 74' lang='eng' dir='ltr'><em>F’.</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 763 409 866 429; x_wconf 82' lang='eng' dir='ltr'><em>veroralis</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 874 408 948 429; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 959 406 1046 429; x_wconf 78' lang='eng' dir='ltr'><em>33779T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1057 409 1164 434; x_wconf 82' lang='eng' dir='ltr'><em>(L16473)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 502 437 1300 466; baseline 0.001 -6"><span class='ocrx_word' id='word_1_81' title='bbox 502 437 540 456; x_wconf 77' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 736 440 758 460; x_wconf 95' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 770 440 963 466; x_wconf 79' lang='eng' dir='ltr'><em>melaninogenica</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 973 440 1047 461; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1057 438 1145 461; x_wconf 85' lang='eng' dir='ltr'><em>25845T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1155 440 1300 466; x_wconf 86' lang='eng' dir='ltr'><em>(AY323525)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 292 469 1562 1216">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 292 469 1562 1216">
+     <span class='ocr_line' id='line_1_16' title="bbox 698 469 1108 497; baseline 0.002 -6"><span class='ocrx_word' id='word_1_87' title='bbox 698 471 720 491; x_wconf 92' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 732 471 792 497; x_wconf 91' lang='eng' dir='ltr'><em>copn&#39;</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 800 471 854 492; x_wconf 83' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 867 469 953 492; x_wconf 79' lang='eng' dir='ltr'><em>13464T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 963 471 1108 497; x_wconf 86' lang='eng' dir='ltr'><em>(AB064923)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 772 500 1224 528; baseline 0 -5"><span class='ocrx_word' id='word_1_92' title='bbox 772 502 794 523; x_wconf 90' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 807 502 908 523; x_wconf 82' lang='eng' dir='ltr'><em>albensis</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 918 502 975 523; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 988 500 1074 523; x_wconf 83' lang='eng' dir='ltr'><em>11370T</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 1084 502 1224 528; x_wconf 87' lang='eng' dir='ltr'><em>(AJ011683)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 981 531 1562 559; baseline 0 -5"><span class='ocrx_word' id='word_1_97' title='bbox 981 534 1003 554; x_wconf 91' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1015 534 1244 554; x_wconf 80' lang='eng' dir='ltr'><em>multisaccharivorax</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1253 533 1308 554; x_wconf 87' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 1321 531 1407 554; x_wconf 79' lang='eng' dir='ltr'><em>12954T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 1417 534 1562 559; x_wconf 76' lang='eng' dir='ltr'><em>(ABZOO414)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 869 562 1270 591; baseline 0 -6"><span class='ocrx_word' id='word_1_102' title='bbox 869 565 891 585; x_wconf 95' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 903 565 998 585; x_wconf 80' lang='eng' dir='ltr'><em>denta/is</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 1008 565 1066 585; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1077 562 1149 585; x_wconf 76' lang='eng' dir='ltr'><em>3688T</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 1159 565 1270 591; x_wconf 86' lang='eng' dir='ltr'><em>(X81876)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 895 593 1348 622; baseline 0 -5"><span class='ocrx_word' id='word_1_107' title='bbox 895 596 917 617; x_wconf 66' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 930 596 1049 622; x_wconf 82' lang='eng' dir='ltr'><em>bergensis</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 1058 593 1192 617; x_wconf 76' lang='eng' dir='ltr'><em>94087913T</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 1202 596 1348 622; x_wconf 83' lang='eng' dir='ltr'><em>(AY350613)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 593 625 1319 653; baseline 0.006 -9"><span class='ocrx_word' id='word_1_111' title='bbox 593 626 631 644; x_wconf 89' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 836 627 858 647; x_wconf 91' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 870 627 1004 648; x_wconf 85' lang='eng' dir='ltr'><em>multiformis</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1013 627 1067 648; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1080 625 1319 653; x_wconf 74' lang='eng' dir='ltr'><em>12541T(AB182483)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 801 656 1281 685; baseline 0 -6"><span class='ocrx_word' id='word_1_116' title='bbox 801 659 823 679; x_wconf 94' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 836 659 944 679; x_wconf 84' lang='eng' dir='ltr'><em>denticola</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 954 659 1028 679; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 1038 656 1126 679; x_wconf 81' lang='eng' dir='ltr'><em>35308T</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 1136 659 1281 685; x_wconf 86' lang='eng' dir='ltr'><em>(AY323524)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 900 687 1322 716; baseline 0 -6"><span class='ocrx_word' id='word_1_121' title='bbox 900 690 922 710; x_wconf 93' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 935 690 1023 710; x_wconf 82' lang='eng' dir='ltr'><em>buccae</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 1031 689 1105 710; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 1116 687 1204 710; x_wconf 79' lang='eng' dir='ltr'><em>33574T</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 1214 690 1322 716; x_wconf 88' lang='eng' dir='ltr'><em>(L16477)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 440 718 1276 747; baseline 0.001 -6"><span class='ocrx_word' id='word_1_126' title='bbox 440 723 465 741; x_wconf 93' lang='eng'><strong>77</strong></span> <span class='ocrx_word' id='word_1_127' title='bbox 888 721 910 741; x_wconf 93' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 922 721 1029 742; x_wconf 87' lang='eng' dir='ltr'><em>baroniae</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 1039 718 1121 742; x_wconf 77' lang='eng' dir='ltr'><em>E9.33T</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 1131 721 1276 747; x_wconf 86' lang='eng' dir='ltr'><em>(AY840553)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 860 750 1327 778; baseline -0.002 -5"><span class='ocrx_word' id='word_1_131' title='bbox 860 752 882 772; x_wconf 95' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 894 753 1008 773; x_wconf 78' lang='eng' dir='ltr'><em>stercorea</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 1018 752 1072 773; x_wconf 92' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 1086 750 1171 773; x_wconf 81' lang='eng' dir='ltr'><em>13469T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 1181 752 1327 778; x_wconf 80' lang='eng' dir='ltr'><em>(ABZ44774)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 740 783 1303 809; baseline 0 -5"><span class='ocrx_word' id='word_1_136' title='bbox 740 784 769 804; x_wconf 79' lang='eng' dir='ltr'>‘P.</span> <span class='ocrx_word' id='word_1_137' title='bbox 781 784 934 804; x_wconf 77' lang='eng' dir='ltr'><em>massiliensis’</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 946 783 1047 804; x_wconf 86' lang='eng' dir='ltr'><em>Smarlab</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 1059 784 1148 804; x_wconf 87' lang='eng'>121567</span> <span class='ocrx_word' id='word_1_140' title='bbox 1159 784 1303 809; x_wconf 87' lang='eng' dir='ltr'><em>(AF487886)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 422 812 1277 845; baseline 0 -10"><span class='ocrx_word' id='word_1_141' title='bbox 422 826 448 845; x_wconf 73' lang='eng'>63</span> <span class='ocrx_word' id='word_1_142' title='bbox 879 814 901 835; x_wconf 92' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 914 814 979 835; x_wconf 76' lang='eng' dir='ltr'><em>oral/‘3</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 987 814 1061 835; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_145' title='bbox 1072 812 1160 835; x_wconf 78' lang='eng' dir='ltr'><em>33269T</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 1170 814 1277 840; x_wconf 87' lang='eng' dir='ltr'><em>(L16480)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 919 844 1362 872; baseline 0 -6"><span class='ocrx_word' id='word_1_147' title='bbox 919 846 941 866; x_wconf 92' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 953 846 1043 867; x_wconf 89' lang='eng' dir='ltr'><em>marshii</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 1052 846 1109 867; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 1122 844 1208 867; x_wconf 81' lang='eng' dir='ltr'><em>16973T</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 1218 846 1362 872; x_wconf 87' lang='eng' dir='ltr'><em>(AF481227)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 473 874 1262 905; baseline 0.003 -9"><span class='ocrx_word' id='word_1_152' title='bbox 473 886 496 905; x_wconf 73' lang='eng'>61</span> <span class='ocrx_word' id='word_1_153' title='bbox 840 877 861 897; x_wconf 93' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 873 877 946 898; x_wconf 82' lang='eng' dir='ltr'><em>shahii</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 954 877 1008 898; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 1021 874 1107 898; x_wconf 88' lang='eng' dir='ltr'><em>12083T</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 1117 877 1262 903; x_wconf 88' lang='eng' dir='ltr'><em>(AB108825)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 600 906 1242 934; baseline 0.002 -6"><span class='ocrx_word' id='word_1_158' title='bbox 600 910 638 928; x_wconf 88' lang='eng'>100</span> <span class='ocrx_word' id='word_1_159' title='bbox 802 908 824 929; x_wconf 96' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 836 908 945 929; x_wconf 79' lang='eng' dir='ltr'><em>Ioescheii</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 952 908 1026 929; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 1038 906 1124 929; x_wconf 76' lang='eng' dir='ltr'><em>15930T</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 1134 908 1242 934; x_wconf 87' lang='eng' dir='ltr'><em>(L16481)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 922 937 1389 966; baseline 0.002 -6"><span class='ocrx_word' id='word_1_164' title='bbox 922 940 943 960; x_wconf 93' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 954 940 1073 966; x_wconf 78' lang='eng' dir='ltr'><em>pleuritidis</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 1082 940 1136 961; x_wconf 92' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 1148 937 1235 961; x_wconf 92' lang='eng' dir='ltr'><em>14110T</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 1245 940 1389 966; x_wconf 82' lang='eng' dir='ltr'><em>(A8278593)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 514 968 1341 997; baseline 0.001 -7"><span class='ocrx_word' id='word_1_169' title='bbox 514 972 552 990; x_wconf 89' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 885 971 907 991; x_wconf 94' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 919 976 1008 991; x_wconf 85' lang='eng' dir='ltr'><em>enoeca</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 1018 971 1092 991; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 1103 968 1190 991; x_wconf 74' lang='eng' dir='ltr'><em>51261T</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 1200 971 1341 997; x_wconf 84' lang='eng' dir='ltr'><em>(AJ005635)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 895 1000 1387 1028; baseline 0.002 -6"><span class='ocrx_word' id='word_1_175' title='bbox 895 1002 916 1022; x_wconf 91' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 928 1002 1075 1023; x_wconf 86' lang='eng' dir='ltr'><em>nanceiensis</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 1083 1002 1127 1022; x_wconf 92' lang='eng' dir='ltr'><em>AIP</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 1137 1002 1177 1023; x_wconf 86' lang='eng'><em>261</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 1185 1000 1232 1023; x_wconf 88' lang='eng' dir='ltr'><em>.03T</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 1242 1002 1387 1028; x_wconf 83' lang='eng' dir='ltr'><em>(AY957555)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 867 1031 1321 1059; baseline 0 -5"><span class='ocrx_word' id='word_1_181' title='bbox 867 1033 889 1054; x_wconf 93' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 902 1033 1034 1054; x_wconf 88' lang='eng' dir='ltr'><em>timonensis</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 1042 1031 1162 1054; x_wconf 91' lang='eng' dir='ltr'><em>4401737T</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 1172 1033 1321 1059; x_wconf 80' lang='eng' dir='ltr'><em>(DQS18919)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 555 1062 1255 1090; baseline 0.001 -6"><span class='ocrx_word' id='word_1_185' title='bbox 555 1066 593 1084; x_wconf 92' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 823 1065 845 1085; x_wconf 93' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 857 1065 957 1085; x_wconf 81' lang='eng' dir='ltr'><em>buccalis</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 965 1064 1039 1085; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 1050 1062 1137 1085; x_wconf 80' lang='eng' dir='ltr'><em>3531GT</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 1147 1065 1255 1090; x_wconf 85' lang='eng' dir='ltr'><em>(L16476)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 796 1093 1254 1121; baseline 0 -5"><span class='ocrx_word' id='word_1_191' title='bbox 796 1096 818 1116; x_wconf 80' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 830 1096 955 1116; x_wconf 84' lang='eng' dir='ltr'><em>ruminico/a</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 964 1095 1038 1116; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 1051 1093 1136 1116; x_wconf 82' lang='eng' dir='ltr'><em>19189T</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 1146 1096 1254 1121; x_wconf 90' lang='eng' dir='ltr'><em>(L16482)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 292 1125 1214 1153; baseline 0.002 -7"><span class='ocrx_word' id='word_1_196' title='bbox 292 1128 330 1146; x_wconf 90' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 775 1127 797 1147; x_wconf 92' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 810 1127 883 1148; x_wconf 86' lang='eng' dir='ltr'><em>brevis</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 891 1127 965 1148; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 978 1125 1064 1148; x_wconf 75' lang='eng' dir='ltr'><em>19188T</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 1074 1127 1214 1153; x_wconf 83' lang='eng' dir='ltr'><em>(AJ011682)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 718 1156 1157 1184; baseline 0.002 -6"><span class='ocrx_word' id='word_1_202' title='bbox 718 1158 740 1178; x_wconf 92' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_203' title='bbox 752 1158 841 1184; x_wconf 81' lang='eng' dir='ltr'><em>bryantii</em></span> <span class='ocrx_word' id='word_1_204' title='bbox 851 1158 908 1179; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_205' title='bbox 921 1156 1007 1179; x_wconf 89' lang='eng' dir='ltr'><em>11371T</em></span> <span class='ocrx_word' id='word_1_206' title='bbox 1017 1158 1157 1184; x_wconf 87' lang='eng' dir='ltr'><em>(AJ006457)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 821 1186 1294 1216; baseline 0 -6"><span class='ocrx_word' id='word_1_207' title='bbox 821 1189 842 1210; x_wconf 75' lang='eng' dir='ltr'><em>P.</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 855 1190 963 1210; x_wconf 80' lang='eng' dir='ltr'><em>tannerae</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 972 1189 1046 1210; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 1056 1186 1144 1210; x_wconf 81' lang='eng' dir='ltr'><em>51259T</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 1154 1189 1294 1216; x_wconf 86' lang='eng' dir='ltr'><em>(AJ005634)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002642-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002642-0-000.pbm.png
new file mode 100644
index 00000000..0accb6be
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002642-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002642-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002642-0-000.pbm.png.hocr
new file mode 100644
index 00000000..f2e95e83
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002642-0-000.pbm.png.hocr
@@ -0,0 +1,358 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002642-0-000.pbm.png"; bbox 0 0 994 1508; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 20 4 56 22">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 20 4 56 22">
+     <span class='ocr_line' id='line_1_1' title="bbox 20 4 56 22; baseline 0.028 -1"><span class='ocrx_word' id='word_1_1' title='bbox 20 4 56 22; x_wconf 90' lang='eng'>1%</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 1 29 64 31">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 1 29 64 31">
+     <span class='ocr_line' id='line_1_2' title="bbox 1 29 64 31; baseline 0 1477"><span class='ocrx_word' id='word_1_2' title='bbox 1 29 64 31; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 216 50 896 76">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 216 50 896 76">
+     <span class='ocr_line' id='line_1_3' title="bbox 216 50 896 76; baseline 0 -5"><span class='ocrx_word' id='word_1_3' title='bbox 216 50 410 76; x_wconf 77' lang='eng' dir='ltr'><em>Pseudoruegeria</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 420 50 539 76; x_wconf 83' lang='eng' dir='ltr'><em>aqu/maris</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 563 50 636 71; x_wconf 86' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 647 50 731 71; x_wconf 88' lang='eng' dir='ltr'><em>12737T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 745 50 896 76; x_wconf 87' lang='eng' dir='ltr'><em>(DQ675021)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 91 122 180 124">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 91 122 180 124">
+     <span class='ocr_line' id='line_1_4' title="bbox 91 122 180 124; baseline 0 1384"><span class='ocrx_word' id='word_1_8' title='bbox 91 122 180 124; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 63 112 683 138">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 63 112 683 138">
+     <span class='ocr_line' id='line_1_5' title="bbox 63 112 683 138; baseline 0 -5"><span class='ocrx_word' id='word_1_9' title='bbox 63 127 67 138; x_wconf 37' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 186 113 296 138; x_wconf 85' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 305 113 420 138; x_wconf 83' lang='eng' dir='ltr'><em>pomeroyi</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 442 112 531 133; x_wconf 78' lang='eng' dir='ltr'><em>DSS-3T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 539 112 683 138; x_wconf 85' lang='eng' dir='ltr'><em>(AF098491)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 69 60 71 182">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 69 60 71 182">
+     <span class='ocr_line' id='line_1_6' title="bbox 69 60 71 182; baseline 0 1326"><span class='ocrx_word' id='word_1_14' title='bbox 69 60 71 182; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 69 180 91 182">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 69 180 91 182">
+     <span class='ocr_line' id='line_1_7' title="bbox 69 180 91 182; baseline 0 1326"><span class='ocrx_word' id='word_1_15' title='bbox 69 180 91 182; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 67 173 779 206">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 67 173 779 206">
+     <span class='ocr_line' id='line_1_8' title="bbox 67 173 779 206; baseline 0 -12"><span class='ocrx_word' id='word_1_16' title='bbox 67 194 83 206; x_wconf 64' lang='eng'>76</span> <span class='ocrx_word' id='word_1_17' title='bbox 196 175 307 200; x_wconf 85' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 316 175 521 194; x_wconf 84' lang='eng' dir='ltr'><em>Iacuscaeru/ensis</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 545 173 656 195; x_wconf 88' lang='eng' dir='ltr'><em>lTl-1157T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 665 174 779 200; x_wconf 87' lang='eng' dir='ltr'><em>(U77644)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 89 122 91 238">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 89 122 91 238">
+     <span class='ocr_line' id='line_1_9' title="bbox 89 122 91 238; baseline 0 1270"><span class='ocrx_word' id='word_1_21' title='bbox 89 122 91 238; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 127 246 200 248">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 127 246 200 248">
+     <span class='ocr_line' id='line_1_10' title="bbox 127 246 200 248; baseline 0 1260"><span class='ocrx_word' id='word_1_22' title='bbox 127 246 200 248; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 205 235 716 262">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 205 235 716 262">
+     <span class='ocr_line' id='line_1_11' title="bbox 205 235 716 262; baseline 0 -5"><span class='ocrx_word' id='word_1_23' title='bbox 205 237 316 262; x_wconf 85' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 325 237 427 257; x_wconf 85' lang='eng' dir='ltr'><em>atlantica</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 449 237 494 256; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 507 235 591 257; x_wconf 80' lang='eng' dir='ltr'><em>14463T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 602 236 716 262; x_wconf 85' lang='eng' dir='ltr'>(D88526)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 82 253 90 264">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 82 253 90 264">
+     <span class='ocr_line' id='line_1_12' title="bbox 82 253 90 264; baseline 0 0"><span class='ocrx_word' id='word_1_28' title='bbox 82 253 90 264; x_wconf 88' lang='eng'><strong>6</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 125 246 127 341">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 125 246 127 341">
+     <span class='ocr_line' id='line_1_13' title="bbox 125 246 127 341; baseline 0 -77"><span class='ocrx_word' id='word_1_29' title='bbox 125 246 127 341; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 91 253 758 386">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 91 253 758 386">
+     <span class='ocr_line' id='line_1_14' title="bbox 91 253 99 264; baseline 0 0"><span class='ocrx_word' id='word_1_30' title='bbox 91 253 99 264; x_wconf 85' lang='eng'><em>7</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 103 297 758 324; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 103 304 119 315; x_wconf 72' lang='eng'><em>59</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 222 298 333 324; x_wconf 75' lang='eng' dir='ltr'><em>Ruegerl’a</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 341 298 430 324; x_wconf 83' lang='eng' dir='ltr'><em>pelagia</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 451 297 597 319; x_wconf 80' lang='eng' dir='ltr'><em>HTCCZ663T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 607 298 758 324; x_wconf 71' lang='eng' dir='ltr'><em>(DQ916141)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 183 350 758 386; baseline 0 -5"><span class='ocrx_word' id='word_1_36' title='bbox 183 350 207 362; x_wconf 82' lang='eng'><em>‘°°</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 218 361 329 386; x_wconf 85' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 338 361 424 381; x_wconf 83' lang='eng' dir='ltr'><em>mob/[is</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 446 360 490 381; x_wconf 90' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 502 360 602 381; x_wconf 61' lang='eng' dir='ltr'>109181T</span> <span class='ocrx_word' id='word_1_41' title='bbox 612 360 758 386; x_wconf 79' lang='eng' dir='ltr'><em>(A8255401)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 23 407 47 419">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 23 407 47 419">
+     <span class='ocr_line' id='line_1_17' title="bbox 23 407 47 419; baseline 0 0"><span class='ocrx_word' id='word_1_42' title='bbox 23 407 47 419; x_wconf 82' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 216 422 776 449">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 216 422 776 449">
+     <span class='ocr_line' id='line_1_18' title="bbox 216 422 776 449; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 216 423 376 443; x_wconf 85' lang='eng' dir='ltr'><em>Tha/assobius</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 385 423 490 443; x_wconf 78' lang='eng' dir='ltr'><em>aestuarii</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 505 422 611 443; x_wconf 48' lang='eng' dir='ltr'><em>‘102049T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 630 422 776 449; x_wconf 90' lang='eng' dir='ltr'><em>(AY442178)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 88 484 883 511">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 88 484 883 511">
+     <span class='ocr_line' id='line_1_19' title="bbox 88 484 883 511; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 88 490 104 501; x_wconf 84' lang='eng'><em>77</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 126 494 207 496; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_49' title='bbox 214 485 375 505; x_wconf 80' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 384 485 560 505; x_wconf 81' lang='eng' dir='ltr'><em>mediterraneus</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 578 484 652 505; x_wconf 91' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 662 484 732 505; x_wconf 74' lang='eng' dir='ltr'><em>5383T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 742 484 883 511; x_wconf 87' lang='eng' dir='ltr'><em>(AJ878874)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 124 494 126 558">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 124 494 126 558">
+     <span class='ocr_line' id='line_1_20' title="bbox 124 494 126 558; baseline 0 950"><span class='ocrx_word' id='word_1_54' title='bbox 124 494 126 558; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 126 546 831 573">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 126 546 831 573">
+     <span class='ocr_line' id='line_1_21' title="bbox 126 546 831 573; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 126 556 190 558; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_56' title='bbox 197 547 358 567; x_wconf 82' lang='eng' dir='ltr'><em>Thalossobius</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 366 547 546 573; x_wconf 82' lang='eng' dir='ltr'><em>gelatinovorans</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 566 547 612 567; x_wconf 89' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 624 546 708 567; x_wconf 78' lang='eng' dir='ltr'><em>12617T</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 718 546 831 573; x_wconf 84' lang='eng' dir='ltr'><em>(D88523)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 284 618 351 621">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 284 618 351 621">
+     <span class='ocr_line' id='line_1_22' title="bbox 284 618 351 621; baseline 0 887"><span class='ocrx_word' id='word_1_61' title='bbox 284 618 351 621; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 357 608 928 635">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 357 608 928 635">
+     <span class='ocr_line' id='line_1_23' title="bbox 357 608 928 635; baseline 0 -6"><span class='ocrx_word' id='word_1_62' title='bbox 357 609 515 629; x_wconf 83' lang='eng' dir='ltr'><em>Roseobacter</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 522 609 669 629; x_wconf 85' lang='eng' dir='ltr'><em>denitriﬁcans</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 687 609 735 629; x_wconf 90' lang='eng' dir='ltr'><em>Och</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 747 608 800 629; x_wconf 81' lang='eng' dir='ltr'><em>114T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 811 609 928 635; x_wconf 85' lang='eng' dir='ltr'><em>(M96746)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 196 650 283 651">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 196 650 283 651">
+     <span class='ocr_line' id='line_1_24' title="bbox 196 650 283 651; baseline 0 857"><span class='ocrx_word' id='word_1_67' title='bbox 196 650 283 651; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 256 656 281 667">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 256 656 281 667">
+     <span class='ocr_line' id='line_1_25' title="bbox 256 656 281 667; baseline 0 0"><span class='ocrx_word' id='word_1_68' title='bbox 256 656 281 667; x_wconf 68' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 57 670 887 699">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 57 670 887 699">
+     <span class='ocr_line' id='line_1_26' title="bbox 57 670 887 699; baseline 0 -8"><span class='ocrx_word' id='word_1_69' title='bbox 57 688 73 699; x_wconf 57' lang='eng'><em>63</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 284 680 320 683; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_71' title='bbox 325 671 484 691; x_wconf 78' lang='eng' dir='ltr'><em>Roseobacter</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 490 671 576 691; x_wconf 84' lang='eng' dir='ltr'><em>litoralis</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 594 671 668 691; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 677 670 766 691; x_wconf 81' lang='eng' dir='ltr'><em>49566T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 776 671 887 696; x_wconf 84' lang='eng' dir='ltr'><em>(X78312)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 103 719 196 721">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 103 719 196 721">
+     <span class='ocr_line' id='line_1_27' title="bbox 103 719 196 721; baseline 0 787"><span class='ocrx_word' id='word_1_76' title='bbox 103 719 196 721; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 208 732 868 759">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 208 732 868 759">
+     <span class='ocr_line' id='line_1_28' title="bbox 208 732 868 759; baseline 0 -6"><span class='ocrx_word' id='word_1_77' title='bbox 208 743 314 745; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_78' title='bbox 320 733 475 753; x_wconf 84' lang='eng' dir='ltr'><em>Sulfitobacter</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 480 733 600 758; x_wconf 79' lang='eng' dir='ltr'><em>pontiacus</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 622 733 692 753; x_wconf 92' lang='eng' dir='ltr'><em>ChLG</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 704 732 742 753; x_wconf 93' lang='eng' dir='ltr'><em>1OT</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 756 733 868 759; x_wconf 84' lang='eng' dir='ltr'><em>(Y17388)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 194 650 196 788">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 194 650 196 788">
+     <span class='ocr_line' id='line_1_29' title="bbox 194 650 196 788; baseline 0 720"><span class='ocrx_word' id='word_1_83' title='bbox 194 650 196 788; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 186 794 903 821">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 186 794 903 821">
+     <span class='ocr_line' id='line_1_30' title="bbox 186 794 903 821; baseline 0 -6"><span class='ocrx_word' id='word_1_84' title='bbox 186 795 202 807; x_wconf 68' lang='eng'><em>5&quot;</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 286 805 306 807; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_86' title='bbox 312 794 467 815; x_wconf 79' lang='eng' dir='ltr'><em>Su/ﬁtobacter</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 473 795 582 815; x_wconf 80' lang='eng' dir='ltr'><em>delicatus</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 603 795 663 815; x_wconf 93' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 675 794 745 815; x_wconf 84' lang='eng' dir='ltr'><em>3584T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 757 794 903 821; x_wconf 85' lang='eng' dir='ltr'><em>(AY180103)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 257 842 281 853">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 257 842 281 853">
+     <span class='ocr_line' id='line_1_31' title="bbox 257 842 281 853; baseline 0 0"><span class='ocrx_word' id='word_1_91' title='bbox 257 842 281 853; x_wconf 68' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 206 743 208 838">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 206 743 208 838">
+     <span class='ocr_line' id='line_1_32' title="bbox 206 743 208 838; baseline 0 670"><span class='ocrx_word' id='word_1_92' title='bbox 206 743 208 838; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 206 836 286 838">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 206 836 286 838">
+     <span class='ocr_line' id='line_1_33' title="bbox 206 836 286 838; baseline 0 670"><span class='ocrx_word' id='word_1_93' title='bbox 206 836 286 838; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 284 621 286 869">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 284 621 286 869">
+     <span class='ocr_line' id='line_1_34' title="bbox 284 621 286 869; baseline 0 639"><span class='ocrx_word' id='word_1_94' title='bbox 284 621 286 869; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 297 856 854 883">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 297 856 854 883">
+     <span class='ocr_line' id='line_1_35' title="bbox 297 856 854 883; baseline 0 -6"><span class='ocrx_word' id='word_1_95' title='bbox 297 857 452 877; x_wconf 82' lang='eng' dir='ltr'><em>Su/ﬁtobacter</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 458 857 539 877; x_wconf 89' lang='eng' dir='ltr'><em>dubius</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 553 857 614 877; x_wconf 93' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 625 856 695 877; x_wconf 78' lang='eng' dir='ltr'><em>3554T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 708 857 854 883; x_wconf 86' lang='eng' dir='ltr'><em>(AY180102)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 77 479 79 887">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 77 479 79 887">
+     <span class='ocr_line' id='line_1_36' title="bbox 77 479 79 887; baseline 0 621"><span class='ocrx_word' id='word_1_100' title='bbox 77 479 79 887; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 283 918 819 945">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 283 918 819 945">
+     <span class='ocr_line' id='line_1_37' title="bbox 283 918 819 945; baseline 0 -6"><span class='ocrx_word' id='word_1_101' title='bbox 283 919 394 945; x_wconf 80' lang='eng' dir='ltr'><em>Rueger/‘a</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 404 919 496 945; x_wconf 86' lang='eng' dir='ltr'><em>a/gico/a</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 518 919 592 939; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 602 918 690 939; x_wconf 90' lang='eng' dir='ltr'><em>51440T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 707 919 819 945; x_wconf 86' lang='eng' dir='ltr'><em>(X78315)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 306 980 838 1007">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 306 980 838 1007">
+     <span class='ocr_line' id='line_1_38' title="bbox 306 980 838 1007; baseline 0 -6"><span class='ocrx_word' id='word_1_106' title='bbox 306 981 465 1001; x_wconf 83' lang='eng' dir='ltr'><em>Phaeobacter</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 471 981 566 1001; x_wconf 79' lang='eng' dir='ltr'><em>arcticus</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 592 980 678 1001; x_wconf 74' lang='eng' dir='ltr'><em>20188T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 687 981 838 1007; x_wconf 78' lang='eng' dir='ltr'><em>(DQS14304)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 103 719 105 1053">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 103 719 105 1053">
+     <span class='ocr_line' id='line_1_39' title="bbox 103 719 105 1053; baseline 0 455"><span class='ocrx_word' id='word_1_110' title='bbox 103 719 105 1053; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 147 1037 175 1039">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 147 1037 175 1039">
+     <span class='ocr_line' id='line_1_40' title="bbox 147 1037 175 1039; baseline 0 469"><span class='ocrx_word' id='word_1_111' title='bbox 147 1037 175 1039; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 103 1051 226 1055">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 103 1051 226 1055">
+     <span class='ocr_line' id='line_1_41' title="bbox 103 1051 226 1055; baseline 0 453"><span class='ocrx_word' id='word_1_112' title='bbox 103 1051 226 1055; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 173 991 175 1083">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 173 991 175 1083">
+     <span class='ocr_line' id='line_1_42' title="bbox 173 991 175 1083; baseline 0 425"><span class='ocrx_word' id='word_1_113' title='bbox 173 991 175 1083; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 103 1042 784 1069">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 103 1042 784 1069">
+     <span class='ocr_line' id='line_1_43' title="bbox 103 1042 784 1069; baseline 0 -6"><span class='ocrx_word' id='word_1_114' title='bbox 103 1057 119 1069; x_wconf 58' lang='eng'><em>79</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 153 1043 169 1055; x_wconf 73' lang='eng'><em>9°</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 231 1043 555 1069; x_wconf 81' lang='eng' dir='ltr'><em>Phaeobactergallaeciensis</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 574 1042 784 1069; x_wconf 72' lang='eng' dir='ltr'><em>BS1O7T(Y13244)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 197 1053 199 1114">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 197 1053 199 1114">
+     <span class='ocr_line' id='line_1_44' title="bbox 197 1053 199 1114; baseline 0 394"><span class='ocrx_word' id='word_1_118' title='bbox 197 1053 199 1114; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 200 1104 818 1131">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 200 1104 818 1131">
+     <span class='ocr_line' id='line_1_45' title="bbox 200 1104 818 1131; baseline 0 -6"><span class='ocrx_word' id='word_1_119' title='bbox 200 1105 384 1125; x_wconf 81' lang='eng' dir='ltr'><em>—Phaeobacter</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 391 1105 493 1125; x_wconf 87' lang='eng' dir='ltr'><em>inhibens</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 511 1105 568 1126; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 578 1104 664 1126; x_wconf 74' lang='eng' dir='ltr'><em>22475T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 672 1105 818 1131; x_wconf 89' lang='eng' dir='ltr'>(AY177712)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 123 929 125 1175">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 123 929 125 1175">
+     <span class='ocr_line' id='line_1_46' title="bbox 123 929 125 1175; baseline 0 333"><span class='ocrx_word' id='word_1_124' title='bbox 123 929 125 1175; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 123 1173 257 1179">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 123 1173 257 1179">
+     <span class='ocr_line' id='line_1_47' title="bbox 123 1173 257 1179; baseline 0 329"><span class='ocrx_word' id='word_1_125' title='bbox 123 1173 257 1179; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 126 1166 854 1193">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 126 1166 854 1193">
+     <span class='ocr_line' id='line_1_48' title="bbox 126 1166 854 1193; baseline 0 -5"><span class='ocrx_word' id='word_1_126' title='bbox 126 1179 143 1191; x_wconf 61' lang='eng'><em>33</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 262 1167 420 1188; x_wconf 80' lang='eng' dir='ltr'><em>Phaeobacter</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 427 1167 583 1192; x_wconf 84' lang='eng' dir='ltr'><em>daeponensis</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 595 1166 693 1188; x_wconf 89' lang='eng' dir='ltr'><em>TF—218T</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 703 1167 854 1193; x_wconf 77' lang='eng' dir='ltr'><em>(DQQ81486)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 188 1177 190 1272">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 188 1177 190 1272">
+     <span class='ocr_line' id='line_1_49' title="bbox 188 1177 190 1272; baseline 0 236"><span class='ocrx_word' id='word_1_131' title='bbox 188 1177 190 1272; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 168 1229 879 1303">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 168 1229 879 1303">
+     <span class='ocr_line' id='line_1_50' title="bbox 168 1229 879 1303; baseline -0.001 -53"><span class='ocrx_word' id='word_1_132' title='bbox 168 1230 184 1241; x_wconf 64' lang='eng'><em>5&quot;</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 233 1229 425 1303; x_wconf 47' lang='eng' dir='ltr'><em>erhaeobacter</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 433 1229 560 1250; x_wconf 87' lang='eng' dir='ltr'><em>caeruleus</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 573 1229 631 1250; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 641 1229 717 1250; x_wconf 87' lang='eng'>24370</span> <span class='ocrx_word' id='word_1_137' title='bbox 727 1229 879 1255; x_wconf 83' lang='eng' dir='ltr'><em>(AM943631)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 206 1276 222 1287; baseline 0 0"><span class='ocrx_word' id='word_1_138' title='bbox 206 1276 222 1287; x_wconf 75' lang='eng' dir='ltr'>1D</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 147 1037 148 1311">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 147 1037 148 1311">
+     <span class='ocr_line' id='line_1_52' title="bbox 147 1037 148 1311; baseline 0 197"><span class='ocrx_word' id='word_1_139' title='bbox 147 1037 148 1311; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 223 1276 894 1317">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 223 1276 894 1317">
+     <span class='ocr_line' id='line_1_53' title="bbox 223 1276 894 1317; baseline 0 -5"><span class='ocrx_word' id='word_1_140' title='bbox 223 1276 230 1287; x_wconf 62' lang='eng' dir='ltr'>D</span> <span class='ocrx_word' id='word_1_141' title='bbox 244 1291 547 1312; x_wconf 86' lang='eng' dir='ltr'><em>Phaeobactercaeruleus</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 567 1291 625 1312; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 636 1290 722 1312; x_wconf 89' lang='eng' dir='ltr'><em>24369T</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 742 1291 894 1317; x_wconf 87' lang='eng' dir='ltr'><em>(AM943630)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 136 1315 152 1327">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 136 1315 152 1327">
+     <span class='ocr_line' id='line_1_54' title="bbox 136 1315 152 1327; baseline -0.063 0"><span class='ocrx_word' id='word_1_145' title='bbox 136 1315 152 1327; x_wconf 82' lang='eng'><em>50</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 241 1352 858 1379">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 241 1352 858 1379">
+     <span class='ocr_line' id='line_1_55' title="bbox 241 1352 858 1379; baseline 0 -6"><span class='ocrx_word' id='word_1_146' title='bbox 241 1353 367 1379; x_wconf 82' lang='eng' dir='ltr'><em>Leisingera</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 377 1353 622 1379; x_wconf 80' lang='eng' dir='ltr'><em>methylohalidivorans</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 640 1352 704 1373; x_wconf 79' lang='eng' dir='ltr'><em>MBZT</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 712 1353 858 1379; x_wconf 84' lang='eng' dir='ltr'><em>(AY005463)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 174 1400 190 1412">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 174 1400 190 1412">
+     <span class='ocr_line' id='line_1_56' title="bbox 174 1400 190 1412; baseline 0 0"><span class='ocrx_word' id='word_1_150' title='bbox 174 1400 190 1412; x_wconf 82' lang='eng'>97</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 224 1414 825 1441">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 224 1414 825 1441">
+     <span class='ocr_line' id='line_1_57' title="bbox 224 1414 825 1441; baseline 0.002 -6"><span class='ocrx_word' id='word_1_151' title='bbox 224 1416 349 1441; x_wconf 85' lang='eng' dir='ltr'><em>Leisingera</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 360 1416 495 1441; x_wconf 86' lang='eng' dir='ltr'><em>aquimarina</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 514 1415 570 1436; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 580 1414 666 1436; x_wconf 84' lang='eng' dir='ltr'><em>24366T</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 674 1415 825 1441; x_wconf 85' lang='eng' dir='ltr'><em>(AM900415)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 0 1483 502 1493">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 0 1483 502 1493">
+     <span class='ocr_line' id='line_1_58' title="bbox 0 1483 502 1493; baseline 0 15"><span class='ocrx_word' id='word_1_156' title='bbox 0 1483 502 1493; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 504 1476 992 1503">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 504 1476 992 1503">
+     <span class='ocr_line' id='line_1_59' title="bbox 504 1476 992 1503; baseline -0.002 -5"><span class='ocrx_word' id='word_1_157' title='bbox 504 1477 595 1503; x_wconf 87' lang='eng' dir='ltr'><em>Stappia</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 605 1477 713 1498; x_wconf 83' lang='eng' dir='ltr'><em>stel/u/ata</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 728 1477 772 1497; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 785 1476 869 1498; x_wconf 81' lang='eng' dir='ltr'><em>12621T</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 879 1477 992 1503; x_wconf 85' lang='eng' dir='ltr'><em>(D88525)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002683-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002683-0-000.pbm.png
new file mode 100644
index 00000000..c8cdba08
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002683-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002683-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002683-0-000.pbm.png.hocr
new file mode 100644
index 00000000..cbce7954
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002683-0-000.pbm.png.hocr
@@ -0,0 +1,157 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002683-0-000.pbm.png"; bbox 0 0 1242 2107; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 8 2 856 82">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 8 2 856 82">
+     <span class='ocr_line' id='line_1_1' title="bbox 8 2 59 27; baseline 0.02 -1"><span class='ocrx_word' id='word_1_1' title='bbox 8 2 17 26; x_wconf 95' lang='eng'>1</span> <span class='ocrx_word' id='word_1_2' title='bbox 33 2 59 27; x_wconf 91' lang='eng'><em>%</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 276 53 856 82; baseline 0 -6"><span class='ocrx_word' id='word_1_3' title='bbox 276 54 420 76; x_wconf 86' lang='eng' dir='ltr'><em>Roseivivax</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 429 54 576 76; x_wconf 88' lang='eng' dir='ltr'><em>halodurans</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 596 54 648 76; x_wconf 90' lang='eng' dir='ltr'><em>Och</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 659 53 718 76; x_wconf 81' lang='eng' dir='ltr'><em>239T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 734 54 856 82; x_wconf 86' lang='eng' dir='ltr'><em>(D85829)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 111 100 919 248">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 111 100 919 248">
+     <span class='ocr_line' id='line_1_3' title="bbox 111 100 832 137; baseline 0 -6"><span class='ocrx_word' id='word_1_8' title='bbox 111 100 144 116; x_wconf 65' lang='eng'>10°</span> <span class='ocrx_word' id='word_1_9' title='bbox 250 109 394 131; x_wconf 83' lang='eng' dir='ltr'><em>Roseivivax</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 402 109 565 131; x_wconf 82' lang='eng' dir='ltr'><em>ha/otolerans</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 583 109 634 131; x_wconf 87' lang='eng' dir='ltr'><em>Och</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 645 108 832 137; x_wconf 65' lang='eng' dir='ltr'><em>210T(D85831)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 285 164 919 193; baseline -0.002 -6"><span class='ocrx_word' id='word_1_13' title='bbox 285 164 432 187; x_wconf 76' lang='eng' dir='ltr'><em>Oceanlcola</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 442 165 568 187; x_wconf 84' lang='eng' dir='ltr'><em>batsensis</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 587 164 667 187; x_wconf 93' lang='eng' dir='ltr'><em>HTCC</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 677 164 753 187; x_wconf 81' lang='eng' dir='ltr'><em>2597T</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 762 164 919 193; x_wconf 90' lang='eng' dir='ltr'>(AY424898)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 136 211 813 248; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 136 211 158 227; x_wconf 62' lang='eng'><em>59</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 250 220 396 242; x_wconf 88' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 406 220 512 242; x_wconf 86' lang='eng' dir='ltr'><em>marinus</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 532 219 635 242; x_wconf 87' lang='eng' dir='ltr'><em>Azo-cT</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 650 220 813 248; x_wconf 79' lang='eng' dir='ltr'><em>(D0822569)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 158 273 989 746">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 158 274 989 745">
+     <span class='ocr_line' id='line_1_6' title="bbox 254 274 814 303; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 254 275 343 297; x_wconf 84' lang='eng' dir='ltr'><em>Shimia</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 353 275 443 297; x_wconf 81' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 463 275 522 297; x_wconf 85' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 536 274 626 297; x_wconf 83' lang='eng' dir='ltr'><em>13038T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 657 275 814 303; x_wconf 84' lang='eng' dir='ltr'><em>(AY962292)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 270 329 871 358; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 270 330 442 352; x_wconf 89' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 452 330 565 352; x_wconf 81' lang='eng' dir='ltr'><em>aestuarii</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 589 329 701 352; x_wconf 78' lang='eng' dir='ltr'><em>JCZO49T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 714 330 871 358; x_wconf 90' lang='eng' dir='ltr'>(AY442178)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 158 377 979 414; baseline 0 -7"><span class='ocrx_word' id='word_1_32' title='bbox 158 377 180 392; x_wconf 74' lang='eng'>93</span> <span class='ocrx_word' id='word_1_33' title='bbox 263 386 436 407; x_wconf 83' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 445 386 636 407; x_wconf 84' lang='eng' dir='ltr'><em>mediterraneus</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 649 385 728 407; x_wconf 92' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 739 384 815 407; x_wconf 80' lang='eng' dir='ltr'><em>5383T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 827 386 979 414; x_wconf 89' lang='eng' dir='ltr'>(AJ878874)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 249 438 816 466; baseline -0.007 -3"><span class='ocrx_word' id='word_1_38' title='bbox 249 441 364 463; x_wconf 87' lang='eng' dir='ltr'><em>Nautella</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 374 441 457 463; x_wconf 89' lang='eng' dir='ltr'><em>italica</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 471 440 533 463; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 544 440 637 463; x_wconf 84' lang='eng' dir='ltr'><em>24365T</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 652 438 816 466; x_wconf 88' lang='eng' dir='ltr'><em>(AM904562)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 227 484 809 532; baseline 0.002 -14"><span class='ocrx_word' id='word_1_43' title='bbox 227 484 235 532; x_wconf 0' lang='eng'><em></em></span> <span class='ocrx_word' id='word_1_44' title='bbox 249 496 364 518; x_wconf 89' lang='eng' dir='ltr'><em>Nautella</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 374 496 457 518; x_wconf 86' lang='eng' dir='ltr'><em>italica</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 471 497 533 519; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 544 497 626 519; x_wconf 88' lang='eng'><em>24364</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 645 497 809 525; x_wconf 86' lang='eng' dir='ltr'><em>(AM904563)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 213 551 757 587; baseline 0 -14"><span class='ocrx_word' id='word_1_49' title='bbox 213 571 223 587; x_wconf 67' lang='eng'><strong>9</strong></span> <span class='ocrx_word' id='word_1_50' title='bbox 249 552 364 573; x_wconf 86' lang='eng' dir='ltr'><em>Nautella</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 374 552 457 573; x_wconf 86' lang='eng' dir='ltr'><em>italica</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 471 552 582 573; x_wconf 85' lang='eng' dir='ltr'><em>R-28753</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 593 551 757 579; x_wconf 88' lang='eng' dir='ltr'><em>(AM944522)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 216 606 760 637; baseline -0.002 -8"><span class='ocrx_word' id='word_1_54' title='bbox 216 623 235 637; x_wconf 61' lang='eng' dir='ltr'><em>n.</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 249 607 364 629; x_wconf 87' lang='eng' dir='ltr'><em>Nautella</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 374 607 457 629; x_wconf 86' lang='eng' dir='ltr'><em>italica</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 473 607 585 629; x_wconf 90' lang='eng' dir='ltr'><em>R-25532</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 596 606 760 635; x_wconf 88' lang='eng' dir='ltr'>(AM944520)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 249 662 760 690; baseline -0.002 -6"><span class='ocrx_word' id='word_1_59' title='bbox 249 662 364 684; x_wconf 86' lang='eng' dir='ltr'><em>Nautella</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 374 662 457 684; x_wconf 86' lang='eng' dir='ltr'><em>italica</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 473 662 585 684; x_wconf 88' lang='eng' dir='ltr'><em>R-28717</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 596 662 760 690; x_wconf 86' lang='eng' dir='ltr'>(AM944521)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 267 716 989 745; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 267 717 476 745; x_wconf 89' lang='eng' dir='ltr'><em>Pseudoruegeria</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 487 717 615 745; x_wconf 84' lang='eng' dir='ltr'><em>aquimaris</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 635 717 713 739; x_wconf 92' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 726 716 816 739; x_wconf 84' lang='eng' dir='ltr'><em>12737T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 827 717 989 745; x_wconf 87' lang='eng' dir='ltr'><em>(DQ675021)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 213 482 223 539">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 213 482 223 539">
+     <span class='ocr_line' id='line_1_15' title="bbox 213 482 223 497; baseline 0 0"><span class='ocrx_word' id='word_1_68' title='bbox 213 482 223 497; x_wconf 83' lang='eng'>9</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 213 523 223 539; baseline 0 0"><span class='ocrx_word' id='word_1_69' title='bbox 213 523 223 539; x_wconf 84' lang='eng'>9</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 75 95 79 772">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 75 95 79 772">
+     <span class='ocr_line' id='line_1_17' title="bbox 75 95 79 772; baseline 0 -233"><span class='ocrx_word' id='word_1_70' title='bbox 75 95 79 772; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 102 770 887 967">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 102 771 887 855">
+     <span class='ocr_line' id='line_1_18' title="bbox 102 771 887 801; baseline 0 -7"><span class='ocrx_word' id='word_1_71' title='bbox 102 781 121 797; x_wconf 80' lang='eng'><em>91</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 295 772 415 800; x_wconf 86' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 424 772 519 800; x_wconf 89' lang='eng' dir='ltr'><em>pelagia</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 545 771 703 794; x_wconf 78' lang='eng' dir='ltr'><em>HT002663T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 724 772 887 801; x_wconf 85' lang='eng' dir='ltr'>(DQ916141)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 149 808 871 855; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 149 808 172 824; x_wconf 67' lang='eng'><em>50</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 249 819 282 834; x_wconf 62' lang='eng'><em>10°</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 292 828 412 855; x_wconf 88' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 422 828 514 849; x_wconf 88' lang='eng' dir='ltr'><em>mobilis</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 533 827 581 849; x_wconf 92' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 594 826 701 849; x_wconf 82' lang='eng' dir='ltr'><em>109181T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 714 827 871 855; x_wconf 79' lang='eng' dir='ltr'>(A5255401)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 178 881 884 966">
+     <span class='ocr_line' id='line_1_20' title="bbox 178 881 838 911; baseline 0 -6"><span class='ocrx_word' id='word_1_83' title='bbox 178 881 200 897; x_wconf 77' lang='eng'>99</span> <span class='ocrx_word' id='word_1_84' title='bbox 295 883 414 911; x_wconf 85' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 423 883 548 911; x_wconf 87' lang='eng' dir='ltr'><em>pomeroyi</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 567 882 664 905; x_wconf 79' lang='eng' dir='ltr'><em>DSS-3T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 682 883 838 911; x_wconf 85' lang='eng' dir='ltr'>(AF098491)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 189 937 884 966; baseline 0 -6"><span class='ocrx_word' id='word_1_88' title='bbox 189 943 212 959; x_wconf 82' lang='eng'>64</span> <span class='ocrx_word' id='word_1_89' title='bbox 334 938 453 966; x_wconf 86' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 464 938 573 960; x_wconf 81' lang='eng' dir='ltr'><em>atlantica</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 598 938 646 960; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 660 937 750 960; x_wconf 83' lang='eng' dir='ltr'><em>14463T</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 762 938 884 966; x_wconf 87' lang='eng' dir='ltr'><em>(D88526)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 157 984 1063 1961">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 176 984 1001 1132">
+     <span class='ocr_line' id='line_1_22' title="bbox 215 984 918 1021; baseline 0 -6"><span class='ocrx_word' id='word_1_94' title='bbox 215 984 237 1000; x_wconf 70' lang='eng'><em>95</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 291 993 641 1021; x_wconf 86' lang='eng' dir='ltr'><em>Ruegerialacuscaerulensis</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 664 992 783 1015; x_wconf 93' lang='eng' dir='ltr'><em>ITI—1157T</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 796 993 918 1021; x_wconf 86' lang='eng' dir='ltr'>(U77644)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 362 1048 1001 1076; baseline 0 -6"><span class='ocrx_word' id='word_1_98' title='bbox 362 1048 628 1070; x_wconf 82' lang='eng' dir='ltr'><em>Sulﬁtobacterlitoralis</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 656 1048 718 1070; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 731 1048 822 1070; x_wconf 83' lang='eng' dir='ltr'><em>17584T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 838 1048 1001 1076; x_wconf 80' lang='eng' dir='ltr'>(DQOQ7527)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 176 1103 949 1132; baseline -0.001 -6"><span class='ocrx_word' id='word_1_102' title='bbox 176 1109 198 1125; x_wconf 81' lang='eng'>99</span> <span class='ocrx_word' id='word_1_103' title='bbox 319 1104 656 1126; x_wconf 80' lang='eng' dir='ltr'><em>Roseobacterdenitriﬁcans</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 683 1103 805 1126; x_wconf 82' lang='eng' dir='ltr'><em>Och114T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 824 1104 949 1132; x_wconf 82' lang='eng' dir='ltr'>(M96746)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 206 1150 1063 1298">
+     <span class='ocr_line' id='line_1_25' title="bbox 206 1150 886 1187; baseline -0.001 -6"><span class='ocrx_word' id='word_1_106' title='bbox 206 1150 239 1166; x_wconf 63' lang='eng'><em>10&quot;</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 279 1159 549 1181; x_wconf 80' lang='eng' dir='ltr'><em>Roseobacter/itoralis</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 568 1159 648 1181; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 658 1158 752 1181; x_wconf 75' lang='eng' dir='ltr'><em>49566T</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 765 1159 886 1187; x_wconf 87' lang='eng' dir='ltr'>(X78312)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 299 1213 997 1242; baseline 0 -6"><span class='ocrx_word' id='word_1_111' title='bbox 299 1214 464 1236; x_wconf 87' lang='eng' dir='ltr'><em>Roseovarius</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 474 1215 644 1236; x_wconf 82' lang='eng' dir='ltr'><em>crassostreae</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 662 1214 724 1236; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 738 1213 828 1236; x_wconf 80' lang='eng' dir='ltr'><em>16950T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 842 1214 997 1242; x_wconf 90' lang='eng' dir='ltr'>(AF114484)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 307 1268 1063 1298; baseline 0 -6"><span class='ocrx_word' id='word_1_116' title='bbox 307 1270 510 1292; x_wconf 84' lang='eng' dir='ltr'><em>Thalassobacter</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 518 1270 711 1297; x_wconf 84' lang='eng' dir='ltr'><em>stenotrophicus</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 728 1269 807 1292; x_wconf 93' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 818 1268 893 1292; x_wconf 83' lang='eng' dir='ltr'><em>5294T</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 911 1269 1063 1298; x_wconf 83' lang='eng' dir='ltr'><em>(AJ631302)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 157 1324 1062 1960">
+     <span class='ocr_line' id='line_1_28' title="bbox 361 1324 905 1353; baseline -0.002 -6"><span class='ocrx_word' id='word_1_121' title='bbox 361 1325 682 1347; x_wconf 79' lang='eng' dir='ltr'><em>Octadecabacterarcticus</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 704 1324 764 1347; x_wconf 78' lang='eng' dir='ltr'><em>238T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 783 1325 905 1353; x_wconf 90' lang='eng' dir='ltr'>(U73725)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 357 1379 999 1408; baseline 0 -6"><span class='ocrx_word' id='word_1_124' title='bbox 357 1380 507 1402; x_wconf 86' lang='eng' dir='ltr'><em>Jannaschia</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 517 1380 686 1408; x_wconf 85' lang='eng' dir='ltr'><em>donghaensis</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 707 1379 828 1402; x_wconf 88' lang='eng' dir='ltr'><em>DSW—17T</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 843 1380 999 1408; x_wconf 87' lang='eng' dir='ltr'><em>(EF202612)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 162 1434 1012 1465; baseline -0.009 0"><span class='ocrx_word' id='word_1_128' title='bbox 162 1449 184 1465; x_wconf 81' lang='eng'><em>65</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 217 1447 250 1463; x_wconf 88' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 350 1435 499 1457; x_wconf 88' lang='eng' dir='ltr'><em>Jannaschia</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 510 1435 665 1457; x_wconf 81' lang='eng' dir='ltr'><em>seosinens/s</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 683 1435 742 1457; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 756 1434 1012 1463; x_wconf 79' lang='eng' dir='ltr'><em>13035T(AY906862)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 239 1489 988 1518; baseline 0 -6"><span class='ocrx_word' id='word_1_134' title='bbox 239 1495 261 1511; x_wconf 84' lang='eng'>59</span> <span class='ocrx_word' id='word_1_135' title='bbox 345 1491 495 1512; x_wconf 86' lang='eng' dir='ltr'><em>Jannaschia</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 505 1491 704 1518; x_wconf 88' lang='eng' dir='ltr'><em>helgolandensis</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 725 1491 766 1512; x_wconf 90' lang='eng' dir='ltr'><em>Hel</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 779 1489 819 1512; x_wconf 84' lang='eng' dir='ltr'><em>10T</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 836 1490 988 1518; x_wconf 84' lang='eng' dir='ltr'>(AJ438157)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 168 1537 934 1574; baseline -0.001 -6"><span class='ocrx_word' id='word_1_140' title='bbox 168 1549 187 1564; x_wconf 73' lang='eng'><em>51</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 267 1537 290 1553; x_wconf 71' lang='eng'>99</span> <span class='ocrx_word' id='word_1_142' title='bbox 345 1546 495 1568; x_wconf 86' lang='eng' dir='ltr'><em>Jannaschia</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 505 1546 573 1568; x_wconf 86' lang='eng' dir='ltr'><em>rubra</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 602 1545 681 1568; x_wconf 90' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 691 1545 767 1568; x_wconf 73' lang='eng' dir='ltr'><em>5088T</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 782 1545 934 1574; x_wconf 84' lang='eng' dir='ltr'>(AJ748747)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 384 1600 1062 1629; baseline 0 -6"><span class='ocrx_word' id='word_1_147' title='bbox 384 1601 518 1623; x_wconf 83' lang='eng' dir='ltr'><em>Loktanel/a</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 530 1601 701 1623; x_wconf 83' lang='eng' dir='ltr'><em>vestfoldensis</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 729 1601 789 1623; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 801 1600 893 1623; x_wconf 89' lang='eng' dir='ltr'><em>22003T</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 910 1601 1062 1629; x_wconf 85' lang='eng' dir='ltr'><em>(AJ582226)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 178 1654 975 1682; baseline -0.003 -5"><span class='ocrx_word' id='word_1_152' title='bbox 178 1661 201 1677; x_wconf 83' lang='eng'>69</span> <span class='ocrx_word' id='word_1_153' title='bbox 371 1657 539 1678; x_wconf 86' lang='eng' dir='ltr'><em>Roseisalinus</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 549 1657 692 1678; x_wconf 81' lang='eng' dir='ltr'><em>antarcticus</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 712 1656 800 1679; x_wconf 78' lang='eng' dir='ltr'><em>EL-88T</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 824 1654 975 1682; x_wconf 84' lang='eng' dir='ltr'>(AJ605747)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 226 1703 1030 1739; baseline -0.002 -5"><span class='ocrx_word' id='word_1_157' title='bbox 226 1703 259 1719; x_wconf 64' lang='eng'>100</span> <span class='ocrx_word' id='word_1_158' title='bbox 361 1711 507 1734; x_wconf 88' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 517 1712 663 1739; x_wconf 87' lang='eng' dir='ltr'><em>granulosus</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 685 1708 843 1731; x_wconf 79' lang='eng' dir='ltr'><em>HTCCZ516T</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 872 1709 1030 1737; x_wconf 86' lang='eng' dir='ltr'>(AY424896)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 264 1766 826 1795; baseline 0.002 -7"><span class='ocrx_word' id='word_1_162' title='bbox 264 1767 383 1794; x_wconf 85' lang='eng' dir='ltr'><em>Ruegeria</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 394 1767 493 1794; x_wconf 85' lang='eng' dir='ltr'><em>algicola</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 511 1767 591 1789; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 602 1766 694 1789; x_wconf 84' lang='eng' dir='ltr'><em>51440T</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 705 1767 826 1795; x_wconf 85' lang='eng' dir='ltr'>(X78315)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 250 1821 922 1850; baseline 0 -6"><span class='ocrx_word' id='word_1_167' title='bbox 250 1822 386 1850; x_wconf 76' lang='eng' dir='ltr'><em>Leisingera</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 396 1822 660 1850; x_wconf 80' lang='eng' dir='ltr'><em>methylohalidivorans</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 679 1821 749 1844; x_wconf 79' lang='eng' dir='ltr'><em>MBZT</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 765 1822 922 1850; x_wconf 85' lang='eng' dir='ltr'>(AY005463)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 163 1874 918 1905; baseline 0 -6"><span class='ocrx_word' id='word_1_171' title='bbox 163 1889 185 1905; x_wconf 70' lang='eng'><em>93</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 263 1877 610 1905; x_wconf 80' lang='eng' dir='ltr'><em>Phaeobacterdaeponensis</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 636 1874 742 1897; x_wconf 74' lang='eng' dir='ltr'><em>TF-218T</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 755 1877 918 1905; x_wconf 87' lang='eng' dir='ltr'><em>(DQ981486)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 157 1931 857 1960; baseline 0 -6"><span class='ocrx_word' id='word_1_175' title='bbox 157 1937 180 1953; x_wconf 87' lang='eng'>54</span> <span class='ocrx_word' id='word_1_176' title='bbox 249 1933 598 1960; x_wconf 86' lang='eng' dir='ltr'><em>Phaeobactergallaeciensis</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 619 1931 717 1954; x_wconf 84' lang='eng' dir='ltr'><em>BS107T</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 736 1932 857 1960; x_wconf 85' lang='eng' dir='ltr'>(Y13244)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 134 1840 156 1856">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 134 1840 156 1856">
+     <span class='ocr_line' id='line_1_40' title="bbox 134 1840 156 1856; baseline 0 0"><span class='ocrx_word' id='word_1_179' title='bbox 134 1840 156 1856; x_wconf 88' lang='eng'>58</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 180 1979 895 2019">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 180 1979 895 2019">
+     <span class='ocr_line' id='line_1_41' title="bbox 180 1979 895 2019; baseline 0.003 -9"><span class='ocrx_word' id='word_1_180' title='bbox 180 1979 213 1995; x_wconf 67' lang='eng'><em>10°</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 244 1988 532 2010; x_wconf 73' lang='eng' dir='ltr'><em>Phaeobacterinh/bens</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 553 1990 614 2013; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 625 1990 718 2013; x_wconf 88' lang='eng' dir='ltr'><em>22475T</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 738 1990 895 2019; x_wconf 91' lang='eng' dir='ltr'>(AY177712)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 0 2038 685 2057">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 0 2039 685 2056">
+     <span class='ocr_line' id='line_1_42' title="bbox 0 2039 685 2056; baseline 0 51"><span class='ocrx_word' id='word_1_185' title='bbox 0 2039 685 2056; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 687 2043 1240 2104">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 687 2043 1240 2104">
+     <span class='ocr_line' id='line_1_43' title="bbox 687 2043 1237 2071; baseline 0 -6"><span class='ocrx_word' id='word_1_186' title='bbox 687 2043 841 2065; x_wconf 85' lang='eng' dir='ltr'><em>Aeromonas</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 850 2043 986 2071; x_wconf 88' lang='eng' dir='ltr'><em>hydrophila</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 1007 2043 1091 2071; x_wconf 86' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_189' title='bbox 1108 2043 1237 2065; x_wconf 83' lang='eng' dir='ltr'><em>bestiarum</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 935 2075 1240 2104; baseline -0.003 -6"><span class='ocrx_word' id='word_1_190' title='bbox 935 2076 1015 2098; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 1026 2075 1102 2098; x_wconf 80' lang='eng' dir='ltr'><em>7966T</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 1120 2076 1240 2104; x_wconf 88' lang='eng' dir='ltr'><em>(X74677)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002691-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002691-0-000.pbm.png
new file mode 100644
index 00000000..eca6a5d0
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002691-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002691-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002691-0-000.pbm.png.hocr
new file mode 100644
index 00000000..d594eacb
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002691-0-000.pbm.png.hocr
@@ -0,0 +1,177 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002691-0-000.pbm.png"; bbox 0 0 1242 1345; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 243 2 1079 493">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 243 2 993 34">
+     <span class='ocr_line' id='line_1_1' title="bbox 243 2 993 34; baseline 0 -5"><span class='ocrx_word' id='word_1_1' title='bbox 243 5 275 26; x_wconf 87' lang='eng'>90</span> <span class='ocrx_word' id='word_1_2' title='bbox 313 5 502 29; x_wconf 83' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 515 5 611 29; x_wconf 83' lang='eng' dir='ltr'><em>citreus</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 624 4 730 30; x_wconf 92' lang='eng' dir='ltr'>NCIMB</span> <span class='ocrx_word' id='word_1_5' title='bbox 746 4 834 29; x_wconf 80' lang='eng' dir='ltr'><em>1493T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 851 2 993 34; x_wconf 86' lang='eng' dir='ltr'><em>(X62172)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 246 60 1010 296">
+     <span class='ocr_line' id='line_1_2' title="bbox 246 60 931 100; baseline 0.001 -6"><span class='ocrx_word' id='word_1_7' title='bbox 246 60 276 80; x_wconf 77' lang='eng'><em>75</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 309 70 498 95; x_wconf 87' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 511 70 669 95; x_wconf 84' lang='eng' dir='ltr'><em>rifietoensis</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 681 69 739 95; x_wconf 91' lang='eng' dir='ltr'><em>M8T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 756 67 931 100; x_wconf 86' lang='eng' dir='ltr'><em>(AJ493659)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 335 133 1010 168; baseline 0 -8"><span class='ocrx_word' id='word_1_12' title='bbox 335 136 524 160; x_wconf 84' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 536 136 679 160; x_wconf 85' lang='eng' dir='ltr'><em>columbae</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 692 136 778 168; x_wconf 91' lang='eng' dir='ltr'>PgEx1</span> <span class='ocrx_word' id='word_1_15' title='bbox 789 134 818 160; x_wconf 94' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 835 133 1010 165; x_wconf 86' lang='eng' dir='ltr'><em>(AJ966515)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 315 198 949 231; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 315 201 505 226; x_wconf 90' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 517 201 658 226; x_wconf 84' lang='eng' dir='ltr'><em>maritimus</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 669 200 751 226; x_wconf 86' lang='eng' dir='ltr'><em>TF-9T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 768 198 949 231; x_wconf 91' lang='eng' dir='ltr'>(AF500007)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 318 263 934 296; baseline 0 -5"><span class='ocrx_word' id='word_1_21' title='bbox 318 266 508 291; x_wconf 89' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 520 266 676 291; x_wconf 82' lang='eng' dir='ltr'><em>maitriensis</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 688 265 742 291; x_wconf 90' lang='eng' dir='ltr'><em>S1T</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 759 263 934 296; x_wconf 85' lang='eng' dir='ltr'><em>(AJ544622)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 301 329 1045 427">
+     <span class='ocr_line' id='line_1_6' title="bbox 301 329 1045 361; baseline 0 -5"><span class='ocrx_word' id='word_1_25' title='bbox 301 354 311 356; x_wconf 97' lang='eng'>_</span> <span class='ocrx_word' id='word_1_26' title='bbox 322 332 511 356; x_wconf 81' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 523 332 683 356; x_wconf 77' lang='eng' dir='ltr'><em>antarcticus</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 694 331 769 357; x_wconf 90' lang='eng' dir='ltr'><em>CMS</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 782 329 1045 361; x_wconf 74' lang='eng' dir='ltr'><em>260rT(AJ314745)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 301 368 1009 427; baseline 0 -5"><span class='ocrx_word' id='word_1_30' title='bbox 301 368 520 422; x_wconf 49' lang='eng' dir='ltr'><em>fig/anacoccus</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 532 397 631 422; x_wconf 88' lang='eng' dir='ltr'><em>kocurii</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 651 397 757 422; x_wconf 91' lang='eng' dir='ltr'>NCIMB</span> <span class='ocrx_word' id='word_1_33' title='bbox 771 396 841 422; x_wconf 76' lang='eng' dir='ltr'><em>629T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 868 394 1009 427; x_wconf 86' lang='eng' dir='ltr'><em>(X62173)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 291 460 1079 493">
+     <span class='ocr_line' id='line_1_8' title="bbox 291 460 1079 493; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 291 484 324 486; x_wconf 96' lang='eng'>_</span> <span class='ocrx_word' id='word_1_36' title='bbox 336 463 525 488; x_wconf 82' lang='eng' dir='ltr'><em>Planococcus</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 537 463 744 488; x_wconf 78' lang='eng' dir='ltr'><em>stackebrandtii</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 754 461 879 488; x_wconf 75' lang='eng' dir='ltr'><em>K22—03T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 896 460 1079 493; x_wconf 87' lang='eng' dir='ltr'><em>(AY437845)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 291 525 1154 560">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 291 525 1154 560">
+     <span class='ocr_line' id='line_1_9' title="bbox 291 525 1154 560; baseline 0 -7"><span class='ocrx_word' id='word_1_40' title='bbox 291 550 305 552; x_wconf 96' lang='eng'>_</span> <span class='ocrx_word' id='word_1_41' title='bbox 316 528 555 553; x_wconf 88' lang='eng' dir='ltr'><em>P/anomicrobium</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 566 528 782 560; x_wconf 81' lang='eng' dir='ltr'><em>psychrophi/um</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 795 528 869 553; x_wconf 90' lang='eng' dir='ltr'><em>CMS</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 882 527 962 553; x_wconf 89' lang='eng' dir='ltr'><em>53orT</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 979 525 1154 558; x_wconf 88' lang='eng' dir='ltr'><em>(AJ314746)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 273 120 328 596">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 273 120 328 596">
+     <span class='ocr_line' id='line_1_10' title="bbox 278 120 328 182; baseline 0 1163"><span class='ocrx_word' id='word_1_46' title='bbox 278 120 328 182; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 278 182 315 313; baseline 0 0"><span class='ocrx_word' id='word_1_47' title='bbox 278 182 315 313; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 279 313 299 377; baseline 0 968"><span class='ocrx_word' id='word_1_48' title='bbox 279 313 299 377; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 273 377 299 509; baseline 0 -65"><span class='ocrx_word' id='word_1_49' title='bbox 273 377 299 509; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 273 509 285 596; baseline 0 749"><span class='ocrx_word' id='word_1_50' title='bbox 273 509 285 596; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 240 200 270 220">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 240 200 270 220">
+     <span class='ocr_line' id='line_1_15' title="bbox 240 200 270 220; baseline 0 0"><span class='ocrx_word' id='word_1_51' title='bbox 240 200 270 220; x_wconf 91' lang='eng'><em>75</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 299 354 301 421">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 299 354 301 421">
+     <span class='ocr_line' id='line_1_16' title="bbox 299 354 301 421; baseline 0 924"><span class='ocrx_word' id='word_1_52' title='bbox 299 354 301 421; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 237 664 279 665">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 237 664 279 665">
+     <span class='ocr_line' id='line_1_17' title="bbox 237 664 279 665; baseline 0 680"><span class='ocrx_word' id='word_1_53' title='bbox 237 664 279 665; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 290 681 295 813">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 290 681 295 813">
+     <span class='ocr_line' id='line_1_18' title="bbox 290 681 295 813; baseline 0 532"><span class='ocrx_word' id='word_1_54' title='bbox 290 681 295 813; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 291 681 296 813">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 291 681 296 813">
+     <span class='ocr_line' id='line_1_19' title="bbox 291 681 296 813; baseline 0 532"><span class='ocrx_word' id='word_1_55' title='bbox 291 681 296 813; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 277 596 279 879">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 277 596 279 879">
+     <span class='ocr_line' id='line_1_20' title="bbox 277 596 279 879; baseline 0 466"><span class='ocrx_word' id='word_1_56' title='bbox 277 596 279 879; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 237 664 238 944">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 237 664 238 944">
+     <span class='ocr_line' id='line_1_21' title="bbox 237 664 238 944; baseline 0 401"><span class='ocrx_word' id='word_1_57' title='bbox 237 664 238 944; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 181 591 1240 1001">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 181 591 1240 1001">
+     <span class='ocr_line' id='line_1_22' title="bbox 289 591 1103 623; baseline 0 -5"><span class='ocrx_word' id='word_1_58' title='bbox 289 615 299 617; x_wconf 95' lang='eng'>_</span> <span class='ocrx_word' id='word_1_59' title='bbox 310 594 549 618; x_wconf 82' lang='eng' dir='ltr'><em>Planomicrobium</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 561 594 755 618; x_wconf 87' lang='eng' dir='ltr'><em>okeanokoites</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 767 593 818 618; x_wconf 93' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 833 592 942 618; x_wconf 80' lang='eng' dir='ltr'><em>12536T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 959 591 1103 623; x_wconf 86' lang='eng' dir='ltr'>(D55729)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 208 632 1047 689; baseline 0.001 -6"><span class='ocrx_word' id='word_1_64' title='bbox 208 632 255 653; x_wconf 70' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 292 681 309 682; x_wconf 47' lang='eng'><em>,</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 329 659 568 684; x_wconf 85' lang='eng' dir='ltr'><em>Planomicrobium</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 581 659 712 684; x_wconf 87' lang='eng' dir='ltr'><em>chinense</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 726 658 854 684; x_wconf 86' lang='eng' dir='ltr'><em>DX3—12T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 871 656 1047 689; x_wconf 83' lang='eng' dir='ltr'><em>(AJ697862)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 295 721 993 754; baseline 0 -5"><span class='ocrx_word' id='word_1_70' title='bbox 295 746 305 748; x_wconf 95' lang='eng'>_</span> <span class='ocrx_word' id='word_1_71' title='bbox 316 724 555 749; x_wconf 89' lang='eng' dir='ltr'><em>P/anomicrobium</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 567 724 700 749; x_wconf 88' lang='eng' dir='ltr'><em>koreense</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 711 721 993 754; x_wconf 77' lang='eng' dir='ltr'><em>JG07T(AF144750)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 190 776 1071 819; baseline 0 -5"><span class='ocrx_word' id='word_1_74' title='bbox 190 776 221 796; x_wconf 77' lang='eng'>54</span> <span class='ocrx_word' id='word_1_75' title='bbox 295 811 312 813; x_wconf 96' lang='eng'>_</span> <span class='ocrx_word' id='word_1_76' title='bbox 323 790 562 814; x_wconf 82' lang='eng' dir='ltr'><em>P/anomicrobium</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 574 790 742 814; x_wconf 86' lang='eng' dir='ltr'><em>mcmeekinii</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 751 788 864 815; x_wconf 73' lang='eng' dir='ltr'><em>823F2T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 890 787 994 819; x_wconf 94' lang='eng' dir='ltr'>(AFO41</span> <span class='ocrx_word' id='word_1_80' title='bbox 1005 787 1071 819; x_wconf 89' lang='eng'>791)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 279 853 1240 885; baseline 0 -5"><span class='ocrx_word' id='word_1_81' title='bbox 279 877 301 879; x_wconf 96' lang='eng'>_</span> <span class='ocrx_word' id='word_1_82' title='bbox 312 855 551 880; x_wconf 88' lang='eng' dir='ltr'><em>P/anomicrobium</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 563 855 798 880; x_wconf 85' lang='eng' dir='ltr'><em>alkanoc/asticum</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 812 855 918 880; x_wconf 92' lang='eng' dir='ltr'>NCIMB</span> <span class='ocrx_word' id='word_1_85' title='bbox 934 854 1042 880; x_wconf 81' lang='eng' dir='ltr'><em>13489T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1059 853 1240 885; x_wconf 83' lang='eng' dir='ltr'><em>(AF029364)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 181 899 1034 951; baseline 0 -6"><span class='ocrx_word' id='word_1_87' title='bbox 181 899 213 919; x_wconf 75' lang='eng'>88</span> <span class='ocrx_word' id='word_1_88' title='bbox 238 942 284 944; x_wconf 96' lang='eng'>_</span> <span class='ocrx_word' id='word_1_89' title='bbox 295 921 481 951; x_wconf 85' lang='eng' dir='ltr'><em>Bhargavaea</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 493 921 697 945; x_wconf 89' lang='eng' dir='ltr'><em>cecembensis</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 710 920 828 945; x_wconf 86' lang='eng' dir='ltr'><em>DSE10T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 846 917 1034 950; x_wconf 88' lang='eng' dir='ltr'><em>(AM286423)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 237 981 267 1001; baseline 0 0"><span class='ocrx_word' id='word_1_93' title='bbox 237 981 267 1001; x_wconf 91' lang='eng'>74</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 302 1038 799 1073">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 302 1038 799 1073">
+     <span class='ocr_line' id='line_1_29' title="bbox 302 1038 799 1073; baseline 0 -7"><span class='ocrx_word' id='word_1_94' title='bbox 302 1040 387 1066; x_wconf 88' lang='eng' dir='ltr'>Clade</span> <span class='ocrx_word' id='word_1_95' title='bbox 400 1041 403 1065; x_wconf 99' lang='eng'><strong><em>|</em></strong></span> <span class='ocrx_word' id='word_1_96' title='bbox 417 1038 543 1070; x_wconf 82' lang='eng' dir='ltr'><em>[Bacillus</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 554 1049 595 1073; x_wconf 85' lang='eng' dir='ltr'><em>Sp.</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 608 1038 656 1071; x_wconf 85' lang='eng'><em>(29</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 669 1038 799 1073; x_wconf 86' lang='eng' dir='ltr'><em>species)]</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 169 1058 216 1060">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 169 1058 216 1060">
+     <span class='ocr_line' id='line_1_30' title="bbox 169 1058 216 1060; baseline 0 285"><span class='ocrx_word' id='word_1_100' title='bbox 169 1058 216 1060; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 2 1164 171 1165">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 2 1164 171 1165">
+     <span class='ocr_line' id='line_1_31' title="bbox 2 1164 171 1165; baseline 0 180"><span class='ocrx_word' id='word_1_101' title='bbox 2 1164 171 1165; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 2 1164 3 1337">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 2 1164 3 1337">
+     <span class='ocr_line' id='line_1_32' title="bbox 2 1164 3 1337; baseline 0 8"><span class='ocrx_word' id='word_1_102' title='bbox 2 1164 3 1337; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 169 1058 171 1271">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 169 1058 171 1271">
+     <span class='ocr_line' id='line_1_33' title="bbox 169 1058 171 1271; baseline 0 74"><span class='ocrx_word' id='word_1_103' title='bbox 169 1058 171 1271; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 214 929 216 1189">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 214 929 216 1189">
+     <span class='ocr_line' id='line_1_34' title="bbox 214 929 216 1189; baseline 0 156"><span class='ocrx_word' id='word_1_104' title='bbox 214 929 216 1189; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 216 1142 870 1235">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 216 1142 870 1235">
+     <span class='ocr_line' id='line_1_35' title="bbox 228 1146 254 1165; baseline 0 0"><span class='ocrx_word' id='word_1_105' title='bbox 228 1146 254 1165; x_wconf 90' lang='eng'>71</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 216 1142 870 1235; baseline 0 -39"><span class='ocrx_word' id='word_1_106' title='bbox 216 1142 302 1235; x_wconf 45' lang='eng'><strong>&lt;</strong></span> <span class='ocrx_word' id='word_1_107' title='bbox 313 1171 399 1196; x_wconf 84' lang='eng' dir='ltr'><em>Clade</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 412 1171 423 1196; x_wconf 99' lang='eng'><strong><em>||</em></strong></span> <span class='ocrx_word' id='word_1_109' title='bbox 437 1169 622 1201; x_wconf 83' lang='eng' dir='ltr'><em>[Geobaci/lus</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 633 1179 667 1203; x_wconf 87' lang='eng' dir='ltr'><em>sp</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 679 1169 701 1201; x_wconf 94' lang='eng'>(1</span> <span class='ocrx_word' id='word_1_112' title='bbox 712 1173 726 1196; x_wconf 98' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 739 1169 870 1203; x_wconf 85' lang='eng' dir='ltr'><em>species)]</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 317 1245 990 1343">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 317 1245 990 1343">
+     <span class='ocr_line' id='line_1_37' title="bbox 317 1245 990 1280; baseline 0 -8"><span class='ocrx_word' id='word_1_114' title='bbox 317 1248 512 1272; x_wconf 83' lang='eng' dir='ltr'><em>PaenibaCi/lus</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 523 1248 659 1280; x_wconf 77' lang='eng' dir='ltr'><em>polymyxa</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 672 1247 743 1273; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 756 1246 807 1272; x_wconf 78' lang='eng' dir='ltr'><em>36T</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 815 1245 990 1277; x_wconf 86' lang='eng' dir='ltr'><em>(AJ320493)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 367 1310 978 1343; baseline 0 -6"><span class='ocrx_word' id='word_1_119' title='bbox 367 1313 537 1338; x_wconf 84' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 549 1313 602 1338; x_wconf 86' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 610 1313 702 1338; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 717 1314 725 1337; x_wconf 98' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 737 1314 746 1337; x_wconf 94' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 756 1312 825 1338; x_wconf 94' lang='eng' dir='ltr'><em>775T</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 836 1310 978 1343; x_wconf 84' lang='eng' dir='ltr'>(X80725)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002725-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002725-0-000.pbm.png
new file mode 100644
index 00000000..fe569e23
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002725-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002725-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002725-0-000.pbm.png.hocr
new file mode 100644
index 00000000..fa969f23
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002725-0-000.pbm.png.hocr
@@ -0,0 +1,114 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002725-0-000.pbm.png"; bbox 0 0 1479 773; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 29 0 1347 93">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 129 0 1347 93">
+     <span class='ocr_line' id='line_1_1' title="bbox 129 0 1306 44; baseline 0.004 -13"><span class='ocrx_word' id='word_1_1' title='bbox 129 0 207 31; x_wconf 93' lang='eng'><strong>0.05</strong></span> <span class='ocrx_word' id='word_1_2' title='bbox 510 17 549 36; x_wconf 84' lang='eng'><strong>100</strong></span> <span class='ocrx_word' id='word_1_3' title='bbox 571 4 786 44; x_wconf 88' lang='eng' dir='ltr'><strong>Spirosoma</strong></span> <span class='ocrx_word' id='word_1_4' title='bbox 799 4 935 36; x_wconf 89' lang='eng' dir='ltr'><strong>Iuteum</strong></span> <span class='ocrx_word' id='word_1_5' title='bbox 950 4 1071 36; x_wconf 92' lang='eng' dir='ltr'><strong>M5-H2</strong></span> <span class='ocrx_word' id='word_1_6' title='bbox 1087 4 1306 44; x_wconf 89' lang='eng' dir='ltr'><strong>(EF187349)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 449 47 1347 93; baseline 0.001 -9"><span class='ocrx_word' id='word_1_7' title='bbox 449 58 488 77; x_wconf 82' lang='eng'><strong>100</strong></span> <span class='ocrx_word' id='word_1_8' title='bbox 510 47 549 66; x_wconf 61' lang='eng'><strong>‘00</strong></span> <span class='ocrx_word' id='word_1_9' title='bbox 572 53 786 93; x_wconf 89' lang='eng' dir='ltr'><strong>Spirosoma</strong></span> <span class='ocrx_word' id='word_1_10' title='bbox 800 54 935 85; x_wconf 90' lang='eng' dir='ltr'><strong>Iuteum</strong></span> <span class='ocrx_word' id='word_1_11' title='bbox 949 53 1115 85; x_wconf 93' lang='eng' dir='ltr'><strong>SPM-1OT</strong></span> <span class='ocrx_word' id='word_1_12' title='bbox 1128 54 1347 93; x_wconf 91' lang='eng' dir='ltr'><strong>(EF451726)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 461 87 1479 329">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 461 87 1479 329">
+     <span class='ocr_line' id='line_1_3' title="bbox 461 87 1479 148; baseline 0 -8"><span class='ocrx_word' id='word_1_13' title='bbox 461 87 488 106; x_wconf 65' lang='eng'><strong>94</strong></span> <span class='ocrx_word' id='word_1_14' title='bbox 581 109 795 148; x_wconf 87' lang='eng' dir='ltr'><strong>Spirosoma</strong></span> <span class='ocrx_word' id='word_1_15' title='bbox 808 109 1092 148; x_wconf 90' lang='eng' dir='ltr'><strong>spitsbergense</strong></span> <span class='ocrx_word' id='word_1_16' title='bbox 1105 109 1248 140; x_wconf 90' lang='eng' dir='ltr'><strong>SPM-9T</strong></span> <span class='ocrx_word' id='word_1_17' title='bbox 1261 109 1479 148; x_wconf 92' lang='eng' dir='ltr'><strong>(EF451725)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 604 167 1342 207; baseline 0.001 -9"><span class='ocrx_word' id='word_1_18' title='bbox 604 167 800 207; x_wconf 88' lang='eng' dir='ltr'><strong>Spirosoma</strong></span> <span class='ocrx_word' id='word_1_19' title='bbox 814 168 894 207; x_wconf 91' lang='eng' dir='ltr'><em>rigui</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 905 167 1111 199; x_wconf 92' lang='eng' dir='ltr'><strong>WPCB118T</strong></span> <span class='ocrx_word' id='word_1_21' title='bbox 1125 168 1342 207; x_wconf 89' lang='eng' dir='ltr'><strong>(EF507900)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 585 229 1359 269; baseline 0 -8"><span class='ocrx_word' id='word_1_22' title='bbox 585 229 781 269; x_wconf 89' lang='eng' dir='ltr'><strong>Spirosoma</strong></span> <span class='ocrx_word' id='word_1_23' title='bbox 796 230 939 269; x_wconf 88' lang='eng' dir='ltr'><strong>lingua/e</strong></span> <span class='ocrx_word' id='word_1_24' title='bbox 955 229 1042 261; x_wconf 91' lang='eng' dir='ltr'><strong>DSM</strong></span> <span class='ocrx_word' id='word_1_25' title='bbox 1058 229 1118 261; x_wconf 94' lang='eng' dir='ltr'><strong>74T</strong></span> <span class='ocrx_word' id='word_1_26' title='bbox 1132 230 1359 269; x_wconf 91' lang='eng' dir='ltr'><strong>(AM000023)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 556 289 1327 329; baseline 0 -8"><span class='ocrx_word' id='word_1_27' title='bbox 556 290 742 321; x_wconf 85' lang='eng' dir='ltr'><strong>Rudane/la</strong></span> <span class='ocrx_word' id='word_1_28' title='bbox 756 290 845 321; x_wconf 87' lang='eng' dir='ltr'><em>Iutea</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 861 289 948 321; x_wconf 91' lang='eng' dir='ltr'><strong>DSM</strong></span> <span class='ocrx_word' id='word_1_30' title='bbox 967 289 1095 321; x_wconf 89' lang='eng' dir='ltr'><strong>19387T</strong></span> <span class='ocrx_word' id='word_1_31' title='bbox 1108 290 1327 329; x_wconf 90' lang='eng' dir='ltr'><strong>(EF635010)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 552 347 1446 387">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 552 347 1446 387">
+     <span class='ocr_line' id='line_1_7' title="bbox 552 347 1446 387; baseline 0 -8"><span class='ocrx_word' id='word_1_32' title='bbox 552 348 729 379; x_wconf 87' lang='eng' dir='ltr'><strong>Larkine/la</strong></span> <span class='ocrx_word' id='word_1_33' title='bbox 743 348 913 387; x_wconf 88' lang='eng' dir='ltr'><strong>insperata</strong></span> <span class='ocrx_word' id='word_1_34' title='bbox 930 347 1060 379; x_wconf 93' lang='eng' dir='ltr'><strong>NCIMB</strong></span> <span class='ocrx_word' id='word_1_35' title='bbox 1077 347 1206 379; x_wconf 93' lang='eng' dir='ltr'><strong>14103T</strong></span> <span class='ocrx_word' id='word_1_36' title='bbox 1220 348 1446 387; x_wconf 90' lang='eng' dir='ltr'><strong>(AM000022)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 366 405 1429 496">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 366 405 1429 496">
+     <span class='ocr_line' id='line_1_8' title="bbox 366 405 1409 445; baseline -0.003 -5"><span class='ocrx_word' id='word_1_37' title='bbox 366 419 493 440; x_wconf 87' lang='eng'><strong>100—</strong></span> <span class='ocrx_word' id='word_1_38' title='bbox 507 405 748 445; x_wconf 86' lang='eng' dir='ltr'><strong>Dyadobacter</strong></span> <span class='ocrx_word' id='word_1_39' title='bbox 758 405 932 437; x_wconf 89' lang='eng' dir='ltr'><strong>crustico/a</strong></span> <span class='ocrx_word' id='word_1_40' title='bbox 948 405 1036 437; x_wconf 92' lang='eng' dir='ltr'><strong>DSM</strong></span> <span class='ocrx_word' id='word_1_41' title='bbox 1054 405 1182 437; x_wconf 91' lang='eng' dir='ltr'><strong>16708T</strong></span> <span class='ocrx_word' id='word_1_42' title='bbox 1197 405 1409 445; x_wconf 92' lang='eng' dir='ltr'><strong>(AJ821885)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 410 457 1429 496; baseline 0 -8"><span class='ocrx_word' id='word_1_43' title='bbox 410 472 507 474; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_44' title='bbox 520 457 761 496; x_wconf 89' lang='eng' dir='ltr'><strong>Dyadobacter</strong></span> <span class='ocrx_word' id='word_1_45' title='bbox 770 457 961 488; x_wconf 90' lang='eng' dir='ltr'><strong>hamtensis</strong></span> <span class='ocrx_word' id='word_1_46' title='bbox 973 457 1055 488; x_wconf 89' lang='eng' dir='ltr'><strong>JCM</strong></span> <span class='ocrx_word' id='word_1_47' title='bbox 1074 457 1202 488; x_wconf 89' lang='eng' dir='ltr'><strong>12919T</strong></span> <span class='ocrx_word' id='word_1_48' title='bbox 1216 457 1429 496; x_wconf 91' lang='eng' dir='ltr'><strong>(AJ619978)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 613 514 1431 606">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 613 514 1431 606">
+     <span class='ocr_line' id='line_1_10' title="bbox 613 514 1431 554; baseline 0.001 -9"><span class='ocrx_word' id='word_1_49' title='bbox 613 514 752 546; x_wconf 87' lang='eng' dir='ltr'><strong>Rune/Ia</strong></span> <span class='ocrx_word' id='word_1_50' title='bbox 766 514 976 554; x_wconf 90' lang='eng' dir='ltr'><strong>slithyformis</strong></span> <span class='ocrx_word' id='word_1_51' title='bbox 987 514 1096 546; x_wconf 93' lang='eng' dir='ltr'><strong>ATCC</strong></span> <span class='ocrx_word' id='word_1_52' title='bbox 1110 514 1242 546; x_wconf 89' lang='eng' dir='ltr'><strong>29530T</strong></span> <span class='ocrx_word' id='word_1_53' title='bbox 1256 514 1431 554; x_wconf 89' lang='eng' dir='ltr'><strong>(M62786)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 629 565 1422 606; baseline 0 -10"><span class='ocrx_word' id='word_1_54' title='bbox 629 566 768 597; x_wconf 88' lang='eng' dir='ltr'><strong>Rune/la</strong></span> <span class='ocrx_word' id='word_1_55' title='bbox 783 573 872 597; x_wconf 89' lang='eng' dir='ltr'><strong>zeae</strong></span> <span class='ocrx_word' id='word_1_56' title='bbox 885 565 994 597; x_wconf 92' lang='eng' dir='ltr'><strong>ATCC</strong></span> <span class='ocrx_word' id='word_1_57' title='bbox 1011 565 1191 597; x_wconf 87' lang='eng' dir='ltr'><strong>BAA-293T</strong></span> <span class='ocrx_word' id='word_1_58' title='bbox 1205 566 1422 606; x_wconf 85' lang='eng' dir='ltr'><strong>(AF137381)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 420 621 1264 773">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 420 621 1264 773">
+     <span class='ocr_line' id='line_1_12' title="bbox 460 621 1264 661; baseline 0 -8"><span class='ocrx_word' id='word_1_59' title='bbox 460 622 618 653; x_wconf 90' lang='eng' dir='ltr'><strong>Arcice/la</strong></span> <span class='ocrx_word' id='word_1_60' title='bbox 633 622 788 661; x_wconf 87' lang='eng' dir='ltr'><strong>aquatica</strong></span> <span class='ocrx_word' id='word_1_61' title='bbox 805 621 891 653; x_wconf 92' lang='eng' dir='ltr'><strong>LMG</strong></span> <span class='ocrx_word' id='word_1_62' title='bbox 905 621 1037 653; x_wconf 88' lang='eng' dir='ltr'><strong>21963T</strong></span> <span class='ocrx_word' id='word_1_63' title='bbox 1051 622 1264 661; x_wconf 88' lang='eng' dir='ltr'><strong>(AJ535729)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 461 677 1222 717; baseline 0 -8"><span class='ocrx_word' id='word_1_64' title='bbox 461 678 714 709; x_wconf 85' lang='eng' dir='ltr'><strong>Flectobaci/Ius</strong></span> <span class='ocrx_word' id='word_1_65' title='bbox 727 678 835 717; x_wconf 85' lang='eng' dir='ltr'><em>major</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 846 677 933 709; x_wconf 91' lang='eng' dir='ltr'><strong>DSM</strong></span> <span class='ocrx_word' id='word_1_67' title='bbox 952 677 1033 709; x_wconf 83' lang='eng' dir='ltr'><strong>103T</strong></span> <span class='ocrx_word' id='word_1_68' title='bbox 1047 678 1222 717; x_wconf 88' lang='eng' dir='ltr'><strong>(M62787)</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 420 735 1262 773; baseline -0.001 -6"><span class='ocrx_word' id='word_1_69' title='bbox 420 735 674 767; x_wconf 88' lang='eng' dir='ltr'><strong>Flectobacillus</strong></span> <span class='ocrx_word' id='word_1_70' title='bbox 685 735 782 767; x_wconf 84' lang='eng' dir='ltr'><em>lacus</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 795 735 877 767; x_wconf 92' lang='eng' dir='ltr'><strong>JCM</strong></span> <span class='ocrx_word' id='word_1_72' title='bbox 896 735 1024 767; x_wconf 89' lang='eng' dir='ltr'><strong>13398T</strong></span> <span class='ocrx_word' id='word_1_73' title='bbox 1038 735 1262 773; x_wconf 90' lang='eng' dir='ltr'><strong>(DQ112352)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 184 64 594 310">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 184 64 594 310">
+     <span class='ocr_line' id='line_1_15' title="bbox 419 64 568 115; baseline 0 0"><span class='ocrx_word' id='word_1_74' title='bbox 419 78 461 115; x_wconf 95' lang='eng' dir='ltr'><strong> </strong></span> <span class='ocrx_word' id='word_1_75' title='bbox 488 64 568 115; x_wconf 95' lang='eng' dir='ltr'><strong>  </strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 260 115 581 167; baseline 0 606"><span class='ocrx_word' id='word_1_76' title='bbox 260 115 581 167; x_wconf 95' lang='eng' dir='ltr'><strong> </strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 184 167 594 209; baseline 0 564"><span class='ocrx_word' id='word_1_77' title='bbox 184 167 594 209; x_wconf 95' lang='eng' dir='ltr'><strong> </strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 184 209 585 269; baseline 0 504"><span class='ocrx_word' id='word_1_78' title='bbox 184 209 585 269; x_wconf 95' lang='eng' dir='ltr'><strong> </strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 184 269 556 310; baseline 0 0"><span class='ocrx_word' id='word_1_79' title='bbox 184 269 556 310; x_wconf 95' lang='eng' dir='ltr'><strong>  </strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 146 278 185 296">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 146 278 185 296">
+     <span class='ocr_line' id='line_1_20' title="bbox 146 278 185 296; baseline 0 0"><span class='ocrx_word' id='word_1_80' title='bbox 146 278 185 296; x_wconf 85' lang='eng'><strong>100</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 188 250 190 363">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 188 250 190 363">
+     <span class='ocr_line' id='line_1_21' title="bbox 188 250 190 363; baseline 0 410"><span class='ocrx_word' id='word_1_81' title='bbox 188 250 190 363; x_wconf 95' lang='eng' dir='ltr'><strong> </strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 0 298 617 755">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 0 298 617 755">
+     <span class='ocr_line' id='line_1_22' title="bbox 26 298 192 349; baseline 0 424"><span class='ocrx_word' id='word_1_82' title='bbox 26 298 192 349; x_wconf 95' lang='eng' dir='ltr'><strong> </strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 26 349 192 438; baseline 0 0"><span class='ocrx_word' id='word_1_83' title='bbox 26 349 192 438; x_wconf 95' lang='eng' dir='ltr'><strong>  </strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 0 438 410 515; baseline 0 -50"><span class='ocrx_word' id='word_1_84' title='bbox 0 438 410 515; x_wconf 95' lang='eng' dir='ltr'><strong>  </strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 0 515 617 601; baseline 0 0"><span class='ocrx_word' id='word_1_85' title='bbox 0 515 617 601; x_wconf 95' lang='eng' dir='ltr'><strong>  </strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 26 601 460 755; baseline 0 -39"><span class='ocrx_word' id='word_1_86' title='bbox 26 601 460 755; x_wconf 95' lang='eng' dir='ltr'><strong>   </strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 408 420 410 474">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 408 420 410 474">
+     <span class='ocr_line' id='line_1_27' title="bbox 408 420 410 474; baseline 0 299"><span class='ocrx_word' id='word_1_87' title='bbox 408 420 410 474; x_wconf 95' lang='eng' dir='ltr'><strong> </strong></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002741-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002741-0-000.pbm.png
new file mode 100644
index 00000000..fcd4090b
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002741-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002741-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002741-0-000.pbm.png.hocr
new file mode 100644
index 00000000..ff79c621
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002741-0-000.pbm.png.hocr
@@ -0,0 +1,370 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002741-0-000.pbm.png"; bbox 0 0 1420 1853; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 488 1 558 21">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 488 2 558 20">
+     <span class='ocr_line' id='line_1_1' title="bbox 488 2 558 20; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 488 2 558 20; x_wconf 92' lang='eng'>100/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 447 37 526 88">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 447 37 526 87">
+     <span class='ocr_line' id='line_1_2' title="bbox 466 37 526 56; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 466 37 500 56; x_wconf 87' lang='eng'>99/1</span> <span class='ocrx_word' id='word_1_3' title='bbox 505 38 526 56; x_wconf 95' lang='eng'><em>00</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 447 69 496 87; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 447 69 496 87; x_wconf 84' lang='eng'>53/94</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 511 155 560 175">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 511 156 560 174">
+     <span class='ocr_line' id='line_1_4' title="bbox 511 156 560 174; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 511 156 560 174; x_wconf 88' lang='eng'><em>51/52</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 473 223 563 273">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 473 224 563 272">
+     <span class='ocr_line' id='line_1_5' title="bbox 493 224 563 243; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 493 224 563 243; x_wconf 87' lang='eng'>100/100</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 473 254 533 272; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 473 254 533 272; x_wconf 83' lang='eng'>63/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 454 298 503 317">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 454 298 503 317">
+     <span class='ocr_line' id='line_1_7' title="bbox 454 298 503 317; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 454 298 503 317; x_wconf 84' lang='eng'>53/74</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 356 239 416 257">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 356 239 416 257">
+     <span class='ocr_line' id='line_1_8' title="bbox 356 239 416 257; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 356 239 416 257; x_wconf 85' lang='eng'>95/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 291 330 351 349">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 291 330 351 349">
+     <span class='ocr_line' id='line_1_9' title="bbox 291 330 351 349; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 291 330 351 349; x_wconf 86' lang='eng'>95/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 507 386 566 406">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 507 387 566 405">
+     <span class='ocr_line' id='line_1_10' title="bbox 507 387 566 405; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 507 387 566 405; x_wconf 89' lang='eng'>100/92</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 222 423 530 453">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 222 424 530 453">
+     <span class='ocr_line' id='line_1_11' title="bbox 222 424 530 453; baseline 0 -11"><span class='ocrx_word' id='word_1_12' title='bbox 222 434 271 453; x_wconf 63' lang='eng'><em>82,94</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 460 424 530 442; x_wconf 85' lang='eng'>100/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 504 513 564 533">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 504 514 564 532">
+     <span class='ocr_line' id='line_1_12' title="bbox 504 514 564 532; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 504 514 564 532; x_wconf 87' lang='eng'>95/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 143 582 579 614">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 143 582 579 614">
+     <span class='ocr_line' id='line_1_13' title="bbox 143 582 579 614; baseline 0 -13"><span class='ocrx_word' id='word_1_15' title='bbox 143 582 202 601; x_wconf 88' lang='eng'>100/99</span> <span class='ocrx_word' id='word_1_16' title='bbox 529 595 579 614; x_wconf 68' lang='eng'>91/69</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 477 624 537 644">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 477 625 537 643">
+     <span class='ocr_line' id='line_1_14' title="bbox 477 625 537 643; baseline 0 0"><span class='ocrx_word' id='word_1_17' title='bbox 477 625 537 643; x_wconf 90' lang='eng'>81/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 479 749 518 768">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 479 749 518 768">
+     <span class='ocr_line' id='line_1_15' title="bbox 479 749 518 768; baseline 0.026 -1"><span class='ocrx_word' id='word_1_18' title='bbox 479 749 518 768; x_wconf 87' lang='eng'><em>76/—</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 62 814 566 843">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 62 814 566 842">
+     <span class='ocr_line' id='line_1_16' title="bbox 62 814 566 842; baseline 0 -10"><span class='ocrx_word' id='word_1_19' title='bbox 62 814 111 832; x_wconf 81' lang='eng'>98/88</span> <span class='ocrx_word' id='word_1_20' title='bbox 517 824 566 842; x_wconf 70' lang='eng'><em>51/99</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 519 869 569 889">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 519 870 569 888">
+     <span class='ocr_line' id='line_1_17' title="bbox 519 870 569 888; baseline 0 0"><span class='ocrx_word' id='word_1_21' title='bbox 519 870 569 888; x_wconf 87' lang='eng'>66/90</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 514 1158 740 1247">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 514 1159 740 1247">
+     <span class='ocr_line' id='line_1_18' title="bbox 514 1159 740 1247; baseline 0 0"><span class='ocrx_word' id='word_1_22' title='bbox 514 1159 740 1247; x_wconf 69' lang='eng' dir='ltr'>56/100E</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 492 1321 553 1341">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 492 1322 553 1340">
+     <span class='ocr_line' id='line_1_19' title="bbox 492 1322 553 1340; baseline 0 0"><span class='ocrx_word' id='word_1_23' title='bbox 492 1322 553 1340; x_wconf 86' lang='eng'>97/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 7 1400 745 1450">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 489 1401 745 1449">
+     <span class='ocr_line' id='line_1_20' title="bbox 489 1401 745 1449; baseline 0 -30"><span class='ocrx_word' id='word_1_24' title='bbox 489 1401 549 1419; x_wconf 86' lang='eng'>94/100</span> <span class='ocrx_word' id='word_1_25' title='bbox 560 1406 745 1449; x_wconf 76' lang='eng'>:</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 509 1486 576 1541">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 509 1487 576 1540">
+     <span class='ocr_line' id='line_1_21' title="bbox 537 1487 576 1506; baseline 0 0"><span class='ocrx_word' id='word_1_26' title='bbox 537 1487 576 1506; x_wconf 84' lang='eng'>69/—</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 509 1522 548 1540; baseline 0 0"><span class='ocrx_word' id='word_1_27' title='bbox 509 1522 548 1540; x_wconf 95' lang='eng'><em>70/—</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 499 1604 559 1625">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 499 1605 559 1624">
+     <span class='ocr_line' id='line_1_23' title="bbox 499 1605 559 1624; baseline 0.017 -1"><span class='ocrx_word' id='word_1_28' title='bbox 499 1605 559 1624; x_wconf 91' lang='eng'>70/100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 760 2 952 67">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 760 2 952 67">
+     <span class='ocr_line' id='line_1_24' title="bbox 761 2 952 23; baseline -0.005 0"><span class='ocrx_word' id='word_1_29' title='bbox 761 2 901 23; x_wconf 78' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 911 2 952 23; x_wconf 83' lang='eng' dir='ltr'><em>coli</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 760 41 936 67; baseline -0.006 -5"><span class='ocrx_word' id='word_1_31' title='bbox 760 41 855 67; x_wconf 87' lang='eng' dir='ltr'><em>Shigella</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 864 41 936 67; x_wconf 86' lang='eng' dir='ltr'><em>boydil</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 759 81 998 132">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 759 81 998 132">
+     <span class='ocr_line' id='line_1_26' title="bbox 759 81 998 102; baseline 0 0"><span class='ocrx_word' id='word_1_33' title='bbox 759 81 893 102; x_wconf 81' lang='eng' dir='ltr'><em>Salmonella</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 902 82 998 102; x_wconf 82' lang='eng' dir='ltr'><em>enter/ca</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 759 112 985 132; baseline 0 0"><span class='ocrx_word' id='word_1_35' title='bbox 759 112 847 132; x_wconf 79' lang='eng' dir='ltr'><em>Erwin/a</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 857 112 985 132; x_wconf 85' lang='eng' dir='ltr'><em>carotovora</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 761 150 936 175">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 761 150 936 175">
+     <span class='ocr_line' id='line_1_28' title="bbox 761 150 936 175; baseline 0 -5"><span class='ocrx_word' id='word_1_37' title='bbox 761 150 856 170; x_wconf 82' lang='eng' dir='ltr'><em>Yerslnla</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 864 150 936 175; x_wconf 80' lang='eng' dir='ltr'><em>pestis</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 760 193 1091 249">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 760 193 1091 249">
+     <span class='ocr_line' id='line_1_29' title="bbox 760 193 1091 213; baseline 0 0"><span class='ocrx_word' id='word_1_39' title='bbox 760 193 930 213; x_wconf 78' lang='eng' dir='ltr'><em>Photorhabdus</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 939 193 1091 213; x_wconf 83' lang='eng' dir='ltr'><em>luminescens</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 763 223 1081 249; baseline 0.003 -6"><span class='ocrx_word' id='word_1_41' title='bbox 763 223 945 249; x_wconf 73' lang='eng' dir='ltr'><em>Wigglesworthia</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 954 223 1081 249; x_wconf 85' lang='eng' dir='ltr'><em>glossinidia</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 754 260 1131 321">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 754 260 1130 321">
+     <span class='ocr_line' id='line_1_31' title="bbox 760 260 1007 285; baseline 0 -5"><span class='ocrx_word' id='word_1_43' title='bbox 760 260 876 280; x_wconf 82' lang='eng' dir='ltr'><em>Buchnera</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 886 260 1007 285; x_wconf 77' lang='eng' dir='ltr'><em>aphid/cola</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 754 300 1130 321; baseline 0 0"><span class='ocrx_word' id='word_1_45' title='bbox 754 300 799 321; x_wconf 81' lang='eng' dir='ltr'><em>‘Ca.</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 811 301 948 321; x_wconf 84' lang='eng' dir='ltr'>Baumannia</span> <span class='ocrx_word' id='word_1_47' title='bbox 958 300 1130 321; x_wconf 76' lang='eng' dir='ltr'><em>cicadellinicola’</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 761 343 1053 406">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 761 343 1053 406">
+     <span class='ocr_line' id='line_1_33' title="bbox 762 343 1000 369; baseline 0 -5"><span class='ocrx_word' id='word_1_48' title='bbox 762 343 850 364; x_wconf 85' lang='eng' dir='ltr'><em>Soda/ls</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 859 344 1000 369; x_wconf 83' lang='eng' dir='ltr'><em>gloss/nidius</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 761 380 1053 406; baseline 0.003 -6"><span class='ocrx_word' id='word_1_50' title='bbox 761 381 920 406; x_wconf 84' lang='eng' dir='ltr'><em>Haemophilus</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 929 380 1053 401; x_wconf 87' lang='eng' dir='ltr'><em>influenzae</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 755 422 1154 448">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 755 422 1154 448">
+     <span class='ocr_line' id='line_1_35' title="bbox 755 422 1154 448; baseline 0 -6"><span class='ocrx_word' id='word_1_52' title='bbox 755 422 909 442; x_wconf 78' lang='eng' dir='ltr'><em>‘Mannhelmla</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 918 422 1154 448; x_wconf 79' lang='eng' dir='ltr'><em>succiniciproducens’</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 1168 176 1381 196">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 1168 176 1381 196">
+     <span class='ocr_line' id='line_1_36' title="bbox 1168 176 1381 196; baseline 0 0"><span class='ocrx_word' id='word_1_54' title='bbox 1168 176 1381 196; x_wconf 83' lang='eng' dir='ltr'><em>Enterobacteriales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 1199 422 1371 442">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 1199 422 1371 442">
+     <span class='ocr_line' id='line_1_37' title="bbox 1199 422 1371 442; baseline 0 0"><span class='ocrx_word' id='word_1_55' title='bbox 1199 422 1371 442; x_wconf 83' lang='eng' dir='ltr'><em>Pasteurellales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 760 468 1053 607">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 760 468 1053 607">
+     <span class='ocr_line' id='line_1_38' title="bbox 761 468 1022 488; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 761 468 897 488; x_wconf 83' lang='eng' dir='ltr'><em>Pasteurella</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 906 468 1022 488; x_wconf 85' lang='eng' dir='ltr'><em>multocida</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 760 507 1035 533; baseline 0 -6"><span class='ocrx_word' id='word_1_58' title='bbox 760 507 901 527; x_wconf 86' lang='eng' dir='ltr'><em>Aeromonas</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 909 507 1035 533; x_wconf 88' lang='eng' dir='ltr'><em>hydrophila</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 760 547 1053 567; baseline 0 0"><span class='ocrx_word' id='word_1_60' title='bbox 760 547 901 567; x_wconf 83' lang='eng' dir='ltr'><em>Aeromonas</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 910 547 1053 567; x_wconf 79' lang='eng' dir='ltr'><em>salmonicida</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 761 586 924 607; baseline 0 0"><span class='ocrx_word' id='word_1_62' title='bbox 761 587 827 607; x_wconf 87' lang='eng' dir='ltr'><em>Vibrlo</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 836 586 924 607; x_wconf 87' lang='eng' dir='ltr'><em>fischeri</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 1111 505 1327 571">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 1111 505 1327 571">
+     <span class='ocr_line' id='line_1_42' title="bbox 1111 505 1327 571; baseline 0 -26"><span class='ocrx_word' id='word_1_64' title='bbox 1111 505 1123 571; x_wconf 66' lang='eng'><strong><em>}</em></strong></span> <span class='ocrx_word' id='word_1_65' title='bbox 1133 525 1327 545; x_wconf 84' lang='eng' dir='ltr'><em>Aeromonadales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 761 629 1395 790">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 761 629 1395 790">
+     <span class='ocr_line' id='line_1_43' title="bbox 762 629 1273 655; baseline 0.002 -5"><span class='ocrx_word' id='word_1_66' title='bbox 762 630 953 650; x_wconf 82' lang='eng' dir='ltr'><em>Photobacterium</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 961 629 1092 655; x_wconf 86' lang='eng' dir='ltr'><em>profundum</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1140 632 1273 652; x_wconf 84' lang='eng' dir='ltr'><em>Vibriona/es</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 761 671 941 691; baseline 0 0"><span class='ocrx_word' id='word_1_69' title='bbox 761 671 828 691; x_wconf 88' lang='eng' dir='ltr'><em>Vibrio</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 837 671 941 691; x_wconf 85' lang='eng' dir='ltr'><em>cholerae</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 762 710 1041 731; baseline 0.004 -1"><span class='ocrx_word' id='word_1_71' title='bbox 762 710 902 731; x_wconf 85' lang='eng' dir='ltr'><em>Shewanella</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 911 711 1041 731; x_wconf 85' lang='eng' dir='ltr'><em>oneidensis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 762 749 1009 769; baseline 0 0"><span class='ocrx_word' id='word_1_73' title='bbox 762 749 888 769; x_wconf 84' lang='eng' dir='ltr'><em>ldiomarina</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 897 749 1009 769; x_wconf 87' lang='eng' dir='ltr'><em>loihiensis</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 1189 770 1395 790; baseline 0 0"><span class='ocrx_word' id='word_1_75' title='bbox 1189 770 1395 790; x_wconf 80' lang='eng' dir='ltr'><em>Alteromonadales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 762 788 1158 853">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 762 788 1158 853">
+     <span class='ocr_line' id='line_1_48' title="bbox 762 788 1074 814; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 762 788 869 809; x_wconf 80' lang='eng' dir='ltr'><em>Colwellia</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 877 789 1074 814; x_wconf 80' lang='eng' dir='ltr'><em>psychrerythraea</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 762 828 1158 853; baseline 0 -5"><span class='ocrx_word' id='word_1_78' title='bbox 762 828 1005 848; x_wconf 85' lang='eng' dir='ltr'><em>Pseudoalteromonas</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1014 828 1158 853; x_wconf 83' lang='eng' dir='ltr'><em>haloplanktis</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 761 871 998 934">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 761 871 998 934">
+     <span class='ocr_line' id='line_1_50' title="bbox 761 871 998 896; baseline 0 -5"><span class='ocrx_word' id='word_1_80' title='bbox 761 871 955 896; x_wconf 85' lang='eng' dir='ltr'><em>Oceanospirillum</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 964 876 998 896; x_wconf 88' lang='eng' dir='ltr'><em>sp.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 761 909 974 934; baseline 0 -5"><span class='ocrx_word' id='word_1_82' title='bbox 761 909 934 929; x_wconf 79' lang='eng' dir='ltr'><em>Oceanobacter</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 940 914 974 934; x_wconf 86' lang='eng' dir='ltr'><em>sp.</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 761 952 991 977">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 761 952 991 977">
+     <span class='ocr_line' id='line_1_52' title="bbox 761 952 991 977; baseline 0 -5"><span class='ocrx_word' id='word_1_84' title='bbox 761 952 853 972; x_wconf 85' lang='eng' dir='ltr'><em>Hahella</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 863 952 991 977; x_wconf 85' lang='eng' dir='ltr'><em>chejuensis</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 761 986 1369 1028">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 761 986 1369 1028">
+     <span class='ocr_line' id='line_1_53' title="bbox 761 986 1369 1028; baseline 0 -22"><span class='ocrx_word' id='word_1_86' title='bbox 761 986 988 1006; x_wconf 83' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 994 986 1123 1011; x_wconf 86' lang='eng' dir='ltr'><em>saleXIgens</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 1162 1002 1369 1028; x_wconf 59' lang='eng' dir='ltr'><em>Oceanospiri/Iales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 760 1037 1048 1063">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 760 1037 1048 1063">
+     <span class='ocr_line' id='line_1_54' title="bbox 760 1037 1048 1063; baseline 0 -6"><span class='ocrx_word' id='word_1_89' title='bbox 760 1037 922 1057; x_wconf 82' lang='eng' dir='ltr'><em>Marinabacter</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 929 1037 1048 1063; x_wconf 84' lang='eng' dir='ltr'><em>aquaeolei</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 760 1078 1103 1218">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 760 1078 1103 1218">
+     <span class='ocr_line' id='line_1_55' title="bbox 761 1078 1103 1104; baseline 0 -5"><span class='ocrx_word' id='word_1_91' title='bbox 761 1078 965 1104; x_wconf 86' lang='eng' dir='ltr'><em>Saccharophagus</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 974 1079 1103 1104; x_wconf 85' lang='eng' dir='ltr'><em>degradans</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 762 1117 970 1142; baseline 0 -5"><span class='ocrx_word' id='word_1_93' title='bbox 762 1117 928 1137; x_wconf 84' lang='eng' dir='ltr'><em>Marinomonas</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 937 1122 970 1142; x_wconf 88' lang='eng' dir='ltr'><em>sp.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 760 1157 1083 1177; baseline 0 0"><span class='ocrx_word' id='word_1_95' title='bbox 760 1157 935 1177; x_wconf 86' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 944 1157 1083 1177; x_wconf 81' lang='eng' dir='ltr'><em>fluorescens</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 761 1192 1047 1218; baseline 0 -5"><span class='ocrx_word' id='word_1_97' title='bbox 761 1192 935 1213; x_wconf 87' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 944 1192 1047 1218; x_wconf 82' lang='eng' dir='ltr'><em>syringae</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 760 1235 1078 1298">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 760 1235 1078 1298">
+     <span class='ocr_line' id='line_1_59' title="bbox 760 1235 1078 1260; baseline 0 -5"><span class='ocrx_word' id='word_1_99' title='bbox 760 1235 935 1255; x_wconf 86' lang='eng' dir='ltr'><em>Pseudomonas</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 944 1235 1078 1260; x_wconf 83' lang='eng' dir='ltr'><em>aeruginosa</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 762 1278 1068 1298; baseline 0 0"><span class='ocrx_word' id='word_1_101' title='bbox 762 1278 906 1298; x_wconf 81' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 914 1278 1068 1298; x_wconf 83' lang='eng' dir='ltr'><em>borkumensis</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 1161 1255 1387 1276">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 1161 1255 1387 1276">
+     <span class='ocr_line' id='line_1_61' title="bbox 1161 1255 1387 1276; baseline 0 0"><span class='ocrx_word' id='word_1_103' title='bbox 1161 1255 1387 1276; x_wconf 82' lang='eng' dir='ltr'><em>Pseudomonadales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 760 1322 1052 1423">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 760 1322 1051 1423">
+     <span class='ocr_line' id='line_1_62' title="bbox 760 1322 971 1347; baseline 0 -5"><span class='ocrx_word' id='word_1_104' title='bbox 760 1322 931 1342; x_wconf 81' lang='eng' dir='ltr'><em>Acinetobacter</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 937 1327 971 1347; x_wconf 88' lang='eng' dir='ltr'><em>sp.</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 761 1359 1038 1385; baseline 0 -6"><span class='ocrx_word' id='word_1_106' title='bbox 761 1359 938 1385; x_wconf 78' lang='eng' dir='ltr'><em>Psychrobacter</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 945 1359 1038 1379; x_wconf 82' lang='eng' dir='ltr'><em>arcticus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 762 1397 1051 1423; baseline 0 -6"><span class='ocrx_word' id='word_1_108' title='bbox 762 1397 886 1423; x_wconf 85' lang='eng' dir='ltr'><em>Legione/la</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 894 1397 1051 1423; x_wconf 86' lang='eng' dir='ltr'><em>pneumophila</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 760 1439 1080 1545">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 760 1439 1080 1545">
+     <span class='ocr_line' id='line_1_65' title="bbox 760 1439 954 1460; baseline -0.005 0"><span class='ocrx_word' id='word_1_110' title='bbox 760 1439 855 1460; x_wconf 88' lang='eng' dir='ltr'><em>Coxiella</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 864 1439 954 1460; x_wconf 88' lang='eng' dir='ltr'><em>burnetii</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_66' title="bbox 760 1482 1080 1508; baseline 0 -5"><span class='ocrx_word' id='word_1_112' title='bbox 760 1482 941 1508; x_wconf 75' lang='eng' dir='ltr'><em>Methy/ococcus</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 950 1482 1080 1508; x_wconf 85' lang='eng' dir='ltr'><em>capsulatus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 762 1525 1037 1545; baseline 0 0"><span class='ocrx_word' id='word_1_114' title='bbox 762 1525 934 1545; x_wconf 79' lang='eng' dir='ltr'><em>Alkali/imnicola</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 944 1525 1037 1545; x_wconf 83' lang='eng' dir='ltr'><em>ehrlichli</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 1161 1414 1320 1440">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 1161 1414 1320 1440">
+     <span class='ocr_line' id='line_1_68' title="bbox 1161 1414 1320 1440; baseline 0 -6"><span class='ocrx_word' id='word_1_116' title='bbox 1161 1414 1320 1440; x_wconf 69' lang='eng' dir='ltr'><em>Legions/lakes</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 1161 1510 1414 1536">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 1161 1510 1414 1536">
+     <span class='ocr_line' id='line_1_69' title="bbox 1161 1510 1414 1536; baseline 0 -6"><span class='ocrx_word' id='word_1_117' title='bbox 1161 1510 1363 1536; x_wconf 82' lang='eng' dir='ltr'><em>Methy/ococcales</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 1372 1510 1414 1530; x_wconf 79' lang='eng' dir='ltr'><em>and</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 760 1541 1381 1709">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 760 1541 1381 1709">
+     <span class='ocr_line' id='line_1_70' title="bbox 1162 1541 1322 1562; baseline 0 0"><span class='ocrx_word' id='word_1_119' title='bbox 1162 1541 1322 1562; x_wconf 87' lang='eng' dir='ltr'><em>Chromatlales</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 760 1566 1022 1586; baseline 0 0"><span class='ocrx_word' id='word_1_120' title='bbox 760 1566 932 1586; x_wconf 82' lang='eng' dir='ltr'><em>Nitrosococcus</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 941 1566 1022 1586; x_wconf 89' lang='eng' dir='ltr'><em>oceani</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_72' title="bbox 760 1609 1071 1634; baseline 0 -5"><span class='ocrx_word' id='word_1_122' title='bbox 760 1609 930 1629; x_wconf 83' lang='eng' dir='ltr'><em>Xanthomonas</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 940 1609 1071 1634; x_wconf 83' lang='eng' dir='ltr'><em>campestris</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_73' title="bbox 761 1629 1381 1672; baseline 0.002 -6"><span class='ocrx_word' id='word_1_124' title='bbox 761 1646 782 1666; x_wconf 93' lang='eng' dir='ltr'><em>X</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 780 1646 842 1672; x_wconf 86' lang='eng' dir='ltr'><em>ylella</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 851 1646 966 1667; x_wconf 83' lang='eng' dir='ltr'><em>fastidiosa</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 1159 1629 1381 1649; x_wconf 61' lang='eng' dir='ltr'><em>xanthomonadales</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_74' title="bbox 761 1685 1373 1709; baseline -0.007 0"><span class='ocrx_word' id='word_1_128' title='bbox 761 1689 930 1709; x_wconf 82' lang='eng' dir='ltr'><em>chhelobacter</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 936 1689 1039 1709; x_wconf 90' lang='eng' dir='ltr'><em>nodosus</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 1075 1700 1135 1702; x_wconf 96' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_131' title='bbox 1162 1685 1373 1706; x_wconf 81' lang='eng' dir='ltr'><em>Card/obacteriales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 759 1735 1310 1774">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 759 1735 1310 1774">
+     <span class='ocr_line' id='line_1_75' title="bbox 759 1735 1232 1757; baseline 0.004 -2"><span class='ocrx_word' id='word_1_132' title='bbox 759 1735 890 1755; x_wconf 83' lang='eng' dir='ltr'><em>Thiamicros</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 906 1735 935 1755; x_wconf 88' lang='eng' dir='ltr'><em>ira</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 945 1740 1012 1755; x_wconf 80' lang='eng' dir='ltr'><em>cruno</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 1029 1740 1073 1755; x_wconf 84' lang='eng' dir='ltr'><em>ena</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 1191 1754 1193 1757; x_wconf 97' lang='eng'>.</span> <span class='ocrx_word' id='word_1_137' title='bbox 1229 1754 1232 1757; x_wconf 93' lang='eng'><strong><em>.</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_76' title="bbox 890 1740 1310 1774; baseline 0.002 -1"><span class='ocrx_word' id='word_1_138' title='bbox 890 1740 905 1760; x_wconf 78' lang='eng' dir='ltr'><em>p</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 1013 1740 1027 1761; x_wconf 79' lang='eng' dir='ltr'><strong><em>g</em></strong></span> <span class='ocrx_word' id='word_1_140' title='bbox 1157 1754 1310 1774; x_wconf 78' lang='eng' dir='ltr'><em>Th/otrlchales</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 1128 887 1132 1799">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 1128 887 1132 1799">
+     <span class='ocr_line' id='line_1_77' title="bbox 1128 887 1132 1799; baseline 0 54"><span class='ocrx_word' id='word_1_141' title='bbox 1128 887 1132 1799; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 760 1782 1017 1803">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 760 1782 1017 1803">
+     <span class='ocr_line' id='line_1_78' title="bbox 760 1782 1017 1803; baseline 0.004 -1"><span class='ocrx_word' id='word_1_142' title='bbox 760 1782 891 1803; x_wconf 85' lang='eng' dir='ltr'><em>Francisella</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 901 1782 1017 1803; x_wconf 84' lang='eng' dir='ltr'><em>tularensis</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 760 1830 1047 1850">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 760 1830 1047 1850">
+     <span class='ocr_line' id='line_1_79' title="bbox 760 1830 1047 1850; baseline 0 0"><span class='ocrx_word' id='word_1_144' title='bbox 760 1830 792 1850; x_wconf 90' lang='eng' dir='ltr'><em>Ca</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 795 1830 909 1850; x_wconf 86' lang='eng' dir='ltr'><em>ulobacter</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 915 1830 1047 1850; x_wconf 85' lang='eng' dir='ltr'><em>crescentus</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002766-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002766-0-000.pbm.png
new file mode 100644
index 00000000..f5914238
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002766-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002766-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002766-0-000.pbm.png.hocr
new file mode 100644
index 00000000..6306f3b2
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002766-0-000.pbm.png.hocr
@@ -0,0 +1,164 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002766-0-000.pbm.png"; bbox 0 0 994 1049; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 87 360 124 378">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 87 360 124 378">
+     <span class='ocr_line' id='line_1_1' title="bbox 87 360 124 378; baseline 0.027 -1"><span class='ocrx_word' id='word_1_1' title='bbox 87 360 124 378; x_wconf 88' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 106 387 171 389">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 106 387 171 389">
+     <span class='ocr_line' id='line_1_2' title="bbox 106 387 171 389; baseline 0 660"><span class='ocrx_word' id='word_1_2' title='bbox 106 387 171 389; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 106 387 107 708">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 106 387 107 708">
+     <span class='ocr_line' id='line_1_3' title="bbox 106 387 107 708; baseline 0 341"><span class='ocrx_word' id='word_1_3' title='bbox 106 387 107 708; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 169 279 171 497">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 169 279 171 497">
+     <span class='ocr_line' id='line_1_4' title="bbox 169 279 171 497; baseline 0 552"><span class='ocrx_word' id='word_1_4' title='bbox 169 279 171 497; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 206 0 874 472">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 229 0 864 323">
+     <span class='ocr_line' id='line_1_5' title="bbox 230 0 864 28; baseline 0 -6"><span class='ocrx_word' id='word_1_5' title='bbox 230 0 370 28; x_wconf 82' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 380 0 573 28; x_wconf 82' lang='eng' dir='ltr'><em>borgpetersen/i</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 582 0 636 22; x_wconf 86' lang='eng' dir='ltr'>Mus</span> <span class='ocrx_word' id='word_1_8' title='bbox 648 0 694 22; x_wconf 83' lang='eng'><em>127</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 705 0 864 28; x_wconf 85' lang='eng' dir='ltr'><em>(AY631884)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 229 47 760 78; baseline -0.002 -6"><span class='ocrx_word' id='word_1_10' title='bbox 229 49 368 78; x_wconf 85' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 380 49 445 72; x_wconf 85' lang='eng' dir='ltr'><em>we/lii</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 453 47 591 72; x_wconf 80' lang='eng' dir='ltr'><em>CelledoniT</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 602 49 760 78; x_wconf 85' lang='eng' dir='ltr'><em>(AY631877)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 230 96 749 124; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 230 96 370 124; x_wconf 82' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 380 96 520 118; x_wconf 84' lang='eng' dir='ltr'><em>alexanderi</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 527 96 580 118; x_wconf 88' lang='eng' dir='ltr'><em>A23</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 591 96 749 124; x_wconf 83' lang='eng' dir='ltr'><em>(AY996803)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 229 144 802 175; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 229 147 368 175; x_wconf 74' lang='eng' dir='ltr'><em>Leptosp/&quot;ra</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 379 147 519 169; x_wconf 83' lang='eng' dir='ltr'><em>santarosai</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 528 147 561 169; x_wconf 95' lang='eng' dir='ltr'>LT</span> <span class='ocrx_word' id='word_1_21' title='bbox 571 144 633 169; x_wconf 89' lang='eng' dir='ltr'><em>821T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 643 147 802 175; x_wconf 81' lang='eng' dir='ltr'><em>(AY631883)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 229 195 779 226; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 229 197 369 226; x_wconf 82' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 379 197 492 226; x_wconf 89' lang='eng' dir='ltr'><em>noguchii</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 500 197 539 220; x_wconf 93' lang='eng' dir='ltr'><em>CZ</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 549 195 611 220; x_wconf 78' lang='eng' dir='ltr'><em>2‘14T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 621 197 779 226; x_wconf 87' lang='eng' dir='ltr'><em>(AY631886)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 231 243 787 274; baseline -0.002 -6"><span class='ocrx_word' id='word_1_28' title='bbox 231 246 370 274; x_wconf 81' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 381 246 531 274; x_wconf 86' lang='eng' dir='ltr'><em>interrogans</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 542 243 618 268; x_wconf 91' lang='eng' dir='ltr'><em>RGAT</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 629 246 787 274; x_wconf 86' lang='eng' dir='ltr'><em>(AY631894)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 233 292 790 323; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 233 295 372 323; x_wconf 79' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 382 295 513 317; x_wconf 84' lang='eng' dir='ltr'><em>kirschneri</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 521 292 622 317; x_wconf 71' lang='eng' dir='ltr'><em>3522C)T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 632 295 790 323; x_wconf 83' lang='eng' dir='ltr'><em>(AY631895)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 206 344 874 424">
+     <span class='ocr_line' id='line_1_12' title="bbox 206 344 874 372; baseline 0 -6"><span class='ocrx_word' id='word_1_36' title='bbox 206 353 213 354; x_wconf 41' lang='eng'><strong><em>*</em></strong></span> <span class='ocrx_word' id='word_1_37' title='bbox 230 344 369 372; x_wconf 87' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 379 344 589 372; x_wconf 82' lang='eng' dir='ltr'><em>genomospecies</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 602 344 610 366; x_wconf 91' lang='eng'>1</span> <span class='ocrx_word' id='word_1_40' title='bbox 625 344 702 366; x_wconf 80' lang='eng'><em>79601</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 716 344 874 372; x_wconf 80' lang='eng' dir='ltr'><em>(AY631881)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 206 393 817 424; baseline 0 -6"><span class='ocrx_word' id='word_1_42' title='bbox 206 402 213 404; x_wconf 74' lang='eng'>&#39;</span> <span class='ocrx_word' id='word_1_43' title='bbox 230 395 384 424; x_wconf 86' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 393 395 490 424; x_wconf 83' lang='eng' dir='ltr'><em>kmetyi</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 499 393 646 424; x_wconf 88' lang='eng' dir='ltr'><em>Bejo-lso9T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 654 395 817 424; x_wconf 88' lang='eng' dir='ltr'><em>(AB279549)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 206 440 815 471">
+     <span class='ocr_line' id='line_1_14' title="bbox 206 440 815 471; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 206 451 233 453; x_wconf 91' lang='eng'>—</span> <span class='ocrx_word' id='word_1_48' title='bbox 264 443 403 471; x_wconf 79' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 415 443 490 465; x_wconf 83' lang='eng' dir='ltr'><em>wolfﬁi</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 500 440 648 465; x_wconf 78' lang='eng' dir='ltr'><em>Khorat—HZT</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 659 443 815 471; x_wconf 88' lang='eng' dir='ltr'><em>(EF025496)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 176 389 202 407">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 176 389 202 407">
+     <span class='ocr_line' id='line_1_15' title="bbox 176 389 202 407; baseline 0 0"><span class='ocrx_word' id='word_1_52' title='bbox 176 389 202 407; x_wconf 87' lang='eng'><em>65</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 169 495 206 497">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 169 495 206 497">
+     <span class='ocr_line' id='line_1_16' title="bbox 169 495 206 497; baseline 0 552"><span class='ocrx_word' id='word_1_53' title='bbox 169 495 206 497; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 136 505 174 523">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 136 505 174 523">
+     <span class='ocr_line' id='line_1_17' title="bbox 136 505 174 523; baseline 0.026 -1"><span class='ocrx_word' id='word_1_54' title='bbox 136 505 174 523; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 171 549 208 567">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 171 549 208 567">
+     <span class='ocr_line' id='line_1_18' title="bbox 171 549 208 567; baseline 0 0"><span class='ocrx_word' id='word_1_55' title='bbox 171 549 208 567; x_wconf 91' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 204 280 208 539">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 204 280 208 539">
+     <span class='ocr_line' id='line_1_19' title="bbox 204 280 208 539; baseline 0 510"><span class='ocrx_word' id='word_1_56' title='bbox 204 280 208 539; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 256 538 994 719">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 261 539 766 570">
+     <span class='ocr_line' id='line_1_20' title="bbox 261 539 766 570; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 261 542 400 570; x_wconf 82' lang='eng' dir='ltr'><em>Leptosp/ra</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 411 542 510 564; x_wconf 84' lang='eng' dir='ltr'><em>broomi/</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 519 539 598 564; x_wconf 82' lang='eng' dir='ltr'><em>5399T</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 608 542 766 570; x_wconf 85' lang='eng' dir='ltr'><em>(AY796065)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 262 588 715 619">
+     <span class='ocr_line' id='line_1_21' title="bbox 262 588 715 619; baseline 0.002 -6"><span class='ocrx_word' id='word_1_61' title='bbox 262 591 402 619; x_wconf 86' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 412 591 493 614; x_wconf 85' lang='eng' dir='ltr'><em>inadai</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 503 588 547 614; x_wconf 81' lang='eng' dir='ltr'><em>10T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 557 591 715 619; x_wconf 82' lang='eng' dir='ltr'><em>(AY631896)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 256 641 994 718">
+     <span class='ocr_line' id='line_1_22' title="bbox 256 641 994 669; baseline -0.001 -6"><span class='ocrx_word' id='word_1_65' title='bbox 256 641 395 669; x_wconf 81' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 405 641 616 669; x_wconf 84' lang='eng' dir='ltr'><em>genomospecies</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 627 641 641 663; x_wconf 86' lang='eng'><em>3</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 651 641 714 663; x_wconf 89' lang='eng' dir='ltr'><em>WaZ</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 726 641 824 663; x_wconf 88' lang='eng' dir='ltr'>Holland</span> <span class='ocrx_word' id='word_1_70' title='bbox 836 641 994 669; x_wconf 81' lang='eng' dir='ltr'><em>(AY631897)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 256 687 776 718; baseline 0 -6"><span class='ocrx_word' id='word_1_71' title='bbox 256 690 395 718; x_wconf 83' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 406 689 491 712; x_wconf 83' lang='eng' dir='ltr'><em>biflexa</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 503 690 577 712; x_wconf 86' lang='eng' dir='ltr'><em>Patoc</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 589 687 607 712; x_wconf 98' lang='eng' dir='ltr'><em>|T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 618 690 776 718; x_wconf 85' lang='eng' dir='ltr'><em>(AY631876)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 194 490 760 604">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 194 490 760 604">
+     <span class='ocr_line' id='line_1_24' title="bbox 206 490 760 600; baseline 0.002 -86"><span class='ocrx_word' id='word_1_76' title='bbox 206 500 231 600; x_wconf 31' lang='eng' dir='ltr'><em>i</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 263 492 402 520; x_wconf 81' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 413 492 486 515; x_wconf 85' lang='eng' dir='ltr'><em>fainei</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 495 492 553 515; x_wconf 92' lang='eng' dir='ltr'>BUT</span> <span class='ocrx_word' id='word_1_80' title='bbox 562 490 591 515; x_wconf 72' lang='eng' dir='ltr'><em>EST</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 602 492 760 520; x_wconf 80' lang='eng' dir='ltr'><em>(AY631885)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 194 586 220 604; baseline 0 0"><span class='ocrx_word' id='word_1_82' title='bbox 194 586 220 604; x_wconf 87' lang='eng'>63</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 156 716 193 734">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 156 716 193 734">
+     <span class='ocr_line' id='line_1_26' title="bbox 156 716 193 734; baseline 0 0"><span class='ocrx_word' id='word_1_83' title='bbox 156 716 193 734; x_wconf 92' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 161 937 175 959">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 161 937 175 959">
+     <span class='ocr_line' id='line_1_27' title="bbox 161 937 175 959; baseline 0 0"><span class='ocrx_word' id='word_1_84' title='bbox 161 937 175 959; x_wconf 93' lang='eng' dir='ltr'><em>L</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 122 1003 169 1049">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 122 1003 169 1049">
+     <span class='ocr_line' id='line_1_28' title="bbox 122 1003 169 1026; baseline 0 0"><span class='ocrx_word' id='word_1_85' title='bbox 122 1003 169 1026; x_wconf 90' lang='eng' dir='ltr'><em>I—I</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 122 1030 168 1049; baseline -0.022 0"><span class='ocrx_word' id='word_1_86' title='bbox 122 1030 168 1049; x_wconf 86' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 210 736 966 917">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 211 737 966 916">
+     <span class='ocr_line' id='line_1_30' title="bbox 256 737 786 768; baseline 0 -6"><span class='ocrx_word' id='word_1_87' title='bbox 256 740 395 768; x_wconf 81' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 407 740 531 762; x_wconf 85' lang='eng' dir='ltr'><em>wolbachii</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 539 737 617 762; x_wconf 92' lang='eng' dir='ltr'><em>CDCT</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 627 740 786 768; x_wconf 82' lang='eng' dir='ltr'><em>(AY631879)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 231 775 947 817; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 231 775 237 793; x_wconf 66' lang='eng'>1</span> <span class='ocrx_word' id='word_1_92' title='bbox 263 788 402 817; x_wconf 78' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 412 788 622 817; x_wconf 86' lang='eng' dir='ltr'><em>genomospecies</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 632 789 648 811; x_wconf 89' lang='eng'>4</span> <span class='ocrx_word' id='word_1_95' title='bbox 660 788 692 811; x_wconf 97' lang='eng' dir='ltr'>LT</span> <span class='ocrx_word' id='word_1_96' title='bbox 704 788 777 811; x_wconf 81' lang='eng'><em>11-33</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 789 788 947 817; x_wconf 82' lang='eng' dir='ltr'><em>(AY631888)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 211 838 966 867; baseline -0.003 -5"><span class='ocrx_word' id='word_1_98' title='bbox 211 844 237 862; x_wconf 85' lang='eng'><em>64</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 264 838 403 866; x_wconf 78' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 413 838 623 867; x_wconf 82' lang='eng' dir='ltr'><em>genomospecies</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 634 838 648 860; x_wconf 93' lang='eng'>5</span> <span class='ocrx_word' id='word_1_102' title='bbox 660 838 711 860; x_wconf 85' lang='eng' dir='ltr'>Sao</span> <span class='ocrx_word' id='word_1_103' title='bbox 723 838 797 860; x_wconf 89' lang='eng' dir='ltr'>Paulo</span> <span class='ocrx_word' id='word_1_104' title='bbox 808 838 966 866; x_wconf 85' lang='eng' dir='ltr'><em>(AY631882)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 212 881 889 916; baseline 0 -6"><span class='ocrx_word' id='word_1_105' title='bbox 212 881 237 899; x_wconf 72' lang='eng'><em>84</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 264 888 403 916; x_wconf 81' lang='eng' dir='ltr'><em>Leptospira</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 414 888 505 916; x_wconf 84' lang='eng' dir='ltr'><em>meyeri</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 515 888 575 910; x_wconf 86' lang='eng' dir='ltr'><em>Iowa</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 586 887 636 916; x_wconf 85' lang='eng' dir='ltr'><em>City</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 648 885 721 916; x_wconf 82' lang='eng' dir='ltr'>FrogT</span> <span class='ocrx_word' id='word_1_111' title='bbox 731 888 889 916; x_wconf 83' lang='eng' dir='ltr'><em>(AY631878)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 177 936 641 966">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 177 937 641 965">
+     <span class='ocr_line' id='line_1_34' title="bbox 177 937 641 965; baseline 0 -6"><span class='ocrx_word' id='word_1_112' title='bbox 177 937 310 965; x_wconf 79' lang='eng' dir='ltr'><em>eptonema</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 320 937 371 959; x_wconf 81' lang='eng' dir='ltr'><em>iI/in/</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 381 937 471 959; x_wconf 87' lang='eng' dir='ltr'><em>Habaki</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 483 937 641 965; x_wconf 86' lang='eng' dir='ltr'><em>(AY996806)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002808-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002808-0-001.pbm.png
new file mode 100644
index 00000000..84653ed3
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002808-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002808-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002808-0-001.pbm.png.hocr
new file mode 100644
index 00000000..acbc4e95
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002808-0-001.pbm.png.hocr
@@ -0,0 +1,125 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002808-0-001.pbm.png"; bbox 0 0 2012 679; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 139 10 1305 622">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 139 22 1294 622">
+     <span class='ocr_line' id='line_1_1' title="bbox 1126 22 1284 89; baseline 0 -10"><span class='ocrx_word' id='word_1_1' title='bbox 1126 22 1284 89; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 1094 89 1245 114; baseline 0 565"><span class='ocrx_word' id='word_1_2' title='bbox 1094 89 1245 114; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 942 114 1228 145; baseline 0 534"><span class='ocrx_word' id='word_1_3' title='bbox 942 114 1228 145; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 800 145 1228 178; baseline 0 501"><span class='ocrx_word' id='word_1_4' title='bbox 800 145 1228 178; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 766 178 1225 214; baseline 0.004 -2"><span class='ocrx_word' id='word_1_5' title='bbox 766 178 1225 214; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 723 214 1223 255; baseline 0 424"><span class='ocrx_word' id='word_1_6' title='bbox 723 214 1223 255; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 723 255 1130 282; baseline 0 -1"><span class='ocrx_word' id='word_1_7' title='bbox 723 255 1130 282; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 279 282 1087 311; baseline 0 368"><span class='ocrx_word' id='word_1_8' title='bbox 279 282 1087 311; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 279 311 1087 346; baseline 0 333"><span class='ocrx_word' id='word_1_9' title='bbox 279 311 1087 346; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 279 346 1205 380; baseline 0 299"><span class='ocrx_word' id='word_1_10' title='bbox 279 346 1205 380; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 279 380 1294 415; baseline 0.004 -4"><span class='ocrx_word' id='word_1_11' title='bbox 279 380 1294 415; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 256 479 1086 513; baseline 0 -26"><span class='ocrx_word' id='word_1_12' title='bbox 256 479 1086 513; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 139 513 876 543; baseline 0 136"><span class='ocrx_word' id='word_1_13' title='bbox 139 513 876 543; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 161 543 876 578; baseline 0 101"><span class='ocrx_word' id='word_1_14' title='bbox 161 543 876 578; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 161 578 914 622; baseline 0 57"><span class='ocrx_word' id='word_1_15' title='bbox 161 578 914 622; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 876 3 2009 629">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 1191 3 2009 131">
+     <span class='ocr_line' id='line_1_16' title="bbox 1191 3 2009 32; baseline 0 -6"><span class='ocrx_word' id='word_1_16' title='bbox 1191 8 1216 26; x_wconf 92' lang='eng'><em>75</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1322 4 1479 26; x_wconf 81' lang='eng' dir='ltr'><em>Thiobacillus</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1489 3 1651 26; x_wconf 81' lang='eng' dir='ltr'><em>denitriﬁcans</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1660 3 1741 26; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1752 4 1835 26; x_wconf 89' lang='eng'>25259</span> <span class='ocrx_word' id='word_1_21' title='bbox 1847 3 2009 32; x_wconf 89' lang='eng' dir='ltr'><em>(CPOOO116)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 1271 36 1861 65; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 1271 37 1428 59; x_wconf 81' lang='eng' dir='ltr'><em>Thiobacillus</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 1438 36 1601 59; x_wconf 85' lang='eng' dir='ltr'><em>denitrificans</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 1611 37 1688 59; x_wconf 89' lang='eng' dir='ltr'>ME16</span> <span class='ocrx_word' id='word_1_25' title='bbox 1699 37 1861 65; x_wconf 90' lang='eng' dir='ltr'><em>(EU546130)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 1301 66 1881 98; baseline 0 -6"><span class='ocrx_word' id='word_1_26' title='bbox 1301 70 1459 92; x_wconf 87' lang='eng' dir='ltr'><em>Thiobacillus</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1469 70 1594 98; x_wconf 77' lang='eng' dir='ltr'><em>thioparus</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1605 69 1668 92; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1680 66 1743 92; x_wconf 89' lang='eng' dir='ltr'><em>505T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1753 70 1881 98; x_wconf 86' lang='eng' dir='ltr'><em>(M79426)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 1245 103 1787 131; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 1245 103 1403 125; x_wconf 88' lang='eng' dir='ltr'><em>Thiobacillus</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1413 103 1537 131; x_wconf 84' lang='eng' dir='ltr'><em>thioparus</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 1549 103 1616 125; x_wconf 89' lang='eng' dir='ltr'><em>LV43</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1628 103 1787 131; x_wconf 89' lang='eng' dir='ltr'><em>(AF005628)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 1230 136 1918 198">
+     <span class='ocr_line' id='line_1_20' title="bbox 1243 136 1918 164; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 1243 136 1400 158; x_wconf 79' lang='eng' dir='ltr'><em>Thiobacillus</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1410 136 1572 158; x_wconf 83' lang='eng' dir='ltr'><em>denitriﬁcans</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1583 136 1678 158; x_wconf 92' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1689 136 1754 158; x_wconf 83' lang='eng'><em>9548</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1767 136 1918 164; x_wconf 88' lang='eng' dir='ltr'><em>(AJ243144)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 1230 165 1851 198; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 1230 169 1404 192; x_wconf 89' lang='eng' dir='ltr'><em>Thiobacillus</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 1415 169 1559 198; x_wconf 86' lang='eng' dir='ltr'><em>thiophilus</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1570 165 1678 192; x_wconf 92' lang='eng' dir='ltr'><em>D24TNT</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1688 169 1851 197; x_wconf 86' lang='eng' dir='ltr'><em>(EU685841)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 1334 202 1783 230">
+     <span class='ocr_line' id='line_1_22' title="bbox 1334 202 1783 230; baseline 0 -5"><span class='ocrx_word' id='word_1_44' title='bbox 1334 202 1492 225; x_wconf 76' lang='eng' dir='ltr'><em>Thiobacillus</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1502 202 1647 230; x_wconf 86' lang='eng' dir='ltr'><em>aquaesu/is</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1657 202 1783 230; x_wconf 88' lang='eng' dir='ltr'><em>(U58019)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 1087 229 1928 463">
+     <span class='ocr_line' id='line_1_23' title="bbox 1223 229 1896 264; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 1223 229 1388 258; x_wconf 45' lang='eng' dir='ltr'><em>“Thiobacillus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 1396 230 1581 264; x_wconf 72' lang='eng' dir='ltr'><em>p/umbophi/us&#39;</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1588 235 1651 258; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1663 235 1728 258; x_wconf 86' lang='eng'>6690</span> <span class='ocrx_word' id='word_1_51' title='bbox 1740 235 1896 264; x_wconf 88' lang='eng' dir='ltr'><em>(AJ316618)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 1146 269 1695 297; baseline 0 -6"><span class='ocrx_word' id='word_1_52' title='bbox 1146 269 1370 297; x_wconf 81' lang='eng' dir='ltr'><em>Methyloversatilis</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1381 269 1524 291; x_wconf 82' lang='eng' dir='ltr'><em>universal/s</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 1534 269 1695 297; x_wconf 88' lang='eng' dir='ltr'><em>(AY436796)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 1087 298 1796 330; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 1087 302 1274 325; x_wconf 83' lang='eng' dir='ltr'><em>Denitratisoma</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 1284 302 1480 325; x_wconf 83' lang='eng' dir='ltr'><em>oestradiolicum</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 1489 298 1627 324; x_wconf 88' lang='eng' dir='ltr'><em>AcBE2—1T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1636 302 1796 330; x_wconf 86' lang='eng' dir='ltr'><em>(AY879297)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 1205 331 1810 364; baseline 0 -6"><span class='ocrx_word' id='word_1_59' title='bbox 1205 331 1423 358; x_wconf 66' lang='eng' dir='ltr'><em>‘Dech/oromonas</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 1432 331 1568 358; x_wconf 73' lang='eng' dir='ltr'><em>aromat/ca&#39;</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1577 335 1637 358; x_wconf 91' lang='eng' dir='ltr'><em>RCB</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1649 335 1810 364; x_wconf 87' lang='eng' dir='ltr'><em>(AY032610)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 1245 369 1704 397; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 1245 369 1419 397; x_wconf 87' lang='eng' dir='ltr'><em>Rhodocyc/us</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1428 374 1566 397; x_wconf 88' lang='eng' dir='ltr'><em>purpureus</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 1576 369 1704 397; x_wconf 84' lang='eng' dir='ltr'><em>(M34132)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 1312 398 1928 430; baseline 0 -6"><span class='ocrx_word' id='word_1_66' title='bbox 1312 402 1459 424; x_wconf 80' lang='eng' dir='ltr'><em>Thiomonas</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 1469 402 1572 424; x_wconf 75' lang='eng' dir='ltr'><em>delicate</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1584 403 1661 423; x_wconf 91' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1672 398 1759 423; x_wconf 90' lang='eng' dir='ltr'><em>14566T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1768 402 1928 430; x_wconf 82' lang='eng' dir='ltr'><em>(ABZ45481)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 1087 431 1701 463; baseline 0 -6"><span class='ocrx_word' id='word_1_71' title='bbox 1087 435 1300 457; x_wconf 79' lang='eng' dir='ltr'><em>Halothiobacillus</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1310 435 1324 457; x_wconf 93' lang='eng' dir='ltr'><em>h</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1326 435 1510 463; x_wconf 83' lang='eng' dir='ltr'><em>ydrothermalis</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 1520 431 1564 456; x_wconf 83' lang='eng' dir='ltr'><em>R3T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 1573 435 1701 463; x_wconf 86' lang='eng' dir='ltr'>(M90662)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 876 468 1739 596">
+     <span class='ocr_line' id='line_1_30' title="bbox 1100 468 1594 496; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 1100 468 1313 490; x_wconf 78' lang='eng' dir='ltr'><em>Halothiobaci/Ius</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1323 468 1459 496; x_wconf 89' lang='eng' dir='ltr'><em>halophilus</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 1469 468 1594 496; x_wconf 88' lang='eng' dir='ltr'><em>(U58020)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 1039 501 1739 529; baseline 0 -6"><span class='ocrx_word' id='word_1_79' title='bbox 1039 501 1251 523; x_wconf 81' lang='eng' dir='ltr'><em>Halothiobacillus</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1261 501 1434 529; x_wconf 82' lang='eng' dir='ltr'><em>neapolitanus</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 1445 501 1508 523; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 1521 501 1564 523; x_wconf 88' lang='eng'><em>581</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1580 501 1739 529; x_wconf 85' lang='eng' dir='ltr'><em>(AF173169)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 876 529 1597 562; baseline 0 -5"><span class='ocrx_word' id='word_1_84' title='bbox 876 534 1094 557; x_wconf 84' lang='eng' dir='ltr'><em>Acidithiobacillus</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1104 534 1251 557; x_wconf 86' lang='eng' dir='ltr'><em>albertensis</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1262 534 1325 557; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 1339 529 1432 557; x_wconf 89' lang='eng' dir='ltr'><em>14366T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 1441 533 1597 562; x_wconf 84' lang='eng' dir='ltr'><em>(AJ459804)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 915 567 1480 596; baseline 0 -6"><span class='ocrx_word' id='word_1_89' title='bbox 915 567 1133 590; x_wconf 85' lang='eng' dir='ltr'><em>Acidithiobaci/lus</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1143 567 1309 590; x_wconf 82' lang='eng' dir='ltr'><em>ferrooxidans</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1320 567 1480 596; x_wconf 81' lang='eng' dir='ltr'><em>(A3039820)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 928 595 1533 629">
+     <span class='ocr_line' id='line_1_34' title="bbox 928 595 1533 629; baseline 0 -6"><span class='ocrx_word' id='word_1_92' title='bbox 928 601 1145 623; x_wconf 80' lang='eng' dir='ltr'><em>AcidithiobaciI/us</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 1155 601 1242 623; x_wconf 88' lang='eng' dir='ltr'><em>caldus</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1253 600 1317 623; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 1329 595 1533 629; x_wconf 74' lang='eng' dir='ltr'><em>8584T(Z29975)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 250 403 275 421">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 250 403 275 421">
+     <span class='ocr_line' id='line_1_35' title="bbox 250 403 275 421; baseline 0 0"><span class='ocrx_word' id='word_1_96' title='bbox 250 403 275 421; x_wconf 86' lang='eng'>67</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 3 519 128 547">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 3 519 128 547">
+     <span class='ocr_line' id='line_1_36' title="bbox 3 519 128 547; baseline 0 -6"><span class='ocrx_word' id='word_1_97' title='bbox 3 519 128 547; x_wconf 78' lang='eng' dir='ltr'><em>Outgroup</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 489 640 546 662">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 489 640 546 662">
+     <span class='ocr_line' id='line_1_37' title="bbox 489 640 546 662; baseline 0 0"><span class='ocrx_word' id='word_1_98' title='bbox 489 640 546 662; x_wconf 87' lang='eng'><em>0.10</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002816-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002816-0-001.pbm.png
new file mode 100644
index 00000000..82b6b8f8
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002816-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002816-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002816-0-001.pbm.png.hocr
new file mode 100644
index 00000000..57e50ddd
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002816-0-001.pbm.png.hocr
@@ -0,0 +1,258 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002816-0-001.pbm.png"; bbox 0 0 1302 798; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 352 2 971 51">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 352 2 971 51">
+     <span class='ocr_line' id='line_1_1' title="bbox 352 2 971 51; baseline 0 -27"><span class='ocrx_word' id='word_1_1' title='bbox 352 12 416 51; x_wconf 48' lang='eng'><em>91&#39;:</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 423 3 562 24; x_wconf 82' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 570 4 647 30; x_wconf 75' lang='eng' dir='ltr'><em>ghoni/</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 655 3 743 24; x_wconf 91' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 755 3 845 24; x_wconf 78' lang='eng' dir='ltr'><em>10636T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 854 2 971 28; x_wconf 86' lang='eng' dir='ltr'>(X73451)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 316 38 988 65">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 316 38 988 65">
+     <span class='ocr_line' id='line_1_2' title="bbox 316 38 988 65; baseline -0.001 -4"><span class='ocrx_word' id='word_1_7' title='bbox 316 41 350 55; x_wconf 68' lang='eng'>‘00</span> <span class='ocrx_word' id='word_1_8' title='bbox 414 40 552 61; x_wconf 77' lang='eng' dir='ltr'><em>C/ostr/dium</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 562 41 657 61; x_wconf 78' lang='eng' dir='ltr'><em>sorde/lii</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 665 40 740 61; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 750 39 825 60; x_wconf 73' lang='eng' dir='ltr'><em>9714T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 834 38 944 65; x_wconf 89' lang='eng' dir='ltr'>(ABO757</span> <span class='ocrx_word' id='word_1_13' title='bbox 950 38 988 65; x_wconf 88' lang='eng'>71)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 355 31 357 85">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 355 31 357 85">
+     <span class='ocr_line' id='line_1_3' title="bbox 355 31 357 85; baseline 0 713"><span class='ocrx_word' id='word_1_14' title='bbox 355 31 357 85; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 358 86 444 88">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 358 86 444 88">
+     <span class='ocr_line' id='line_1_4' title="bbox 358 86 444 88; baseline 0 710"><span class='ocrx_word' id='word_1_15' title='bbox 358 86 444 88; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 175 152 258 154">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 175 152 258 154">
+     <span class='ocr_line' id='line_1_5' title="bbox 175 152 258 154; baseline 0 644"><span class='ocrx_word' id='word_1_16' title='bbox 175 152 258 154; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 256 90 258 216">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 256 90 258 216">
+     <span class='ocr_line' id='line_1_6' title="bbox 256 90 258 216; baseline 0 582"><span class='ocrx_word' id='word_1_17' title='bbox 256 90 258 216; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 256 214 323 216">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 256 214 323 216">
+     <span class='ocr_line' id='line_1_7' title="bbox 256 214 323 216; baseline 0 582"><span class='ocrx_word' id='word_1_18' title='bbox 256 214 323 216; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 321 196 323 234">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 321 196 323 234">
+     <span class='ocr_line' id='line_1_8' title="bbox 321 196 323 234; baseline 0 564"><span class='ocrx_word' id='word_1_19' title='bbox 321 196 323 234; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 85 57 1140 250">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 85 57 1140 250">
+     <span class='ocr_line' id='line_1_9' title="bbox 85 57 159 71; baseline 0 0"><span class='ocrx_word' id='word_1_20' title='bbox 85 57 159 71; x_wconf 69' lang='eng'><em>1—4</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 102 58 1035 125; baseline 0 -28"><span class='ocrx_word' id='word_1_21' title='bbox 102 72 138 86; x_wconf 77' lang='eng'><em>0-0‘</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 258 58 291 125; x_wconf 37' lang='eng'><em>&lt;{51</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 452 77 590 97; x_wconf 79' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 600 77 756 97; x_wconf 77' lang='eng' dir='ltr'><em>bifermentans</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 765 77 841 98; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 851 76 909 97; x_wconf 58' lang='eng' dir='ltr'><em>638T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 918 75 1035 101; x_wconf 85' lang='eng' dir='ltr'>(X75906)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 227 111 1027 149; baseline 0 -15"><span class='ocrx_word' id='word_1_28' title='bbox 227 134 250 149; x_wconf 70' lang='eng'><em>56</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 451 113 589 134; x_wconf 77' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 599 114 696 134; x_wconf 73' lang='eng' dir='ltr'><em>bart/ettfi</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 703 114 765 134; x_wconf 93' lang='eng' dir='ltr'>WAL</span> <span class='ocrx_word' id='word_1_32' title='bbox 776 112 865 134; x_wconf 81' lang='eng' dir='ltr'><em>16138T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 874 111 1027 138; x_wconf 86' lang='eng' dir='ltr'>(AY438672)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 443 148 984 176; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 443 150 581 170; x_wconf 78' lang='eng' dir='ltr'><em>C/ostridium</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 590 150 703 176; x_wconf 81' lang='eng' dir='ltr'><em>irregulare</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 713 150 771 170; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 783 149 857 170; x_wconf 73' lang='eng' dir='ltr'><em>2635T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 867 148 984 174; x_wconf 88' lang='eng' dir='ltr'><em>(X73447)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 150 184 1043 217; baseline 0 -10"><span class='ocrx_word' id='word_1_39' title='bbox 150 202 171 217; x_wconf 60' lang='eng'>74</span> <span class='ocrx_word' id='word_1_40' title='bbox 323 196 470 198; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_41' title='bbox 478 186 616 207; x_wconf 77' lang='eng' dir='ltr'><em>C/ostridium</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 626 187 710 207; x_wconf 60' lang='eng' dir='ltr'><em>diff/tile</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 720 186 796 207; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 806 185 880 207; x_wconf 69' lang='eng' dir='ltr'><em>9689T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 889 184 1043 211; x_wconf 88' lang='eng' dir='ltr'>(ABO75770)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 152 220 1140 250; baseline -0.001 -6"><span class='ocrx_word' id='word_1_46' title='bbox 152 220 174 222; x_wconf 77' lang='eng'>_</span> <span class='ocrx_word' id='word_1_47' title='bbox 293 222 315 236; x_wconf 70' lang='eng'>56</span> <span class='ocrx_word' id='word_1_48' title='bbox 323 232 534 234; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_49' title='bbox 542 223 680 244; x_wconf 82' lang='eng' dir='ltr'><em>C/ostridium</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 690 223 824 250; x_wconf 83' lang='eng' dir='ltr'><em>mangenotii</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 832 223 908 244; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 918 224 993 243; x_wconf 83' lang='eng'>25761</span> <span class='ocrx_word' id='word_1_53' title='bbox 1000 222 1009 234; x_wconf 67' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_54' title='bbox 1018 221 1140 248; x_wconf 84' lang='eng' dir='ltr'><em>(M59098)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 175 152 177 289">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 175 152 177 289">
+     <span class='ocr_line' id='line_1_15' title="bbox 175 152 177 289; baseline 0 509"><span class='ocrx_word' id='word_1_55' title='bbox 175 152 177 289; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 56 281 152 283">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 56 281 152 283">
+     <span class='ocr_line' id='line_1_16' title="bbox 56 281 152 283; baseline 0 515"><span class='ocrx_word' id='word_1_56' title='bbox 56 281 152 283; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 121 257 1275 323">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 121 257 1275 323">
+     <span class='ocr_line' id='line_1_17' title="bbox 121 257 1275 308; baseline 0 -28"><span class='ocrx_word' id='word_1_57' title='bbox 121 263 144 277; x_wconf 82' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 484 269 532 308; x_wconf 81' lang='eng' dir='ltr'><em>I:</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 539 260 783 286; x_wconf 74' lang='eng' dir='ltr'><em>Peptostreptococcus</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 792 260 925 280; x_wconf 81' lang='eng' dir='ltr'><em>anaerobius</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 936 259 1012 280; x_wconf 90' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1024 261 1030 280; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 1040 258 1113 280; x_wconf 84' lang='eng' dir='ltr'><em>1460T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1122 257 1275 284; x_wconf 85' lang='eng' dir='ltr'>(AY326462)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 446 293 1169 323; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 446 293 480 308; x_wconf 63' lang='eng'><em>‘00</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 534 296 776 323; x_wconf 79' lang='eng' dir='ltr'><em>Peptostreptococcus</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 787 296 887 317; x_wconf 74' lang='eng' dir='ltr'><em>stomatis</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 896 295 1000 317; x_wconf 87' lang='eng' dir='ltr'><em>W2278T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1009 294 1169 321; x_wconf 86' lang='eng' dir='ltr'>(DO160208)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 401 330 1036 359">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 401 330 1036 359">
+     <span class='ocr_line' id='line_1_19' title="bbox 401 330 1036 359; baseline 0 -6"><span class='ocrx_word' id='word_1_70' title='bbox 401 333 606 359; x_wconf 78' lang='eng' dir='ltr'><em>Sporacetigenium</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 616 333 763 359; x_wconf 82' lang='eng' dir='ltr'><em>mesophi/um</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 772 333 825 353; x_wconf 90' lang='eng' dir='ltr'><em>ZLJ1</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 835 334 841 353; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 850 332 873 353; x_wconf 75' lang='eng' dir='ltr'><em>5T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 883 330 1036 357; x_wconf 81' lang='eng' dir='ltr'>(AY682207)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 31 351 52 365">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 31 351 52 365">
+     <span class='ocr_line' id='line_1_20' title="bbox 31 351 52 365; baseline 0 0"><span class='ocrx_word' id='word_1_76' title='bbox 31 351 52 365; x_wconf 83' lang='eng'>79</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 113 367 1170 432">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 113 367 1170 432">
+     <span class='ocr_line' id='line_1_21' title="bbox 113 367 947 418; baseline -0.002 -27"><span class='ocrx_word' id='word_1_77' title='bbox 113 369 577 418; x_wconf 68' lang='eng' dir='ltr'><em>—100:C/OSMd/le</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 587 369 666 390; x_wconf 74' lang='eng' dir='ltr'><em>litora/e</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 677 369 735 390; x_wconf 82' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 746 368 820 389; x_wconf 79' lang='eng' dir='ltr'><em>5388T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 829 367 947 394; x_wconf 82' lang='eng' dir='ltr'><em>(X77845)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 488 404 1170 432; baseline 0 -6"><span class='ocrx_word' id='word_1_82' title='bbox 488 406 640 426; x_wconf 79' lang='eng' dir='ltr'><em>Eubacterium</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 650 406 856 432; x_wconf 76' lang='eng' dir='ltr'><em>acidaminophi/um</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 867 406 925 427; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 936 405 1011 426; x_wconf 74' lang='eng' dir='ltr'><em>3953T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1020 404 1138 430; x_wconf 94' lang='eng' dir='ltr'>(AFO7141</span> <span class='ocrx_word' id='word_1_87' title='bbox 1147 404 1170 430; x_wconf 86' lang='eng'><em>6)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 0 364 62 616">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 0 364 62 616">
+     <span class='ocr_line' id='line_1_23' title="bbox 0 364 62 474; baseline 0 0"><span class='ocrx_word' id='word_1_88' title='bbox 0 364 62 474; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 0 474 28 616; baseline 0 182"><span class='ocrx_word' id='word_1_89' title='bbox 0 474 28 616; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 56 281 58 458">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 56 281 58 458">
+     <span class='ocr_line' id='line_1_25' title="bbox 56 281 58 458; baseline 0 340"><span class='ocrx_word' id='word_1_90' title='bbox 56 281 58 458; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 56 456 112 458">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 56 456 112 458">
+     <span class='ocr_line' id='line_1_26' title="bbox 56 456 112 458; baseline 0 340"><span class='ocrx_word' id='word_1_91' title='bbox 56 456 112 458; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 238 440 1301 796">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 238 440 1301 505">
+     <span class='ocr_line' id='line_1_27' title="bbox 238 440 1301 469; baseline 0 -6"><span class='ocrx_word' id='word_1_92' title='bbox 238 443 812 467; x_wconf 74' lang='eng' dir='ltr'><em>99—Acidaminobacter</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 820 442 1046 469; x_wconf 75' lang='eng' dir='ltr'><em>hydrogenoformans</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1056 443 1090 469; x_wconf 90' lang='eng' dir='ltr'><em>glu</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 1101 440 1301 467; x_wconf 66' lang='eng' dir='ltr'>65T(AF016691)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 266 477 1208 505; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 266 489 593 491; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_97' title='bbox 600 479 729 499; x_wconf 78' lang='eng' dir='ltr'><em>Fusibacter</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 735 479 882 505; x_wconf 85' lang='eng' dir='ltr'><em>pauc/vorans</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 891 479 965 499; x_wconf 91' lang='eng' dir='ltr'><em>SEBR</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 974 480 1017 499; x_wconf 82' lang='eng'>421</span> <span class='ocrx_word' id='word_1_101' title='bbox 1027 478 1049 499; x_wconf 78' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 1058 477 1208 503; x_wconf 83' lang='eng' dir='ltr'><em>(AF050099)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 589 513 1223 542">
+     <span class='ocr_line' id='line_1_29' title="bbox 589 513 1223 542; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 589 516 787 542; x_wconf 77' lang='eng' dir='ltr'><em>Geosporobacter</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 795 516 952 536; x_wconf 84' lang='eng' dir='ltr'><em>subterraneus</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 961 514 1054 536; x_wconf 76' lang='eng' dir='ltr'><em>VN568T</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 1063 513 1223 540; x_wconf 82' lang='eng' dir='ltr'>(D0643978)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 539 550 1137 578">
+     <span class='ocr_line' id='line_1_30' title="bbox 539 550 1137 578; baseline 0 -6"><span class='ocrx_word' id='word_1_107' title='bbox 539 552 678 578; x_wconf 84' lang='eng' dir='ltr'><em>Alkaliphi/us</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 689 552 879 573; x_wconf 78' lang='eng' dir='ltr'><em>crotonatoxidans</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 890 552 918 572; x_wconf 88' lang='eng' dir='ltr'><em>B1</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 928 551 977 572; x_wconf 83' lang='eng' dir='ltr'><em>1—2T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 986 550 1075 576; x_wconf 87' lang='eng' dir='ltr'>(AF467</span> <span class='ocrx_word' id='word_1_112' title='bbox 1081 550 1137 576; x_wconf 85' lang='eng'><em>248)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 579 586 1107 613">
+     <span class='ocr_line' id='line_1_31' title="bbox 579 586 1107 613; baseline 0 -4"><span class='ocrx_word' id='word_1_113' title='bbox 579 588 717 609; x_wconf 78' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 727 589 843 609; x_wconf 78' lang='eng' dir='ltr'><em>fe/sineum</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 854 588 912 609; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 924 587 980 609; x_wconf 83' lang='eng' dir='ltr'><em>794T</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 989 586 1107 613; x_wconf 86' lang='eng' dir='ltr'>(X77851)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 624 623 1208 650">
+     <span class='ocr_line' id='line_1_32' title="bbox 624 623 1208 650; baseline 0 -5"><span class='ocrx_word' id='word_1_118' title='bbox 624 626 777 646; x_wconf 80' lang='eng' dir='ltr'><em>Natroninco/a</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 787 626 969 646; x_wconf 82' lang='eng' dir='ltr'><em>histidinovorans</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 979 624 1082 645; x_wconf 73' lang='eng' dir='ltr'><em>2—7940T</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 1091 623 1177 650; x_wconf 90' lang='eng' dir='ltr'>(Y1671</span> <span class='ocrx_word' id='word_1_122' title='bbox 1186 623 1208 650; x_wconf 86' lang='eng'>6)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 373 659 810 686">
+     <span class='ocr_line' id='line_1_33' title="bbox 373 659 810 686; baseline 0 -4"><span class='ocrx_word' id='word_1_123' title='bbox 373 662 511 682; x_wconf 81' lang='eng' dir='ltr'><em>Clostridium</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 520 662 642 682; x_wconf 81' lang='eng' dir='ltr'><em>stick/and/i</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 650 662 686 682; x_wconf 85' lang='eng' dir='ltr'><em>SR</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 696 659 810 686; x_wconf 87' lang='eng' dir='ltr'>(LO4167)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 365 696 909 724">
+     <span class='ocr_line' id='line_1_34' title="bbox 365 696 909 724; baseline 0 -5"><span class='ocrx_word' id='word_1_127' title='bbox 365 698 533 719; x_wconf 81' lang='eng' dir='ltr'><em>Proteocatella</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 543 698 666 724; x_wconf 88' lang='eng' dir='ltr'><em>sphenisci</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 675 697 752 719; x_wconf 90' lang='eng' dir='ltr'><em>PPP2T</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 761 696 909 723; x_wconf 89' lang='eng' dir='ltr'>(AF450134)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 616 733 1130 759">
+     <span class='ocr_line' id='line_1_35' title="bbox 616 733 1130 759; baseline 0 -4"><span class='ocrx_word' id='word_1_131' title='bbox 616 735 720 755; x_wconf 78' lang='eng' dir='ltr'><em>Filifactor</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 729 735 816 755; x_wconf 81' lang='eng' dir='ltr'><em>vi/losus</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 827 734 885 755; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 898 734 970 755; x_wconf 81' lang='eng' dir='ltr'><em>1645T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 980 733 1098 759; x_wconf 87' lang='eng' dir='ltr'><em>(AF53721</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 1108 733 1130 759; x_wconf 94' lang='eng'><em>1)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 624 769 1145 796">
+     <span class='ocr_line' id='line_1_36' title="bbox 624 769 1145 796; baseline -0.002 -4"><span class='ocrx_word' id='word_1_137' title='bbox 624 772 728 792; x_wconf 64' lang='eng' dir='ltr'><em>Fi/I&#39;factor</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 735 772 804 792; x_wconf 78' lang='eng' dir='ltr'><em>aloe/s</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 814 771 889 792; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 899 770 990 791; x_wconf 71' lang='eng' dir='ltr'><em>35896T</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 1000 769 1145 796; x_wconf 78' lang='eng' dir='ltr'>(AJ006962)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 81 463 104 478">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 81 463 104 478">
+     <span class='ocr_line' id='line_1_37' title="bbox 81 463 104 478; baseline 0 0"><span class='ocrx_word' id='word_1_142' title='bbox 81 463 104 478; x_wconf 84' lang='eng'><em>87</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 264 452 266 491">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 264 452 266 491">
+     <span class='ocr_line' id='line_1_38' title="bbox 264 452 266 491; baseline 0 307"><span class='ocrx_word' id='word_1_143' title='bbox 264 452 266 491; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 110 401 112 516">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 110 401 112 516">
+     <span class='ocr_line' id='line_1_39' title="bbox 110 401 112 516; baseline 0 282"><span class='ocrx_word' id='word_1_144' title='bbox 110 401 112 516; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 0 522 585 645">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 0 522 585 645">
+     <span class='ocr_line' id='line_1_40' title="bbox 205 522 585 536; baseline 0 262"><span class='ocrx_word' id='word_1_145' title='bbox 205 522 585 536; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 150 536 539 556; baseline 0 242"><span class='ocrx_word' id='word_1_146' title='bbox 150 536 539 556; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 150 556 539 592; baseline 0 206"><span class='ocrx_word' id='word_1_147' title='bbox 150 556 539 592; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 150 592 575 616; baseline 0 182"><span class='ocrx_word' id='word_1_148' title='bbox 150 592 575 616; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 0 616 328 645; baseline 0 -19"><span class='ocrx_word' id='word_1_149' title='bbox 0 616 328 645; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 150 220 153 557">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 150 220 153 557">
+     <span class='ocr_line' id='line_1_45' title="bbox 150 220 153 557; baseline 0 241"><span class='ocrx_word' id='word_1_150' title='bbox 150 220 153 557; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 0 616 617 766">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 0 616 617 766">
+     <span class='ocr_line' id='line_1_46' title="bbox 0 616 617 646; baseline -0.002 0"><span class='ocrx_word' id='word_1_151' title='bbox 0 616 617 646; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 0 646 369 682; baseline 0 116"><span class='ocrx_word' id='word_1_152' title='bbox 0 646 369 682; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 0 682 365 699; baseline 0 99"><span class='ocrx_word' id='word_1_153' title='bbox 0 682 365 699; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 0 699 363 738; baseline 0 60"><span class='ocrx_word' id='word_1_154' title='bbox 0 699 363 738; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 0 738 373 766; baseline 0 0"><span class='ocrx_word' id='word_1_155' title='bbox 0 738 363 766; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_156' title='bbox 369 739 373 766; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 328 623 361 638">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 328 623 361 638">
+     <span class='ocr_line' id='line_1_51' title="bbox 328 623 361 638; baseline 0 0"><span class='ocrx_word' id='word_1_157' title='bbox 328 623 361 638; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 335 746 369 760">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 335 746 369 760">
+     <span class='ocr_line' id='line_1_52' title="bbox 335 746 369 760; baseline 0 0"><span class='ocrx_word' id='word_1_158' title='bbox 335 746 369 760; x_wconf 90' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 374 746 376 784">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 374 746 376 784">
+     <span class='ocr_line' id='line_1_53' title="bbox 374 746 376 784; baseline 0 14"><span class='ocrx_word' id='word_1_159' title='bbox 374 746 376 784; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002873-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002873-0-000.pbm.png
new file mode 100644
index 00000000..c0ea48bc
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002873-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002873-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002873-0-000.pbm.png.hocr
new file mode 100644
index 00000000..15e8ae49
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002873-0-000.pbm.png.hocr
@@ -0,0 +1,250 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002873-0-000.pbm.png"; bbox 0 0 1231 1103; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 199 4 247 21">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 199 4 247 21">
+     <span class='ocr_line' id='line_1_1' title="bbox 199 4 247 21; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 199 4 247 21; x_wconf 87' lang='eng'>0.05</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 12 16 433 34">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 12 16 433 34">
+     <span class='ocr_line' id='line_1_2' title="bbox 12 16 433 34; baseline 0 1069"><span class='ocrx_word' id='word_1_2' title='bbox 12 16 433 34; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 135 57 1152 510">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 135 57 1152 510">
+     <span class='ocr_line' id='line_1_3' title="bbox 168 57 1152 88; baseline 0 -7"><span class='ocrx_word' id='word_1_3' title='bbox 168 69 193 85; x_wconf 75' lang='eng' dir='ltr'><em>e7</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 203 67 399 69; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_5' title='bbox 411 60 664 88; x_wconf 84' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 675 60 885 88; x_wconf 80' lang='eng' dir='ltr'><em>nitrogen/figens</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 894 59 961 81; x_wconf 82' lang='eng' dir='ltr'><em>Y88T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 970 57 1152 85; x_wconf 86' lang='eng' dir='ltr'>(DO448852)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 337 99 1066 130; baseline 0 -7"><span class='ocrx_word' id='word_1_9' title='bbox 337 102 591 130; x_wconf 86' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 602 99 1066 130; x_wconf 78' lang='eng' dir='ltr'><em>stygiumlFO16085T(A8025013)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 205 142 1138 196; baseline -0.001 -30"><span class='ocrx_word' id='word_1_11' title='bbox 205 152 283 196; x_wconf 47' lang='eng' dir='ltr'><em>gé‘:</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 294 144 549 172; x_wconf 80' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 559 142 1138 170; x_wconf 76' lang='eng' dir='ltr'><em>aromaticivoranleO16084T(ABOQ5012)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 182 183 1104 214; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 182 183 204 199; x_wconf 74' lang='eng'>5‘</span> <span class='ocrx_word' id='word_1_15' title='bbox 290 186 544 214; x_wconf 79' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 554 184 1104 212; x_wconf 74' lang='eng' dir='ltr'><em>subterraneumlFO16086T(ABOQ5014)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 368 226 1132 256; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 368 229 622 256; x_wconf 83' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 633 229 792 256; x_wconf 81' lang='eng' dir='ltr'><em>capsulatum</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 802 226 1132 254; x_wconf 83' lang='eng' dir='ltr'><em>GIFU11526T(D16147)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 191 268 1005 299; baseline 0 -7"><span class='ocrx_word' id='word_1_20' title='bbox 191 278 306 280; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_21' title='bbox 315 271 569 299; x_wconf 85' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 580 271 714 292; x_wconf 82' lang='eng' dir='ltr'><em>taihuense</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 723 270 823 292; x_wconf 75' lang='eng' dir='ltr'><em>T3—BQT</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 833 268 1005 297; x_wconf 85' lang='eng' dir='ltr'><em>(AY500142)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 335 311 1025 341; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 335 313 589 341; x_wconf 84' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 600 313 747 335; x_wconf 84' lang='eng' dir='ltr'><em>hassiacum</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 757 311 1025 339; x_wconf 85' lang='eng' dir='ltr'><em>W-51T(AJ416411)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 358 353 972 383; baseline 0 -6"><span class='ocrx_word' id='word_1_28' title='bbox 358 356 612 383; x_wconf 81' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 622 356 715 377; x_wconf 80' lang='eng' dir='ltr'><em>lentum</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 726 356 779 377; x_wconf 93' lang='eng' dir='ltr'><em>MT1</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 787 355 796 367; x_wconf 99' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 806 353 972 381; x_wconf 83' lang='eng' dir='ltr'><em>(AJ303009)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 340 395 1046 426; baseline 0 -7"><span class='ocrx_word' id='word_1_33' title='bbox 340 398 594 426; x_wconf 85' lang='eng' dir='ltr'><em>Novosphingob/um</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 605 398 760 426; x_wconf 83' lang='eng' dir='ltr'><em>tardaugens</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 769 397 860 419; x_wconf 91' lang='eng' dir='ltr'><em>ARI-1T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 870 395 1046 424; x_wconf 85' lang='eng' dir='ltr'><em>(ABO70237)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 319 438 971 467; baseline 0 -5"><span class='ocrx_word' id='word_1_37' title='bbox 319 440 585 467; x_wconf 88' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 595 440 711 462; x_wconf 88' lang='eng' dir='ltr'><em>indicum</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 723 439 791 462; x_wconf 87' lang='eng' dir='ltr'><em>H25T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 801 438 971 466; x_wconf 87' lang='eng' dir='ltr'><em>(EF549586)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 135 480 1127 510; baseline 0.001 -7"><span class='ocrx_word' id='word_1_41' title='bbox 135 490 299 492; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_42' title='bbox 310 482 564 510; x_wconf 85' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 572 482 833 510; x_wconf 76' lang='eng' dir='ltr'><em>pentaromativorans</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 844 482 928 504; x_wconf 69' lang='eng' dir='ltr'><em>USES-1</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 937 481 946 493; x_wconf 90' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 955 480 1127 508; x_wconf 77' lang='eng' dir='ltr'>(AF502400)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 201 67 203 111">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 201 67 203 111">
+     <span class='ocr_line' id='line_1_14' title="bbox 201 67 203 111; baseline 0 992"><span class='ocrx_word' id='word_1_47' title='bbox 201 67 203 111; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 189 204 211 206">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 189 204 211 206">
+     <span class='ocr_line' id='line_1_15' title="bbox 189 204 211 206; baseline 0 897"><span class='ocrx_word' id='word_1_48' title='bbox 189 204 211 206; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 46 185 333 665">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 46 185 333 665">
+     <span class='ocr_line' id='line_1_16' title="bbox 147 185 170 229; baseline 0 0"><span class='ocrx_word' id='word_1_49' title='bbox 147 185 170 229; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 69 229 315 314; baseline 0 -61"><span class='ocrx_word' id='word_1_50' title='bbox 69 229 315 314; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 46 314 333 525; baseline 0 0"><span class='ocrx_word' id='word_1_51' title='bbox 46 314 333 525; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 69 525 270 665; baseline 0 -13"><span class='ocrx_word' id='word_1_52' title='bbox 69 525 270 665; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 209 173 211 238">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 209 173 211 238">
+     <span class='ocr_line' id='line_1_20' title="bbox 209 173 211 238; baseline 0 865"><span class='ocrx_word' id='word_1_53' title='bbox 209 173 211 238; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 172 240 191 242">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 172 240 191 242">
+     <span class='ocr_line' id='line_1_21' title="bbox 172 240 191 242; baseline 0 861"><span class='ocrx_word' id='word_1_54' title='bbox 172 240 191 242; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 171 241 173 344">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 171 241 173 344">
+     <span class='ocr_line' id='line_1_22' title="bbox 171 241 173 344; baseline 0 759"><span class='ocrx_word' id='word_1_55' title='bbox 171 241 173 344; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 171 342 193 344">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 171 342 193 344">
+     <span class='ocr_line' id='line_1_23' title="bbox 171 342 193 344; baseline 0 759"><span class='ocrx_word' id='word_1_56' title='bbox 171 342 193 344; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 189 204 193 365">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 189 204 193 365">
+     <span class='ocr_line' id='line_1_24' title="bbox 189 204 193 365; baseline 0 738"><span class='ocrx_word' id='word_1_57' title='bbox 189 204 193 365; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 43 422 66 438">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 43 422 66 438">
+     <span class='ocr_line' id='line_1_25' title="bbox 43 422 66 438; baseline 0 0"><span class='ocrx_word' id='word_1_58' title='bbox 43 422 66 438; x_wconf 86' lang='eng'><em>81</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 116 469 135 471">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 116 469 135 471">
+     <span class='ocr_line' id='line_1_26' title="bbox 116 469 135 471; baseline 0 632"><span class='ocrx_word' id='word_1_59' title='bbox 116 469 135 471; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 135 522 1156 764">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 135 522 1156 764">
+     <span class='ocr_line' id='line_1_27' title="bbox 219 522 1108 576; baseline -0.002 -28"><span class='ocrx_word' id='word_1_60' title='bbox 219 532 276 576; x_wconf 64' lang='eng' dir='ltr'>1oo[</span> <span class='ocrx_word' id='word_1_61' title='bbox 287 524 541 552; x_wconf 81' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 551 524 723 546; x_wconf 86' lang='eng' dir='ltr'><em>resinovorum</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 734 524 833 546; x_wconf 88' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 844 522 1108 550; x_wconf 84' lang='eng' dir='ltr'><em>8767T(EF029110)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 282 564 936 594; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 282 567 536 594; x_wconf 82' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 546 567 717 588; x_wconf 79' lang='eng' dir='ltr'><em>subarcticum</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 728 564 936 593; x_wconf 86' lang='eng' dir='ltr'><em>KF1T(X94102)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 135 607 1072 637; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 135 617 220 619; x_wconf 90' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_69' title='bbox 231 609 485 637; x_wconf 82' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 496 609 753 637; x_wconf 70' lang='eng' dir='ltr'><em>naphtha/enivorans</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 762 607 1072 635; x_wconf 84' lang='eng' dir='ltr'><em>TUT562T(AB177883)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 277 649 920 679; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 277 652 531 679; x_wconf 83' lang='eng' dir='ltr'><em>Novosphingobium</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 541 658 599 673; x_wconf 85' lang='eng' dir='ltr'><em>rosa</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 610 652 659 673; x_wconf 94' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 673 649 920 677; x_wconf 87' lang='eng' dir='ltr'><em>14222T(D13945)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 279 691 1123 722; baseline 0 -7"><span class='ocrx_word' id='word_1_76' title='bbox 279 699 318 715; x_wconf 88' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 335 701 447 703; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_78' title='bbox 456 693 665 722; x_wconf 85' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 676 694 842 715; x_wconf 83' lang='eng' dir='ltr'><em>desiccab/Iis</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 852 691 1123 720; x_wconf 85' lang='eng' dir='ltr'><em>CP1DT(AJ871435)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 474 733 1156 764; baseline -0.001 -6"><span class='ocrx_word' id='word_1_81' title='bbox 474 735 683 764; x_wconf 85' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 693 736 871 758; x_wconf 87' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 882 735 965 758; x_wconf 89' lang='eng' dir='ltr'>DS-4T</span> <span class='ocrx_word' id='word_1_84' title='bbox 975 733 1044 762; x_wconf 80' lang='eng' dir='ltr'><em>(D01</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1055 737 1106 757; x_wconf 84' lang='eng'><em>789</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1113 734 1156 762; x_wconf 89' lang='eng'><em>75)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 116 469 118 587">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 116 469 118 587">
+     <span class='ocr_line' id='line_1_33' title="bbox 116 469 118 587; baseline 0 516"><span class='ocrx_word' id='word_1_87' title='bbox 116 469 118 587; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 116 585 135 587">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 116 585 135 587">
+     <span class='ocr_line' id='line_1_34' title="bbox 116 585 135 587; baseline 0 516"><span class='ocrx_word' id='word_1_88' title='bbox 116 585 135 587; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 133 448 135 618">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 133 448 135 618">
+     <span class='ocr_line' id='line_1_35' title="bbox 133 448 135 618; baseline 0 485"><span class='ocrx_word' id='word_1_89' title='bbox 133 448 135 618; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 48 443 50 756">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 48 443 50 756">
+     <span class='ocr_line' id='line_1_36' title="bbox 48 443 50 756; baseline 0 347"><span class='ocrx_word' id='word_1_90' title='bbox 48 443 50 756; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 333 701 335 745">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 333 701 335 745">
+     <span class='ocr_line' id='line_1_37' title="bbox 333 701 335 745; baseline -2393 22752"><span class='ocrx_word' id='word_1_91' title='bbox 333 701 335 745; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 126 870 128 915">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 126 870 128 915">
+     <span class='ocr_line' id='line_1_38' title="bbox 126 870 128 915; baseline -2392.5 26389"><span class='ocrx_word' id='word_1_92' title='bbox 126 870 128 915; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 20 764 1230 976">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 20 764 1230 976">
+     <span class='ocr_line' id='line_1_39' title="bbox 178 764 1230 806; baseline -0.001 -6"><span class='ocrx_word' id='word_1_93' title='bbox 178 764 217 781; x_wconf 64' lang='eng'><em>10°</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 469 778 678 806; x_wconf 83' lang='eng' dir='ltr'><em>Sphingomonas</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 688 778 840 800; x_wconf 85' lang='eng' dir='ltr'><em>ech/noides</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 850 776 1230 804; x_wconf 74' lang='eng' dir='ltr'><em>ATCC14820T(ABOQ1370)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 83 818 1018 852; baseline 0 -10"><span class='ocrx_word' id='word_1_97' title='bbox 83 836 108 852; x_wconf 74' lang='eng'><em>74</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 296 820 553 848; x_wconf 80' lang='eng' dir='ltr'><em>Altereryth/obacter</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 561 820 662 842; x_wconf 84' lang='eng' dir='ltr'><em>indicus</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 672 819 826 842; x_wconf 89' lang='eng' dir='ltr'><em>MSSRF26T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 836 818 1018 846; x_wconf 85' lang='eng' dir='ltr'><em>(DO399262)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 128 860 1025 891; baseline 0 -7"><span class='ocrx_word' id='word_1_102' title='bbox 128 863 583 891; x_wconf 81' lang='eng' dir='ltr'><em>—Altererythrobacter</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 591 863 701 884; x_wconf 85' lang='eng' dir='ltr'><em>Iuteolus</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 711 860 1025 888; x_wconf 85' lang='eng' dir='ltr'><em>SW—109T(AY739662)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 301 903 1089 933; baseline 0 -6"><span class='ocrx_word' id='word_1_105' title='bbox 301 905 558 933; x_wconf 82' lang='eng' dir='ltr'><em>Altererythrobacter</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 567 905 761 933; x_wconf 78' lang='eng' dir='ltr'><em>epoxidivorans</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 769 904 897 927; x_wconf 84' lang='eng' dir='ltr'><em>JCS350T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 907 903 1089 931; x_wconf 78' lang='eng'>(00304436)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 20 945 944 976; baseline -0.002 -5"><span class='ocrx_word' id='word_1_109' title='bbox 20 948 45 964; x_wconf 68' lang='eng'>72</span> <span class='ocrx_word' id='word_1_110' title='bbox 190 955 212 971; x_wconf 80' lang='eng'><em>91</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 226 947 552 976; x_wconf 85' lang='eng' dir='ltr'><em>—Erythrobacter</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 560 947 640 969; x_wconf 81' lang='eng' dir='ltr'><em>flavus</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 650 946 763 969; x_wconf 86' lang='eng' dir='ltr'><em>SW-46T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 773 945 944 973; x_wconf 90' lang='eng' dir='ltr'>(AF500004)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 184 976 226 978">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 184 976 226 978">
+     <span class='ocr_line' id='line_1_44' title="bbox 184 976 226 978; baseline -832.333 18623"><span class='ocrx_word' id='word_1_115' title='bbox 184 976 226 978; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 224 955 226 998">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 224 955 226 998">
+     <span class='ocr_line' id='line_1_45' title="bbox 224 955 226 998; baseline 0 105"><span class='ocrx_word' id='word_1_116' title='bbox 224 955 226 998; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 48 443 52 1020">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 48 443 52 1020">
+     <span class='ocr_line' id='line_1_46' title="bbox 48 443 52 1020; baseline -2392.75 16306"><span class='ocrx_word' id='word_1_117' title='bbox 48 443 52 1020; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 201 987 1125 1103">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 201 987 1125 1103">
+     <span class='ocr_line' id='line_1_47' title="bbox 241 987 822 1018; baseline 0 -7"><span class='ocrx_word' id='word_1_118' title='bbox 241 990 432 1018; x_wconf 80' lang='eng' dir='ltr'><em>Erythrobacter</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 440 990 532 1017; x_wconf 86' lang='eng' dir='ltr'><em>longus</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 543 987 822 1015; x_wconf 86' lang='eng' dir='ltr'><em>OCh101T(L017B6)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 320 1029 1060 1060; baseline 0 -7"><span class='ocrx_word' id='word_1_121' title='bbox 320 1032 537 1060; x_wconf 80' lang='eng' dir='ltr'><em>Porphyrobacter</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 545 1032 723 1053; x_wconf 84' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 734 1029 1060 1058; x_wconf 85' lang='eng' dir='ltr'><em>DSW—74T(DOO11529)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 201 1071 1125 1103; baseline -0.001 -7"><span class='ocrx_word' id='word_1_124' title='bbox 201 1071 227 1087; x_wconf 76' lang='eng'>99</span> <span class='ocrx_word' id='word_1_125' title='bbox 240 1081 349 1084; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_126' title='bbox 358 1074 575 1103; x_wconf 81' lang='eng' dir='ltr'><em>Porphyrobacter</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 583 1074 769 1096; x_wconf 84' lang='eng' dir='ltr'><em>neustonens/s</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 780 1073 844 1096; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 856 1073 940 1095; x_wconf 87' lang='eng' dir='ltr'>9434T</span> <span class='ocrx_word' id='word_1_130' title='bbox 949 1072 1094 1100; x_wconf 83' lang='eng' dir='ltr'><em>(AB03332</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 1101 1072 1125 1100; x_wconf 92' lang='eng'><em>7)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 50 1018 186 1020">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 50 1018 186 1020">
+     <span class='ocr_line' id='line_1_50' title="bbox 50 1018 186 1020; baseline 16.728 11520"><span class='ocrx_word' id='word_1_132' title='bbox 50 1018 186 1020; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 130 1028 169 1045">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 130 1028 169 1045">
+     <span class='ocr_line' id='line_1_51' title="bbox 130 1028 169 1045; baseline 0.026 -1"><span class='ocrx_word' id='word_1_133' title='bbox 130 1028 169 1045; x_wconf 93' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 241 1039 311 1041">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 241 1039 311 1041">
+     <span class='ocr_line' id='line_1_52' title="bbox 241 1039 311 1041; baseline 0 62"><span class='ocrx_word' id='word_1_134' title='bbox 241 1039 311 1041; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 184 976 186 1062">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 184 976 186 1062">
+     <span class='ocr_line' id='line_1_53' title="bbox 184 976 186 1062; baseline 0 41"><span class='ocrx_word' id='word_1_135' title='bbox 184 976 186 1062; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 184 1060 241 1062">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 184 1060 241 1062">
+     <span class='ocr_line' id='line_1_54' title="bbox 184 1060 241 1062; baseline -668.07 18539"><span class='ocrx_word' id='word_1_136' title='bbox 184 1060 241 1062; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 239 1039 241 1083">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 239 1039 241 1083">
+     <span class='ocr_line' id='line_1_55' title="bbox 239 1039 241 1083; baseline -2393 -14776"><span class='ocrx_word' id='word_1_137' title='bbox 239 1039 241 1083; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002881-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002881-0-000.pbm.png
new file mode 100644
index 00000000..e7ebfcc1
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002881-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002881-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002881-0-000.pbm.png.hocr
new file mode 100644
index 00000000..ca0afff1
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002881-0-000.pbm.png.hocr
@@ -0,0 +1,551 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002881-0-000.pbm.png"; bbox 0 0 1657 2107; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 6 1360 8 2085">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 6 1360 8 2085">
+     <span class='ocr_line' id='line_1_1' title="bbox 6 1360 8 2085; baseline 0 22"><span class='ocrx_word' id='word_1_1' title='bbox 6 1360 8 2085; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 165 168 211 187">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 165 168 211 187">
+     <span class='ocr_line' id='line_1_2' title="bbox 165 168 211 187; baseline -0.022 0"><span class='ocrx_word' id='word_1_2' title='bbox 165 168 211 187; x_wconf 88' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 366 657 391 659">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 366 657 391 659">
+     <span class='ocr_line' id='line_1_3' title="bbox 366 657 391 659; baseline 0 1448"><span class='ocrx_word' id='word_1_3' title='bbox 366 657 391 659; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 390 569 391 746">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 390 569 391 746">
+     <span class='ocr_line' id='line_1_4' title="bbox 390 569 391 746; baseline 0 1361"><span class='ocrx_word' id='word_1_4' title='bbox 390 569 391 746; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 348 808 368 810">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 348 808 368 810">
+     <span class='ocr_line' id='line_1_5' title="bbox 348 808 368 810; baseline 0 1297"><span class='ocrx_word' id='word_1_5' title='bbox 348 808 368 810; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 366 657 368 963">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 366 657 368 963">
+     <span class='ocr_line' id='line_1_6' title="bbox 366 657 368 963; baseline 0 1144"><span class='ocrx_word' id='word_1_6' title='bbox 366 657 368 963; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 600 348 625 366">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 600 348 625 366">
+     <span class='ocr_line' id='line_1_7' title="bbox 600 348 625 366; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 600 348 625 366; x_wconf 88' lang='eng'>72</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 731 9 1575 261">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 731 9 1575 261">
+     <span class='ocr_line' id='line_1_8' title="bbox 831 9 1512 38; baseline 0 -6"><span class='ocrx_word' id='word_1_8' title='bbox 831 17 856 35; x_wconf 88' lang='eng'>73</span> <span class='ocrx_word' id='word_1_9' title='bbox 871 9 1032 32; x_wconf 81' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 1043 9 1151 32; x_wconf 85' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1162 9 1272 38; x_wconf 89' lang='eng' dir='ltr'><em>euplotis’</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1285 9 1345 32; x_wconf 90' lang='eng' dir='ltr'><em>L|V5</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1356 9 1512 38; x_wconf 91' lang='eng' dir='ltr'><em>(AJ548825)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 808 20 1495 133; baseline 0 -45"><span class='ocrx_word' id='word_1_14' title='bbox 808 20 1032 133; x_wconf 30' lang='eng' dir='ltr'><em>1°04‘Candidatus</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1043 65 1151 88; x_wconf 88' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 1162 65 1272 94; x_wconf 88' lang='eng' dir='ltr'><em>euplotis’</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1284 65 1328 88; x_wconf 89' lang='eng' dir='ltr'>co</span> <span class='ocrx_word' id='word_1_18' title='bbox 1340 65 1495 94; x_wconf 89' lang='eng' dir='ltr'>(AJ548823)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 731 121 1575 151; baseline 0 -7"><span class='ocrx_word' id='word_1_19' title='bbox 731 138 739 140; x_wconf 86' lang='eng'><strong>_</strong></span> <span class='ocrx_word' id='word_1_20' title='bbox 865 121 1026 144; x_wconf 80' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1037 122 1145 144; x_wconf 85' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 1155 121 1266 150; x_wconf 83' lang='eng' dir='ltr'><em>euplotis’</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 1277 121 1407 144; x_wconf 91' lang='eng' dir='ltr'><em>CAMP4.4</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 1418 121 1575 151; x_wconf 89' lang='eng' dir='ltr'><em>(AJ548824)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 856 174 1370 205; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 856 177 966 199; x_wconf 85' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 976 177 1023 199; x_wconf 89' lang='eng' dir='ltr'><em>Iimi</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1032 176 1095 199; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1106 174 1204 199; x_wconf 89' lang='eng' dir='ltr'><em>22951T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1214 176 1370 205; x_wconf 87' lang='eng' dir='ltr'>(AJ786801)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 836 230 1314 261; baseline 0 -6"><span class='ocrx_word' id='word_1_30' title='bbox 836 232 946 255; x_wconf 87' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 956 232 1090 261; x_wconf 86' lang='eng' dir='ltr'><em>neptuniae</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1099 232 1125 255; x_wconf 90' lang='eng' dir='ltr'>J1</span> <span class='ocrx_word' id='word_1_33' title='bbox 1132 230 1144 245; x_wconf 79' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_34' title='bbox 1155 232 1314 261; x_wconf 89' lang='eng' dir='ltr'>(AF469072)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 783 285 1450 373">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 783 285 1450 373">
+     <span class='ocr_line' id='line_1_13' title="bbox 841 285 1450 317; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 841 288 950 311; x_wconf 87' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 961 288 1127 317; x_wconf 87' lang='eng' dir='ltr'><em>subaequoris</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1138 285 1272 311; x_wconf 88' lang='eng' dir='ltr'><em>HST3-14T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1283 288 1450 317; x_wconf 88' lang='eng' dir='ltr'>(AM293857)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 783 341 1409 373; baseline 0.002 -7"><span class='ocrx_word' id='word_1_39' title='bbox 783 354 820 356; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_40' title='bbox 831 344 940 367; x_wconf 86' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 951 344 1089 367; x_wconf 84' lang='eng' dir='ltr'><em>riboﬂavina</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1099 344 1182 367; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1193 341 1273 367; x_wconf 89' lang='eng' dir='ltr'><em>9526T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1283 344 1409 373; x_wconf 91' lang='eng' dir='ltr'>(D49423)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 739 89 741 188">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 739 89 741 188">
+     <span class='ocr_line' id='line_1_15' title="bbox 739 89 741 188; baseline 0 1919"><span class='ocrx_word' id='word_1_45' title='bbox 739 89 741 188; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 741 187 845 188">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 741 187 845 188">
+     <span class='ocr_line' id='line_1_16' title="bbox 741 187 845 188; baseline 0 1919"><span class='ocrx_word' id='word_1_46' title='bbox 741 187 845 188; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 703 190 731 192">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 703 190 731 192">
+     <span class='ocr_line' id='line_1_17' title="bbox 703 190 731 192; baseline 0 1915"><span class='ocrx_word' id='word_1_47' title='bbox 703 190 731 192; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 729 138 731 244">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 729 138 731 244">
+     <span class='ocr_line' id='line_1_18' title="bbox 729 138 731 244; baseline 0 1863"><span class='ocrx_word' id='word_1_48' title='bbox 729 138 731 244; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 731 242 826 244">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 731 242 826 244">
+     <span class='ocr_line' id='line_1_19' title="bbox 731 242 826 244; baseline 0 1863"><span class='ocrx_word' id='word_1_49' title='bbox 731 242 826 244; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 665 234 691 252">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 665 234 691 252">
+     <span class='ocr_line' id='line_1_20' title="bbox 665 234 691 252; baseline 0 0"><span class='ocrx_word' id='word_1_50' title='bbox 665 234 691 252; x_wconf 87' lang='eng'>98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 725 298 830 300">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 725 298 830 300">
+     <span class='ocr_line' id='line_1_21' title="bbox 725 298 830 300; baseline 0 1807"><span class='ocrx_word' id='word_1_51' title='bbox 725 298 830 300; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 703 190 705 342">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 703 190 705 342">
+     <span class='ocr_line' id='line_1_22' title="bbox 703 190 705 342; baseline 0 1765"><span class='ocrx_word' id='word_1_52' title='bbox 703 190 705 342; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 723 298 725 384">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 723 298 725 384">
+     <span class='ocr_line' id='line_1_23' title="bbox 723 298 725 384; baseline 0 1723"><span class='ocrx_word' id='word_1_53' title='bbox 723 298 725 384; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 616 379 774 384">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 616 379 774 384">
+     <span class='ocr_line' id='line_1_24' title="bbox 616 379 774 384; baseline 0 1723"><span class='ocrx_word' id='word_1_54' title='bbox 616 379 774 384; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 578 447 604 465">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 578 447 604 465">
+     <span class='ocr_line' id='line_1_25' title="bbox 578 447 604 465; baseline 0 0"><span class='ocrx_word' id='word_1_55' title='bbox 578 447 604 465; x_wconf 90' lang='eng'><strong>99</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 484 538 522 556">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 484 538 522 556">
+     <span class='ocr_line' id='line_1_26' title="bbox 484 538 522 556; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 484 538 522 556; x_wconf 92' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 616 379 617 579">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 616 379 617 579">
+     <span class='ocr_line' id='line_1_27' title="bbox 616 379 617 579; baseline 0 1528"><span class='ocrx_word' id='word_1_57' title='bbox 616 379 617 579; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 533 478 535 663">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 533 478 535 663">
+     <span class='ocr_line' id='line_1_28' title="bbox 533 478 535 663; baseline 0 1444"><span class='ocrx_word' id='word_1_58' title='bbox 533 478 535 663; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 601 633 602 691">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 601 633 602 691">
+     <span class='ocr_line' id='line_1_29' title="bbox 601 633 602 691; baseline 0 1416"><span class='ocrx_word' id='word_1_59' title='bbox 601 633 602 691; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 563 676 589 694">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 563 676 589 694">
+     <span class='ocr_line' id='line_1_30' title="bbox 563 676 589 694; baseline 0 0"><span class='ocrx_word' id='word_1_60' title='bbox 563 676 589 694; x_wconf 87' lang='eng'><em>96</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 422 862 716 879">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 422 862 716 879">
+     <span class='ocr_line' id='line_1_31' title="bbox 422 862 716 879; baseline 0 -4"><span class='ocrx_word' id='word_1_61' title='bbox 422 862 716 879; x_wconf 71' lang='eng'><em>—.</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 366 961 422 963">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 366 961 422 963">
+     <span class='ocr_line' id='line_1_32' title="bbox 366 961 422 963; baseline 0 -88"><span class='ocrx_word' id='word_1_62' title='bbox 366 961 422 963; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 383 976 409 994">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 383 976 409 994">
+     <span class='ocr_line' id='line_1_33' title="bbox 383 976 409 994; baseline 0 0"><span class='ocrx_word' id='word_1_63' title='bbox 383 976 409 994; x_wconf 87' lang='eng'>75</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 323 999 350 1001">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 323 999 350 1001">
+     <span class='ocr_line' id='line_1_34' title="bbox 323 999 350 1001; baseline 0 1106"><span class='ocrx_word' id='word_1_64' title='bbox 323 999 350 1001; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 291 1122 325 1124">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 291 1122 325 1124">
+     <span class='ocr_line' id='line_1_35' title="bbox 291 1122 325 1124; baseline 0 983"><span class='ocrx_word' id='word_1_65' title='bbox 291 1122 325 1124; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 348 808 350 1192">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 348 808 350 1192">
+     <span class='ocr_line' id='line_1_36' title="bbox 348 808 350 1192; baseline 0 915"><span class='ocrx_word' id='word_1_66' title='bbox 348 808 350 1192; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 323 999 326 1248">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 323 999 326 1248">
+     <span class='ocr_line' id='line_1_37' title="bbox 323 999 326 1248; baseline 0 859"><span class='ocrx_word' id='word_1_67' title='bbox 323 999 326 1248; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 291 1122 293 1600">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 291 1122 293 1600">
+     <span class='ocr_line' id='line_1_38' title="bbox 291 1122 293 1600; baseline 0 507"><span class='ocrx_word' id='word_1_68' title='bbox 291 1122 293 1600; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 361 1613 399 1632">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 361 1613 399 1632">
+     <span class='ocr_line' id='line_1_39' title="bbox 361 1613 399 1632; baseline 0 0"><span class='ocrx_word' id='word_1_69' title='bbox 361 1613 399 1632; x_wconf 91' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 411 1421 413 1778">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 411 1421 413 1778">
+     <span class='ocr_line' id='line_1_40' title="bbox 411 1421 413 1778; baseline 0 329"><span class='ocrx_word' id='word_1_70' title='bbox 411 1421 413 1778; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 744 374 1320 429">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 744 374 1320 429">
+     <span class='ocr_line' id='line_1_41' title="bbox 774 374 792 392; baseline 0 0"><span class='ocrx_word' id='word_1_71' title='bbox 774 374 792 392; x_wconf 76' lang='eng' dir='ltr'><strong><em>o</em></strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 744 397 1320 429; baseline -0.002 -6"><span class='ocrx_word' id='word_1_72' title='bbox 744 397 770 415; x_wconf 81' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 783 410 837 412; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_74' title='bbox 847 400 957 423; x_wconf 87' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 968 400 1014 423; x_wconf 87' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1023 397 1142 423; x_wconf 90' lang='eng' dir='ltr'><em>GH2—10T</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1153 399 1320 429; x_wconf 87' lang='eng' dir='ltr'><em>(DQ303125)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 781 354 783 412">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 781 354 783 412">
+     <span class='ocr_line' id='line_1_43' title="bbox 781 354 783 412; baseline 0 1695"><span class='ocrx_word' id='word_1_78' title='bbox 781 354 783 412; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 637 265 639 495">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 637 265 639 495">
+     <span class='ocr_line' id='line_1_44' title="bbox 637 265 639 495; baseline 0 1612"><span class='ocrx_word' id='word_1_79' title='bbox 637 265 639 495; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 639 455 1608 875">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 708 455 1526 763">
+     <span class='ocr_line' id='line_1_45' title="bbox 760 455 1428 484; baseline 0 -6"><span class='ocrx_word' id='word_1_80' title='bbox 760 466 805 467; x_wconf 38' lang='eng' dir='ltr'><em>i</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 824 455 940 478; x_wconf 86' lang='eng' dir='ltr'><em>‘Devosia</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 950 455 1115 484; x_wconf 80' lang='eng' dir='ltr'><em>ginsengisolf</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1127 455 1195 478; x_wconf 86' lang='eng' dir='ltr'>Gsoil</span> <span class='ocrx_word' id='word_1_84' title='bbox 1206 455 1255 478; x_wconf 84' lang='eng'><em>326</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1266 455 1428 484; x_wconf 91' lang='eng' dir='ltr'>(AB271045)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 708 508 1307 540; baseline 0 -6"><span class='ocrx_word' id='word_1_86' title='bbox 708 508 746 527; x_wconf 76' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 760 521 792 523; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_88' title='bbox 811 511 920 534; x_wconf 88' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 930 511 1027 534; x_wconf 86' lang='eng' dir='ltr'><em>insulae</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1038 508 1136 534; x_wconf 88' lang='eng' dir='ltr'><em>DS-56T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1147 511 1307 540; x_wconf 88' lang='eng' dir='ltr'>(EF012357)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 771 564 1332 596; baseline 0 -6"><span class='ocrx_word' id='word_1_92' title='bbox 771 567 880 590; x_wconf 83' lang='eng' dir='ltr'><em>Devosia</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 890 567 1020 596; x_wconf 88' lang='eng' dir='ltr'><em>geojensis</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1031 564 1161 590; x_wconf 91' lang='eng' dir='ltr'><em>BD-c194T</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 1172 566 1332 596; x_wconf 89' lang='eng' dir='ltr'>(EF575560)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 896 620 1526 652; baseline -0.002 -6"><span class='ocrx_word' id='word_1_96' title='bbox 896 623 1087 646; x_wconf 83' lang='eng' dir='ltr'><em>Cucumibacter</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 1094 623 1203 646; x_wconf 89' lang='eng' dir='ltr'><em>marinus</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1213 620 1355 646; x_wconf 89' lang='eng' dir='ltr'><em>CL-GR60T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1366 623 1443 652; x_wconf 90' lang='eng' dir='ltr'>(EF21</span> <span class='ocrx_word' id='word_1_100' title='bbox 1451 623 1526 652; x_wconf 90' lang='eng'><em>1830)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 951 677 1358 708; baseline 0 -6"><span class='ocrx_word' id='word_1_101' title='bbox 951 679 1036 702; x_wconf 89' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 1048 677 1188 702; x_wconf 91' lang='eng' dir='ltr'><em>CL-SK30T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 1199 679 1358 708; x_wconf 86' lang='eng' dir='ltr'>(EF988631)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 801 732 1489 763; baseline 0 -6"><span class='ocrx_word' id='word_1_104' title='bbox 801 734 1038 757; x_wconf 88' lang='eng' dir='ltr'><em>Ancalomicrob/um</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1048 734 1149 757; x_wconf 88' lang='eng' dir='ltr'><em>adetum</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 1161 734 1226 757; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 1236 732 1317 757; x_wconf 90' lang='eng' dir='ltr'><em>4722T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1328 734 1489 763; x_wconf 88' lang='eng' dir='ltr'>(ABO95950)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 744 787 1608 819">
+     <span class='ocr_line' id='line_1_51' title="bbox 744 787 1608 819; baseline 0.001 -7"><span class='ocrx_word' id='word_1_109' title='bbox 744 797 782 815; x_wconf 83' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 817 790 1056 819; x_wconf 86' lang='eng' dir='ltr'><em>Angulomicrobium</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 1066 790 1243 813; x_wconf 84' lang='eng' dir='ltr'><em>amanitiforme</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 1254 790 1350 813; x_wconf 93' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 1363 787 1442 813; x_wconf 88' lang='eng' dir='ltr'><em>1785T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1452 790 1608 819; x_wconf 89' lang='eng' dir='ltr'>(AJ535709)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 707 800 1544 875">
+     <span class='ocr_line' id='line_1_52' title="bbox 707 800 1544 875; baseline 0 -7"><span class='ocrx_word' id='word_1_115' title='bbox 707 800 804 858; x_wconf 26' lang='eng' dir='ltr'><strong><em>A</em></strong></span> <span class='ocrx_word' id='word_1_116' title='bbox 815 846 1054 875; x_wconf 87' lang='eng' dir='ltr'><em>Angulomicrobium</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1065 846 1210 868; x_wconf 82' lang='eng' dir='ltr'><em>tetraedrale</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 1221 845 1286 868; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 1297 843 1377 868; x_wconf 90' lang='eng' dir='ltr'><em>5895T</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 1388 845 1544 875; x_wconf 89' lang='eng' dir='ltr'>(AJ535708)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 864 899 1523 931">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 864 899 1523 931">
+     <span class='ocr_line' id='line_1_53' title="bbox 864 899 1523 931; baseline -0.002 -6"><span class='ocrx_word' id='word_1_121' title='bbox 864 902 1082 931; x_wconf 87' lang='eng' dir='ltr'><em>Methylorhabdus</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 1091 902 1248 925; x_wconf 89' lang='eng' dir='ltr'><em>multivorans</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 1259 899 1352 925; x_wconf 89' lang='eng' dir='ltr'><em>DM13T</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 1363 902 1523 931; x_wconf 91' lang='eng' dir='ltr'>(AF004845)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 758 466 760 523">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 758 466 760 523">
+     <span class='ocr_line' id='line_1_54' title="bbox 758 466 760 523; baseline 0 1584"><span class='ocrx_word' id='word_1_125' title='bbox 758 466 760 523; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 655 839 693 857">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 655 839 693 857">
+     <span class='ocr_line' id='line_1_55' title="bbox 655 839 693 857; baseline 0 0"><span class='ocrx_word' id='word_1_126' title='bbox 655 839 693 857; x_wconf 90' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 705 828 707 914">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 705 828 707 914">
+     <span class='ocr_line' id='line_1_56' title="bbox 705 828 707 914; baseline 0 1193"><span class='ocrx_word' id='word_1_127' title='bbox 705 828 707 914; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 609 955 1352 986">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 609 955 1352 986">
+     <span class='ocr_line' id='line_1_57' title="bbox 609 955 1352 986; baseline 0 -6"><span class='ocrx_word' id='word_1_128' title='bbox 609 965 647 983; x_wconf 85' lang='eng'>100</span> <span class='ocrx_word' id='word_1_129' title='bbox 660 968 712 969; x_wconf 38' lang='eng' dir='ltr'><em>i</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 731 958 905 980; x_wconf 84' lang='eng' dir='ltr'><em>Blastochloris</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 914 957 1058 980; x_wconf 86' lang='eng' dir='ltr'><em>sulfoviridis</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 1069 957 1133 980; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 1145 955 1208 980; x_wconf 92' lang='eng' dir='ltr'><em>729T</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 1219 957 1334 986; x_wconf 87' lang='eng' dir='ltr'><em>(D86514</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 1345 957 1352 986; x_wconf 95' lang='eng'><em>)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 421 870 422 1053">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 421 870 422 1053">
+     <span class='ocr_line' id='line_1_58' title="bbox 421 870 422 1053; baseline 0 1054"><span class='ocrx_word' id='word_1_136' title='bbox 421 870 422 1053; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 422 1043 509 1084">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 422 1043 509 1084">
+     <span class='ocr_line' id='line_1_59' title="bbox 422 1043 509 1062; baseline 0 0"><span class='ocrx_word' id='word_1_137' title='bbox 422 1043 509 1062; x_wconf 73' lang='eng' dir='ltr'><em>—o</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 461 1066 487 1084; baseline 0 0"><span class='ocrx_word' id='word_1_138' title='bbox 461 1066 487 1084; x_wconf 89' lang='eng'><em>96</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 499 996 501 1109">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 499 996 501 1109">
+     <span class='ocr_line' id='line_1_61' title="bbox 499 996 501 1109; baseline 0 998"><span class='ocrx_word' id='word_1_139' title='bbox 499 996 501 1109; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 501 987 668 1006">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 501 987 668 1006">
+     <span class='ocr_line' id='line_1_62' title="bbox 501 987 668 1006; baseline 0 0"><span class='ocrx_word' id='word_1_140' title='bbox 501 987 668 1006; x_wconf 75' lang='eng' dir='ltr'><em>—o</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 501 1100 670 1118">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 501 1100 670 1118">
+     <span class='ocr_line' id='line_1_63' title="bbox 501 1100 670 1118; baseline 0 0"><span class='ocrx_word' id='word_1_141' title='bbox 501 1100 670 1118; x_wconf 77' lang='eng' dir='ltr'><em>—o</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 660 1011 1342 1098">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 660 1011 1342 1098">
+     <span class='ocr_line' id='line_1_64' title="bbox 660 1011 1342 1042; baseline 0 -6"><span class='ocrx_word' id='word_1_142' title='bbox 660 1023 726 1025; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_143' title='bbox 745 1013 918 1036; x_wconf 85' lang='eng' dir='ltr'><em>Blastoch/oris</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 930 1013 1007 1036; x_wconf 88' lang='eng' dir='ltr'><em>viridis</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 1015 1013 1098 1036; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 1111 1011 1206 1036; x_wconf 89' lang='eng' dir='ltr'><em>19567T</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 1217 1013 1342 1042; x_wconf 87' lang='eng' dir='ltr'>(D25314)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_65' title="bbox 662 1066 1270 1098; baseline -0.002 -6"><span class='ocrx_word' id='word_1_148' title='bbox 662 1079 705 1081; x_wconf 96' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_149' title='bbox 724 1069 903 1097; x_wconf 89' lang='eng' dir='ltr'><em>Rhodoplanes</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 913 1069 1020 1098; x_wconf 86' lang='eng' dir='ltr'><em>elegans</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 1029 1066 1133 1092; x_wconf 89' lang='eng' dir='ltr'><em>AS130T</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 1144 1069 1270 1098; x_wconf 89' lang='eng' dir='ltr'>(D25311)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 659 968 662 1137">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 659 968 662 1137">
+     <span class='ocr_line' id='line_1_66' title="bbox 659 968 662 1137; baseline 0 970"><span class='ocrx_word' id='word_1_153' title='bbox 659 968 662 1137; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 592 1122 1438 1210">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 592 1122 1438 1210">
+     <span class='ocr_line' id='line_1_67' title="bbox 610 1122 1252 1154; baseline 0 -7"><span class='ocrx_word' id='word_1_154' title='bbox 610 1122 648 1140; x_wconf 79' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 662 1135 742 1137; x_wconf 95' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_156' title='bbox 761 1125 941 1153; x_wconf 88' lang='eng' dir='ltr'><em>Rhodoplanes</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 951 1130 1042 1147; x_wconf 82' lang='eng' dir='ltr'><em>rose-us</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 1052 1122 1115 1147; x_wconf 90' lang='eng' dir='ltr'><em>941T</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 1125 1124 1252 1154; x_wconf 88' lang='eng' dir='ltr'>(D25313)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_68' title="bbox 592 1178 1438 1210; baseline 0 -6"><span class='ocrx_word' id='word_1_160' title='bbox 592 1180 872 1204; x_wconf 89' lang='eng' dir='ltr'><em>Prosthecomicrobium</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 881 1180 1066 1209; x_wconf 86' lang='eng' dir='ltr'><em>pneumaticum</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 1075 1180 1158 1204; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 1168 1178 1266 1204; x_wconf 84' lang='eng' dir='ltr'><em>23633T</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 1277 1180 1438 1210; x_wconf 89' lang='eng' dir='ltr'>(ABO17203)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 627 1525 629 1583">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 627 1525 629 1583">
+     <span class='ocr_line' id='line_1_69' title="bbox 627 1525 629 1583; baseline 0 524"><span class='ocrx_word' id='word_1_165' title='bbox 627 1525 629 1583; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 600 1553 601 1639">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 600 1553 601 1639">
+     <span class='ocr_line' id='line_1_70' title="bbox 600 1553 601 1639; baseline 0 468"><span class='ocrx_word' id='word_1_166' title='bbox 600 1553 601 1639; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 532 1613 570 1631">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 532 1613 570 1631">
+     <span class='ocr_line' id='line_1_71' title="bbox 532 1613 570 1631; baseline 0 0"><span class='ocrx_word' id='word_1_167' title='bbox 532 1613 570 1631; x_wconf 89' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 581 1595 583 1694">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 581 1595 583 1694">
+     <span class='ocr_line' id='line_1_72' title="bbox 581 1595 583 1694; baseline 0 413"><span class='ocrx_word' id='word_1_168' title='bbox 581 1595 583 1694; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 439 1696 465 1698">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 439 1696 465 1698">
+     <span class='ocr_line' id='line_1_73' title="bbox 439 1696 465 1698; baseline 0 409"><span class='ocrx_word' id='word_1_169' title='bbox 439 1696 465 1698; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_58' title="bbox 463 1644 465 1750">
+    <p class='ocr_par' dir='ltr' id='par_1_60' title="bbox 463 1644 465 1750">
+     <span class='ocr_line' id='line_1_74' title="bbox 463 1644 465 1750; baseline 0 357"><span class='ocrx_word' id='word_1_170' title='bbox 463 1644 465 1750; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_59' title="bbox 411 1776 441 1778">
+    <p class='ocr_par' dir='ltr' id='par_1_61' title="bbox 411 1776 441 1778">
+     <span class='ocr_line' id='line_1_75' title="bbox 411 1776 441 1778; baseline 0 329"><span class='ocrx_word' id='word_1_171' title='bbox 411 1776 441 1778; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_60' title="bbox 439 1696 441 1859">
+    <p class='ocr_par' dir='ltr' id='par_1_62' title="bbox 439 1696 441 1859">
+     <span class='ocr_line' id='line_1_76' title="bbox 439 1696 441 1859; baseline 0 248"><span class='ocrx_word' id='word_1_172' title='bbox 439 1696 441 1859; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_61' title="bbox 448 1804 450 1911">
+    <p class='ocr_par' dir='ltr' id='par_1_63' title="bbox 448 1804 450 1911">
+     <span class='ocr_line' id='line_1_77' title="bbox 448 1804 450 1911; baseline 0 196"><span class='ocrx_word' id='word_1_173' title='bbox 448 1804 450 1911; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_62' title="bbox 450 1901 550 1942">
+    <p class='ocr_par' dir='ltr' id='par_1_64' title="bbox 450 1901 550 1942">
+     <span class='ocr_line' id='line_1_78' title="bbox 450 1901 550 1919; baseline 0 0"><span class='ocrx_word' id='word_1_174' title='bbox 450 1901 550 1919; x_wconf 72' lang='eng' dir='ltr'><em>—o</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_79' title="bbox 502 1924 528 1942; baseline 0 0"><span class='ocrx_word' id='word_1_175' title='bbox 502 1924 528 1942; x_wconf 86' lang='eng'><em>97</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_63' title="bbox 540 1860 541 1959">
+    <p class='ocr_par' dir='ltr' id='par_1_65' title="bbox 540 1860 541 1959">
+     <span class='ocr_line' id='line_1_80' title="bbox 540 1860 541 1959; baseline 0 148"><span class='ocrx_word' id='word_1_176' title='bbox 540 1860 541 1959; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_64' title="bbox 541 1949 1422 2029">
+    <p class='ocr_par' dir='ltr' id='par_1_66' title="bbox 610 1949 1422 2029">
+     <span class='ocr_line' id='line_1_81' title="bbox 610 1949 1422 2029; baseline 0 -45"><span class='ocrx_word' id='word_1_177' title='bbox 610 1972 648 1991; x_wconf 76' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 656 1949 718 2029; x_wconf 35' lang='eng'><em>&#39;4+*</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 728 1961 941 1984; x_wconf 90' lang='eng' dir='ltr'><em>Pedomicrobium</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 952 1961 1119 1984; x_wconf 86' lang='eng' dir='ltr'><em>americanum</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 1129 1961 1196 1984; x_wconf 92' lang='eng' dir='ltr'><em>ACM</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 1207 1959 1288 1984; x_wconf 91' lang='eng' dir='ltr'><em>3090T</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 1298 1961 1422 1990; x_wconf 87' lang='eng' dir='ltr'>(X97692)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_65' title="bbox 650 1234 1655 1321">
+    <p class='ocr_par' dir='ltr' id='par_1_67' title="bbox 650 1234 1655 1321">
+     <span class='ocr_line' id='line_1_82' title="bbox 706 1234 1348 1265; baseline 0 -6"><span class='ocrx_word' id='word_1_184' title='bbox 706 1236 937 1259; x_wconf 86' lang='eng' dir='ltr'><em>Rhodomicrobium</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 949 1236 1059 1259; x_wconf 86' lang='eng' dir='ltr'><em>vannie/ii</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 1069 1236 1133 1259; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 1147 1234 1208 1259; x_wconf 88' lang='eng' dir='ltr'><em>162T</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 1219 1236 1348 1265; x_wconf 90' lang='eng' dir='ltr'><em>(M34127)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_83' title="bbox 650 1289 1655 1321; baseline -0.003 -3"><span class='ocrx_word' id='word_1_189' title='bbox 650 1299 676 1318; x_wconf 86' lang='eng'>78</span> <span class='ocrx_word' id='word_1_190' title='bbox 689 1302 887 1304; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_191' title='bbox 906 1292 1136 1321; x_wconf 86' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 1147 1292 1397 1315; x_wconf 85' lang='eng' dir='ltr'><em>chloromethanicum</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 1407 1289 1485 1315; x_wconf 92' lang='eng' dir='ltr'><em>CM2T</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 1495 1292 1655 1321; x_wconf 87' lang='eng' dir='ltr'>(AF198623)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_66' title="bbox 668 1330 689 1332">
+    <p class='ocr_par' dir='ltr' id='par_1_68' title="bbox 668 1330 689 1332">
+     <span class='ocr_line' id='line_1_84' title="bbox 668 1330 689 1332; baseline 0 775"><span class='ocrx_word' id='word_1_195' title='bbox 668 1330 689 1332; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_67' title="bbox 688 1302 689 1360">
+    <p class='ocr_par' dir='ltr' id='par_1_69' title="bbox 688 1302 689 1360">
+     <span class='ocr_line' id='line_1_85' title="bbox 688 1302 689 1360; baseline 0 747"><span class='ocrx_word' id='word_1_196' title='bbox 688 1302 689 1360; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_68' title="bbox 631 1341 1361 1377">
+    <p class='ocr_par' dir='ltr' id='par_1_70' title="bbox 631 1341 1361 1377">
+     <span class='ocr_line' id='line_1_86' title="bbox 631 1341 1361 1377; baseline 0.001 -7"><span class='ocrx_word' id='word_1_197' title='bbox 631 1341 653 1359; x_wconf 67' lang='eng'>71</span> <span class='ocrx_word' id='word_1_198' title='bbox 689 1358 708 1360; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_199' title='bbox 728 1348 958 1377; x_wconf 86' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 968 1347 1038 1371; x_wconf 77' lang='eng' dir='ltr'><em>facile</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 1050 1348 1119 1370; x_wconf 94' lang='eng' dir='ltr'><em>IFAM</em></span> <span class='ocrx_word' id='word_1_202' title='bbox 1132 1345 1227 1371; x_wconf 78' lang='eng' dir='ltr'>H-526T</span> <span class='ocrx_word' id='word_1_203' title='bbox 1238 1347 1361 1377; x_wconf 90' lang='eng' dir='ltr'>(Y14309)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_69' title="bbox 640 1372 670 1374">
+    <p class='ocr_par' dir='ltr' id='par_1_71' title="bbox 640 1372 670 1374">
+     <span class='ocr_line' id='line_1_87' title="bbox 640 1372 670 1374; baseline 0 733"><span class='ocrx_word' id='word_1_204' title='bbox 640 1372 670 1374; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_70' title="bbox 668 1330 670 1415">
+    <p class='ocr_par' dir='ltr' id='par_1_72' title="bbox 668 1330 670 1415">
+     <span class='ocr_line' id='line_1_88' title="bbox 668 1330 670 1415; baseline 0 692"><span class='ocrx_word' id='word_1_205' title='bbox 668 1330 670 1415; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_71' title="bbox 642 1401 1452 1488">
+    <p class='ocr_par' dir='ltr' id='par_1_73' title="bbox 642 1401 1452 1488">
+     <span class='ocr_line' id='line_1_89' title="bbox 670 1401 1452 1432; baseline 0 -6"><span class='ocrx_word' id='word_1_206' title='bbox 670 1414 737 1415; x_wconf 40' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_207' title='bbox 756 1404 986 1432; x_wconf 88' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 997 1404 1189 1432; x_wconf 86' lang='eng' dir='ltr'><em>methylovorum</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 1200 1404 1243 1426; x_wconf 94' lang='eng' dir='ltr'><em>KM</em></span> <span class='ocrx_word' id='word_1_210' title='bbox 1256 1401 1317 1426; x_wconf 82' lang='eng' dir='ltr'><em>146T</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 1328 1403 1452 1432; x_wconf 90' lang='eng' dir='ltr'>(Y14307)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_90' title="bbox 642 1457 1423 1488; baseline 0 -6"><span class='ocrx_word' id='word_1_212' title='bbox 642 1469 737 1471; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_213' title='bbox 747 1459 977 1488; x_wconf 90' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_214' title='bbox 988 1459 1150 1482; x_wconf 78' lang='eng' dir='ltr'><em>denitriﬁcans</em></span> <span class='ocrx_word' id='word_1_215' title='bbox 1160 1459 1199 1482; x_wconf 95' lang='eng' dir='ltr'>TK</span> <span class='ocrx_word' id='word_1_216' title='bbox 1209 1457 1289 1482; x_wconf 91' lang='eng' dir='ltr'><em>0145T</em></span> <span class='ocrx_word' id='word_1_217' title='bbox 1299 1459 1423 1488; x_wconf 88' lang='eng' dir='ltr'>(Y14308)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_72' title="bbox 640 1372 642 1471">
+    <p class='ocr_par' dir='ltr' id='par_1_74' title="bbox 640 1372 642 1471">
+     <span class='ocr_line' id='line_1_91' title="bbox 640 1372 642 1471; baseline 0 636"><span class='ocrx_word' id='word_1_218' title='bbox 640 1372 642 1471; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_73' title="bbox 465 1513 1410 1711">
+    <p class='ocr_par' dir='ltr' id='par_1_75' title="bbox 465 1513 1408 1656">
+     <span class='ocr_line' id='line_1_92' title="bbox 629 1513 1401 1544; baseline 0 -6"><span class='ocrx_word' id='word_1_219' title='bbox 629 1525 693 1527; x_wconf 21' lang='eng'><strong>#</strong></span> <span class='ocrx_word' id='word_1_220' title='bbox 712 1515 942 1544; x_wconf 89' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_221' title='bbox 954 1515 1052 1544; x_wconf 89' lang='eng' dir='ltr'><em>vulgare</em></span> <span class='ocrx_word' id='word_1_222' title='bbox 1063 1515 1133 1538; x_wconf 92' lang='eng' dir='ltr'><em>IFAM</em></span> <span class='ocrx_word' id='word_1_223' title='bbox 1145 1513 1267 1538; x_wconf 92' lang='eng' dir='ltr'><em>MC-750T</em></span> <span class='ocrx_word' id='word_1_224' title='bbox 1277 1515 1401 1544; x_wconf 90' lang='eng' dir='ltr'>(Y14302)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_93' title="bbox 629 1568 1408 1600; baseline 0 -7"><span class='ocrx_word' id='word_1_225' title='bbox 629 1581 682 1583; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_226' title='bbox 701 1571 931 1600; x_wconf 87' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_227' title='bbox 941 1571 1070 1594; x_wconf 83' lang='eng' dir='ltr'><em>zavarzinii</em></span> <span class='ocrx_word' id='word_1_228' title='bbox 1080 1571 1149 1593; x_wconf 94' lang='eng' dir='ltr'><em>IFAM</em></span> <span class='ocrx_word' id='word_1_229' title='bbox 1160 1568 1274 1594; x_wconf 89' lang='eng' dir='ltr'><em>ZV-622T</em></span> <span class='ocrx_word' id='word_1_230' title='bbox 1285 1571 1408 1600; x_wconf 90' lang='eng' dir='ltr'>(Y14305)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_94' title="bbox 465 1624 1339 1656; baseline 0 -7"><span class='ocrx_word' id='word_1_231' title='bbox 465 1635 592 1653; x_wconf 73' lang='eng'><em>—.</em></span> <span class='ocrx_word' id='word_1_232' title='bbox 601 1637 671 1639; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_233' title='bbox 682 1627 912 1656; x_wconf 88' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_234' title='bbox 922 1627 1039 1649; x_wconf 82' lang='eng' dir='ltr'><em>aestuarii</em></span> <span class='ocrx_word' id='word_1_235' title='bbox 1048 1626 1113 1649; x_wconf 85' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_236' title='bbox 1127 1624 1205 1649; x_wconf 89' lang='eng' dir='ltr'><em>1564T</em></span> <span class='ocrx_word' id='word_1_237' title='bbox 1215 1626 1339 1656; x_wconf 86' lang='eng' dir='ltr'>(Y14304)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_76' title="bbox 583 1680 1410 1711">
+     <span class='ocr_line' id='line_1_95' title="bbox 583 1680 1410 1711; baseline 0 -6"><span class='ocrx_word' id='word_1_238' title='bbox 583 1693 655 1694; x_wconf 41' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_239' title='bbox 665 1682 895 1711; x_wconf 90' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_240' title='bbox 906 1682 1068 1705; x_wconf 89' lang='eng' dir='ltr'><em>ho/landicum</em></span> <span class='ocrx_word' id='word_1_241' title='bbox 1080 1682 1149 1705; x_wconf 93' lang='eng' dir='ltr'><em>IFAM</em></span> <span class='ocrx_word' id='word_1_242' title='bbox 1162 1680 1276 1705; x_wconf 89' lang='eng' dir='ltr'><em>KB-677T</em></span> <span class='ocrx_word' id='word_1_243' title='bbox 1287 1682 1410 1711; x_wconf 88' lang='eng' dir='ltr'>(Y14303)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_74' title="bbox 657 1735 1329 1823">
+    <p class='ocr_par' dir='ltr' id='par_1_77' title="bbox 657 1735 1329 1823">
+     <span class='ocr_line' id='line_1_96' title="bbox 701 1735 1329 1767; baseline 0.002 -7"><span class='ocrx_word' id='word_1_244' title='bbox 701 1738 892 1761; x_wconf 89' lang='eng' dir='ltr'><em>Filomicrobium</em></span> <span class='ocrx_word' id='word_1_245' title='bbox 902 1738 1027 1761; x_wconf 87' lang='eng' dir='ltr'><em>fusiforme</em></span> <span class='ocrx_word' id='word_1_246' title='bbox 1039 1738 1103 1761; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_247' title='bbox 1115 1735 1196 1761; x_wconf 89' lang='eng' dir='ltr'><em>5304T</em></span> <span class='ocrx_word' id='word_1_248' title='bbox 1206 1738 1329 1767; x_wconf 90' lang='eng' dir='ltr'>(Y14313)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_97' title="bbox 657 1791 1307 1823; baseline 0 -6"><span class='ocrx_word' id='word_1_249' title='bbox 657 1794 887 1823; x_wconf 88' lang='eng' dir='ltr'><em>Hyphomicrobium</em></span> <span class='ocrx_word' id='word_1_250' title='bbox 897 1793 1078 1817; x_wconf 87' lang='eng' dir='ltr'><em>sulfonivorans</em></span> <span class='ocrx_word' id='word_1_251' title='bbox 1088 1791 1137 1817; x_wconf 89' lang='eng' dir='ltr'><em>S1T</em></span> <span class='ocrx_word' id='word_1_252' title='bbox 1147 1794 1307 1823; x_wconf 87' lang='eng' dir='ltr'>(AF235089)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_75' title="bbox 541 1847 1370 1879">
+    <p class='ocr_par' dir='ltr' id='par_1_78' title="bbox 541 1847 1370 1879">
+     <span class='ocr_line' id='line_1_98' title="bbox 541 1847 1370 1879; baseline 0 -6"><span class='ocrx_word' id='word_1_253' title='bbox 541 1860 659 1862; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_254' title='bbox 670 1850 882 1873; x_wconf 89' lang='eng' dir='ltr'><em>Pedomicrobium</em></span> <span class='ocrx_word' id='word_1_255' title='bbox 893 1850 1068 1879; x_wconf 88' lang='eng' dir='ltr'><em>manganicum</em></span> <span class='ocrx_word' id='word_1_256' title='bbox 1077 1850 1144 1873; x_wconf 94' lang='eng' dir='ltr'><em>ACM</em></span> <span class='ocrx_word' id='word_1_257' title='bbox 1155 1847 1236 1873; x_wconf 90' lang='eng' dir='ltr'><em>3038T</em></span> <span class='ocrx_word' id='word_1_258' title='bbox 1246 1850 1370 1879; x_wconf 89' lang='eng' dir='ltr'>(X97691)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_76' title="bbox 662 1903 1388 1935">
+    <p class='ocr_par' dir='ltr' id='par_1_79' title="bbox 662 1903 1388 1935">
+     <span class='ocr_line' id='line_1_99' title="bbox 662 1903 1388 1935; baseline 0 -7"><span class='ocrx_word' id='word_1_259' title='bbox 662 1916 690 1918; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_260' title='bbox 700 1906 913 1928; x_wconf 86' lang='eng' dir='ltr'><em>Pedomicrobium</em></span> <span class='ocrx_word' id='word_1_261' title='bbox 924 1905 1086 1934; x_wconf 87' lang='eng' dir='ltr'><em>ferrugineum</em></span> <span class='ocrx_word' id='word_1_262' title='bbox 1098 1905 1162 1928; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_263' title='bbox 1176 1903 1254 1928; x_wconf 92' lang='eng' dir='ltr'><em>1540T</em></span> <span class='ocrx_word' id='word_1_264' title='bbox 1265 1905 1388 1935; x_wconf 88' lang='eng' dir='ltr'>(X97690)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_77' title="bbox 660 1916 662 2000">
+    <p class='ocr_par' dir='ltr' id='par_1_80' title="bbox 660 1916 662 2000">
+     <span class='ocr_line' id='line_1_100' title="bbox 660 1916 662 2000; baseline 0 107"><span class='ocrx_word' id='word_1_265' title='bbox 660 1916 662 2000; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_78' title="bbox 639 2014 1422 2046">
+    <p class='ocr_par' dir='ltr' id='par_1_81' title="bbox 639 2014 1422 2046">
+     <span class='ocr_line' id='line_1_101' title="bbox 639 2014 1422 2046; baseline 0 -6"><span class='ocrx_word' id='word_1_266' title='bbox 639 2014 677 2032; x_wconf 68' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_267' title='bbox 707 2017 920 2040; x_wconf 87' lang='eng' dir='ltr'><em>Pedomicrobium</em></span> <span class='ocrx_word' id='word_1_268' title='bbox 930 2017 1086 2040; x_wconf 86' lang='eng' dir='ltr'><em>australicum</em></span> <span class='ocrx_word' id='word_1_269' title='bbox 1096 2017 1179 2040; x_wconf 94' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_270' title='bbox 1189 2014 1287 2040; x_wconf 89' lang='eng' dir='ltr'><em>43611T</em></span> <span class='ocrx_word' id='word_1_271' title='bbox 1298 2017 1422 2046; x_wconf 91' lang='eng' dir='ltr'>(X97693)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_79' title="bbox 6 2083 937 2085">
+    <p class='ocr_par' dir='ltr' id='par_1_82' title="bbox 6 2083 937 2085">
+     <span class='ocr_line' id='line_1_102' title="bbox 6 2083 937 2085; baseline 0 22"><span class='ocrx_word' id='word_1_272' title='bbox 6 2083 937 2085; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_80' title="bbox 939 2070 1365 2102">
+    <p class='ocr_par' dir='ltr' id='par_1_83' title="bbox 939 2070 1365 2102">
+     <span class='ocr_line' id='line_1_103' title="bbox 939 2070 1365 2102; baseline 0 -7"><span class='ocrx_word' id='word_1_273' title='bbox 939 2073 1097 2095; x_wconf 88' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_274' title='bbox 1108 2073 1154 2095; x_wconf 89' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_275' title='bbox 1163 2070 1229 2095; x_wconf 89' lang='eng' dir='ltr'><em>K12T</em></span> <span class='ocrx_word' id='word_1_276' title='bbox 1240 2072 1365 2102; x_wconf 88' lang='eng' dir='ltr'>(U00096)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002899-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002899-0-000.pbm.png
new file mode 100644
index 00000000..5aad8fad
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002899-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002899-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002899-0-000.pbm.png.hocr
new file mode 100644
index 00000000..737fa19b
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002899-0-000.pbm.png.hocr
@@ -0,0 +1,132 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002899-0-000.pbm.png"; bbox 0 0 994 808; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 38 0 870 35">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 38 2 870 30">
+     <span class='ocr_line' id='line_1_1' title="bbox 38 2 870 30; baseline -0.002 -4"><span class='ocrx_word' id='word_1_1' title='bbox 38 11 238 26; x_wconf 63' lang='eng' dir='ltr'><em>.—u</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 373 12 398 30; x_wconf 73' lang='eng'>99</span> <span class='ocrx_word' id='word_1_3' title='bbox 426 3 451 24; x_wconf 91' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 463 3 554 24; x_wconf 84' lang='eng' dir='ltr'><em>sienata</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 566 3 610 24; x_wconf 93' lang='eng' dir='ltr'><em>IFM</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 624 2 711 24; x_wconf 80' lang='eng' dir='ltr'><em>10088T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 719 3 870 30; x_wconf 81' lang='eng' dir='ltr'><em>(AB121770)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 114 32 901 168">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 115 33 901 166">
+     <span class='ocr_line' id='line_1_2' title="bbox 115 33 901 75; baseline -0.001 -5"><span class='ocrx_word' id='word_1_8' title='bbox 115 33 158 51; x_wconf 56' lang='eng'><em>0&#39;01</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 308 46 333 64; x_wconf 79' lang='eng'><em>84</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 391 38 420 60; x_wconf 69' lang='eng' dir='ltr'><em>*L</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 431 49 456 69; x_wconf 92' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 469 49 575 70; x_wconf 83' lang='eng' dir='ltr'><em>testacea</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 585 48 641 70; x_wconf 83' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 654 48 742 70; x_wconf 84' lang='eng' dir='ltr'><em>12235T</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 750 48 901 75; x_wconf 82' lang='eng' dir='ltr'><em>(AB192415)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 281 72 867 137; baseline 0 -22"><span class='ocrx_word' id='word_1_16' title='bbox 281 85 306 137; x_wconf 59' lang='eng' dir='ltr'><em>97f</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 325 72 416 106; x_wconf 63' lang='eng' dir='ltr'><em>fl—</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 426 94 450 115; x_wconf 93' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 463 94 594 115; x_wconf 87' lang='eng' dir='ltr'><em>ﬂavorosea</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 604 94 660 115; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 671 93 745 115; x_wconf 80' lang='eng' dir='ltr'><em>3332T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 753 94 867 121; x_wconf 87' lang='eng'><em>(246754)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 195 137 830 166; baseline 0.002 -6"><span class='ocrx_word' id='word_1_23' title='bbox 195 137 220 155; x_wconf 79' lang='eng'><em>79</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 315 149 368 151; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_25' title='bbox 377 139 402 160; x_wconf 96' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 415 145 501 161; x_wconf 86' lang='eng' dir='ltr'><em>carnea</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 512 139 572 161; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 582 138 673 161; x_wconf 79' lang='eng' dir='ltr'><em>43397T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 680 139 830 166; x_wconf 88' lang='eng' dir='ltr'><em>(AF430035)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 312 69 316 151">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 312 69 316 151">
+     <span class='ocr_line' id='line_1_5' title="bbox 312 69 316 151; baseline 0 657"><span class='ocrx_word' id='word_1_30' title='bbox 312 69 316 151; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 41 158 317 224">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 41 160 317 221">
+     <span class='ocr_line' id='line_1_6' title="bbox 109 160 232 185; baseline 0 0"><span class='ocrx_word' id='word_1_31' title='bbox 109 160 232 185; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 41 185 317 221; baseline 0 587"><span class='ocrx_word' id='word_1_32' title='bbox 41 185 317 221; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 22 179 975 714">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 48 184 970 712">
+     <span class='ocr_line' id='line_1_8' title="bbox 317 184 920 212; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 317 194 354 212; x_wconf 78' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 453 185 479 206; x_wconf 96' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 485 185 630 212; x_wconf 88' lang='eng' dir='ltr'><em>jinanensis</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 639 184 755 206; x_wconf 79' lang='eng' dir='ltr'><em>04-5195T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 765 185 920 212; x_wconf 86' lang='eng' dir='ltr'><em>(DQ462650)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 341 220 868 257; baseline 0 -6"><span class='ocrx_word' id='word_1_38' title='bbox 341 227 349 234; x_wconf 61' lang='eng'>*</span> <span class='ocrx_word' id='word_1_39' title='bbox 358 220 430 242; x_wconf 72' lang='eng' dir='ltr'><em>I—</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 440 230 465 251; x_wconf 96' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 477 230 607 257; x_wconf 84' lang='eng' dir='ltr'><em>speluncae</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 618 229 868 257; x_wconf 62' lang='eng' dir='ltr'><em>N2-11T(AM422449)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 318 275 834 303; baseline -0.002 -6"><span class='ocrx_word' id='word_1_43' title='bbox 318 276 343 296; x_wconf 95' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 355 276 502 297; x_wconf 85' lang='eng' dir='ltr'><em>brevicatena</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 513 275 573 297; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 583 275 674 297; x_wconf 81' lang='eng' dir='ltr'><em>43024T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 684 275 834 303; x_wconf 88' lang='eng' dir='ltr'><em>(AF430040)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 240 321 732 348; baseline 0.002 -6"><span class='ocrx_word' id='word_1_48' title='bbox 240 322 264 342; x_wconf 95' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 277 322 467 348; x_wconf 82' lang='eng' dir='ltr'><em>cyriac/georgica</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 478 321 572 343; x_wconf 86' lang='eng' dir='ltr'><em>D1627T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 582 321 732 348; x_wconf 87' lang='eng' dir='ltr'><em>(AF282889)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 117 366 776 413; baseline 0 -25"><span class='ocrx_word' id='word_1_52' title='bbox 117 374 232 413; x_wconf 69' lang='eng' dir='ltr'><em>L—</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 242 367 266 388; x_wconf 94' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 279 367 414 388; x_wconf 85' lang='eng' dir='ltr'><em>abscessus</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 424 367 504 388; x_wconf 93' lang='eng' dir='ltr'><em>IMMIB</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 516 366 776 394; x_wconf 74' lang='eng' dir='ltr'><em>D—1592T(AF218292)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 207 411 793 439; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 207 422 286 424; x_wconf 96' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_58' title='bbox 296 412 321 433; x_wconf 96' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 333 412 465 433; x_wconf 87' lang='eng' dir='ltr'><em>asteroides</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 475 412 535 433; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 546 411 636 433; x_wconf 88' lang='eng' dir='ltr'><em>43757T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 644 412 793 439; x_wconf 87' lang='eng' dir='ltr'><em>(AF430019)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 367 457 856 484; baseline 0.002 -6"><span class='ocrx_word' id='word_1_63' title='bbox 367 458 392 478; x_wconf 97' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 404 458 540 479; x_wconf 74' lang='eng' dir='ltr'><em>tha/‘Iandica</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 551 458 596 478; x_wconf 92' lang='eng' dir='ltr'><em>IFM</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 609 457 697 479; x_wconf 91' lang='eng' dir='ltr'><em>10145T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 705 457 856 484; x_wconf 90' lang='eng' dir='ltr'><em>(AB126874)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 227 502 726 530; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 227 503 252 524; x_wconf 95' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 263 503 414 524; x_wconf 85' lang='eng' dir='ltr'><em>Xishanensis</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 422 503 459 524; x_wconf 88' lang='eng' dir='ltr'><em>AS</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 469 502 726 530; x_wconf 64' lang='eng' dir='ltr'><em>4.1860T(AY333115)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 253 548 857 575; baseline -0.002 -5"><span class='ocrx_word' id='word_1_72' title='bbox 253 549 277 569; x_wconf 95' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 288 549 526 575; x_wconf 75' lang='eng' dir='ltr'><em>pseudobrasiliensis</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 536 548 596 570; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 606 548 697 570; x_wconf 89' lang='eng' dir='ltr'><em>44290T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 707 548 857 575; x_wconf 86' lang='eng' dir='ltr'><em>(AF430042)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 48 588 703 621; baseline 0.002 -6"><span class='ocrx_word' id='word_1_77' title='bbox 48 588 59 609; x_wconf 53' lang='eng' dir='ltr'><em>fv</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 70 593 81 611; x_wconf 77' lang='eng' dir='ltr'>P</span> <span class='ocrx_word' id='word_1_79' title='bbox 290 594 314 615; x_wconf 97' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 326 599 387 616; x_wconf 87' lang='eng' dir='ltr'><em>nova</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 398 594 443 615; x_wconf 93' lang='eng' dir='ltr'><em>IFM</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 456 593 703 621; x_wconf 52' lang='eng' dir='ltr'><em>102657(AB162790)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 130 639 730 667; baseline 0 -6"><span class='ocrx_word' id='word_1_83' title='bbox 130 650 313 652; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_84' title='bbox 322 640 347 661; x_wconf 95' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 359 640 412 661; x_wconf 87' lang='eng' dir='ltr'><em>alba</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 421 640 470 661; x_wconf 95' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 481 639 571 661; x_wconf 81' lang='eng' dir='ltr'><em>30243T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 578 640 730 667; x_wconf 85' lang='eng' dir='ltr'><em>(AY222321)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 93 667 970 712; baseline 0 -6"><span class='ocrx_word' id='word_1_89' title='bbox 93 667 118 685; x_wconf 68' lang='eng'><em>92</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 454 685 478 706; x_wconf 95' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 490 685 641 706; x_wconf 84' lang='eng' dir='ltr'><em>salmonicida</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 652 685 712 706; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_93' title='bbox 722 684 970 712; x_wconf 83' lang='eng' dir='ltr'><em>40472T(AF430050)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 80 693 991 775">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 81 696 991 761">
+     <span class='ocr_line' id='line_1_20' title="bbox 81 696 121 713; baseline 0 0"><span class='ocrx_word' id='word_1_94' title='bbox 81 696 88 713; x_wconf 91' lang='eng' dir='ltr'>f</span> <span class='ocrx_word' id='word_1_95' title='bbox 103 700 121 713; x_wconf 93' lang='eng' dir='ltr'>m</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 90 707 389 725; baseline 0 0"><span class='ocrx_word' id='word_1_96' title='bbox 90 711 92 717; x_wconf 49' lang='eng' dir='ltr'><strong>v</strong></span> <span class='ocrx_word' id='word_1_97' title='bbox 351 707 389 725; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 345 730 991 761; baseline 0 -9"><span class='ocrx_word' id='word_1_98' title='bbox 345 739 357 761; x_wconf 33' lang='eng' dir='ltr'>f,</span> <span class='ocrx_word' id='word_1_99' title='bbox 367 744 385 757; x_wconf 83' lang='eng' dir='ltr'>m</span> <span class='ocrx_word' id='word_1_100' title='bbox 412 742 437 760; x_wconf 73' lang='eng'>99</span> <span class='ocrx_word' id='word_1_101' title='bbox 457 731 481 751; x_wconf 97' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 494 731 662 752; x_wconf 84' lang='eng' dir='ltr'><em>cummidelens</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 673 730 732 752; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 743 730 991 757; x_wconf 76' lang='eng' dir='ltr'><em>44490T(AF430052)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 396 767 867 805">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 396 767 867 803">
+     <span class='ocr_line' id='line_1_23' title="bbox 396 767 867 803; baseline 0 -6"><span class='ocrx_word' id='word_1_105' title='bbox 396 772 408 793; x_wconf 50' lang='eng' dir='ltr'><em>fv</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 419 777 436 790; x_wconf 82' lang='eng' dir='ltr'>m</span> <span class='ocrx_word' id='word_1_107' title='bbox 445 767 447 788; x_wconf 74' lang='eng' dir='ltr'><strong>I</strong></span> <span class='ocrx_word' id='word_1_108' title='bbox 457 776 481 797; x_wconf 95' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 493 776 537 797; x_wconf 82' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 546 776 606 797; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 616 775 707 797; x_wconf 93' lang='eng' dir='ltr'><em>44488T</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 717 776 867 803; x_wconf 88' lang='eng' dir='ltr'><em>(AF430051)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 17 184 446 614">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 18 221 312 611">
+     <span class='ocr_line' id='line_1_24' title="bbox 20 221 312 361; baseline 0 0"><span class='ocrx_word' id='word_1_113' title='bbox 20 221 312 361; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 20 361 124 451; baseline 0 -43"><span class='ocrx_word' id='word_1_114' title='bbox 20 361 124 451; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 18 451 220 488; baseline 0 -35"><span class='ocrx_word' id='word_1_115' title='bbox 18 451 220 488; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 18 488 283 611; baseline 0 -67"><span class='ocrx_word' id='word_1_116' title='bbox 18 488 283 611; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 153 377 155 448">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 153 377 155 448">
+     <span class='ocr_line' id='line_1_28' title="bbox 153 377 155 448; baseline 0 360"><span class='ocrx_word' id='word_1_117' title='bbox 153 377 155 448; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 173 424 199 442">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 173 424 199 442">
+     <span class='ocr_line' id='line_1_29' title="bbox 173 424 199 442; baseline 0 0"><span class='ocrx_word' id='word_1_118' title='bbox 173 424 199 442; x_wconf 87' lang='eng'><em>69</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 153 444 207 448">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 153 444 207 448">
+     <span class='ocr_line' id='line_1_30' title="bbox 153 444 207 448; baseline 0 360"><span class='ocrx_word' id='word_1_119' title='bbox 153 444 207 448; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 204 422 208 470">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 204 422 208 470">
+     <span class='ocr_line' id='line_1_31' title="bbox 204 422 208 470; baseline 0 338"><span class='ocrx_word' id='word_1_120' title='bbox 204 422 208 470; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 127 650 131 732">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 127 650 131 732">
+     <span class='ocr_line' id='line_1_32' title="bbox 127 650 131 732; baseline 0 76"><span class='ocrx_word' id='word_1_121' title='bbox 127 650 131 732; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002907-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002907-0-001.pbm.png
new file mode 100644
index 00000000..ccf28e5d
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002907-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002907-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002907-0-001.pbm.png.hocr
new file mode 100644
index 00000000..0727faaf
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002907-0-001.pbm.png.hocr
@@ -0,0 +1,170 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002907-0-001.pbm.png"; bbox 0 0 994 608; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 2 0 994 608">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 2 0 994 608">
+     <span class='ocr_line' id='line_1_1' title="bbox 234 0 915 28; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 234 11 270 13; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_2' title='bbox 277 2 422 27; x_wconf 76' lang='eng' dir='ltr'><em>Kineosporia</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 432 2 577 22; x_wconf 77' lang='eng' dir='ltr'><em>mikuniensis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 588 1 663 22; x_wconf 91' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 675 0 870 28; x_wconf 72' lang='eng' dir='ltr'><em>16234T(ABB771</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 879 1 915 28; x_wconf 91' lang='eng'><em>17)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 311 45 895 72; baseline 0 -5"><span class='ocrx_word' id='word_1_7' title='bbox 311 46 456 72; x_wconf 86' lang='eng' dir='ltr'><em>Kineosporia</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 466 46 595 67; x_wconf 78' lang='eng' dir='ltr'><em>aurantiaca</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 604 46 659 67; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 670 45 741 67; x_wconf 89' lang='eng' dir='ltr'><em>3230T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 749 46 895 72; x_wconf 80' lang='eng' dir='ltr'><em>(A8003931)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 234 89 805 117; baseline 0 -6"><span class='ocrx_word' id='word_1_12' title='bbox 234 100 297 102; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_13' title='bbox 305 91 450 116; x_wconf 85' lang='eng' dir='ltr'><em>Kineosporia</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 460 91 568 111; x_wconf 86' lang='eng' dir='ltr'><em>succinea</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 580 89 651 111; x_wconf 89' lang='eng' dir='ltr'><em>I-273T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 659 90 805 117; x_wconf 80' lang='eng' dir='ltr'><em>(A8003932)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 276 135 634 163; baseline 0 -8"><span class='ocrx_word' id='word_1_17' title='bbox 276 147 308 163; x_wconf 69' lang='eng'><em>861</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 324 135 474 156; x_wconf 87' lang='eng' dir='ltr'><em>VN05A0342</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 484 135 634 161; x_wconf 87' lang='eng' dir='ltr'><em>(AB377118)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 240 145 646 235; baseline -0.005 -33"><span class='ocrx_word' id='word_1_20' title='bbox 240 145 455 235; x_wconf 38' lang='eng' dir='ltr'><em>MVNOSAOM</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 461 178 486 200; x_wconf 79' lang='eng' dir='ltr'><strong>ST</strong></span> <span class='ocrx_word' id='word_1_22' title='bbox 496 179 646 206; x_wconf 88' lang='eng' dir='ltr'><em>(AB377116)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 328 224 639 250; baseline -0.003 -5"><span class='ocrx_word' id='word_1_23' title='bbox 328 224 475 245; x_wconf 84' lang='eng' dir='ltr'><em>VN05A0351</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 489 224 639 250; x_wconf 82' lang='eng' dir='ltr'><em>(A3377119)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 336 267 846 295; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 336 269 481 294; x_wconf 72' lang='eng' dir='ltr'><em>Kineosporia</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 491 269 609 294; x_wconf 82' lang='eng' dir='ltr'><em>rhizophi/a</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 620 267 692 289; x_wconf 84' lang='eng' dir='ltr'><em>l-449T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 699 268 846 295; x_wconf 82' lang='eng' dir='ltr'><em>(ABOO3933)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 272 312 787 340; baseline 0 -6"><span class='ocrx_word' id='word_1_29' title='bbox 272 314 417 339; x_wconf 80' lang='eng' dir='ltr'><em>Kineosporia</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 427 314 550 334; x_wconf 81' lang='eng' dir='ltr'><em>rhamnosa</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 561 312 633 334; x_wconf 82' lang='eng' dir='ltr'><em>I-132T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 640 313 787 340; x_wconf 80' lang='eng' dir='ltr'><em>(A8003935)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 381 357 994 384; baseline 0 -5"><span class='ocrx_word' id='word_1_33' title='bbox 381 358 539 379; x_wconf 84' lang='eng' dir='ltr'><em>Kineococcus</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 548 358 691 379; x_wconf 75' lang='eng' dir='ltr'><em>aurantiacus</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 701 358 777 379; x_wconf 90' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 789 357 875 379; x_wconf 80' lang='eng' dir='ltr'><em>15268T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 882 358 994 384; x_wconf 84' lang='eng' dir='ltr'><em>(X77958)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 2 401 887 429; baseline -0.002 -4"><span class='ocrx_word' id='word_1_38' title='bbox 2 423 23 425; x_wconf 97' lang='eng'>_</span> <span class='ocrx_word' id='word_1_39' title='bbox 100 412 288 414; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_40' title='bbox 296 402 477 428; x_wconf 79' lang='eng' dir='ltr'><em>Quadrisphaera</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 487 403 627 429; x_wconf 84' lang='eng' dir='ltr'><em>granu/orum</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 635 401 887 429; x_wconf 79' lang='eng' dir='ltr'><em>AGO19T(AY831385)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 345 446 978 473; baseline -0.002 -5"><span class='ocrx_word' id='word_1_43' title='bbox 345 447 571 473; x_wconf 85' lang='eng' dir='ltr'><em>Geodermatophi/us</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 580 447 692 468; x_wconf 83' lang='eng' dir='ltr'><em>obscurus</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 702 447 760 468; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 770 446 858 468; x_wconf 81' lang='eng' dir='ltr'><em>43162T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 865 447 978 473; x_wconf 87' lang='eng' dir='ltr'><em>(X92357)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 362 492 618 518; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 362 492 453 512; x_wconf 84' lang='eng' dir='ltr'><em>Frankia</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 463 497 497 517; x_wconf 86' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 509 492 618 518; x_wconf 89' lang='eng' dir='ltr'><em>(L41048)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 243 535 880 562; baseline -0.002 -5"><span class='ocrx_word' id='word_1_51' title='bbox 243 536 388 562; x_wconf 84' lang='eng' dir='ltr'><em>Sporichthya</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 397 536 542 562; x_wconf 86' lang='eng' dir='ltr'><em>polymorpha</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 553 536 629 557; x_wconf 92' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_54' title='bbox 641 535 880 562; x_wconf 78' lang='eng' dir='ltr'><em>12702T(A8025317)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 315 579 819 608; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 315 581 417 602; x_wconf 75' lang='eng' dir='ltr'><em>PiI/me/ia</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 427 582 532 602; x_wconf 83' lang='eng' dir='ltr'><em>terevasa</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 543 581 600 602; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 611 579 819 608; x_wconf 75' lang='eng' dir='ltr'><em>43040T(X93190)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 72 27 113 90">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 72 27 113 90">
+     <span class='ocr_line' id='line_1_15' title="bbox 72 27 111 43; baseline 0 0"><span class='ocrx_word' id='word_1_59' title='bbox 72 27 111 43; x_wconf 84' lang='eng'><em>0.01</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 74 68 113 90; baseline 0 0"><span class='ocrx_word' id='word_1_60' title='bbox 74 68 113 90; x_wconf 67' lang='eng' dir='ltr'><em>Km</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 234 55 303 57">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 234 55 303 57">
+     <span class='ocr_line' id='line_1_17' title="bbox 234 55 303 57; baseline 0 551"><span class='ocrx_word' id='word_1_61' title='bbox 234 55 303 57; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 232 11 235 102">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 232 11 235 102">
+     <span class='ocr_line' id='line_1_18' title="bbox 232 11 235 102; baseline 0 506"><span class='ocrx_word' id='word_1_62' title='bbox 232 11 235 102; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 181 120 217 137">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 181 120 217 137">
+     <span class='ocr_line' id='line_1_19' title="bbox 181 120 217 137; baseline -0.028 0"><span class='ocrx_word' id='word_1_63' title='bbox 181 120 217 137; x_wconf 83' lang='eng'><em>972</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 124 210 159 227">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 124 210 159 227">
+     <span class='ocr_line' id='line_1_20' title="bbox 124 210 159 227; baseline 0 0"><span class='ocrx_word' id='word_1_64' title='bbox 124 210 159 227; x_wconf 80' lang='eng'><em>992</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 126 232 185 234">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 126 232 185 234">
+     <span class='ocr_line' id='line_1_21' title="bbox 126 232 185 234; baseline 0 374"><span class='ocrx_word' id='word_1_65' title='bbox 126 232 185 234; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 197 245 232 261">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 197 245 232 261">
+     <span class='ocr_line' id='line_1_22' title="bbox 197 245 232 261; baseline 0 0"><span class='ocrx_word' id='word_1_66' title='bbox 197 245 232 261; x_wconf 87' lang='eng'><em>522</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 238 201 240 280">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 238 201 240 280">
+     <span class='ocr_line' id='line_1_23' title="bbox 238 201 240 280; baseline 0 328"><span class='ocrx_word' id='word_1_67' title='bbox 238 201 240 280; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 240 278 329 280">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 240 278 329 280">
+     <span class='ocr_line' id='line_1_24' title="bbox 240 278 329 280; baseline 0 328"><span class='ocrx_word' id='word_1_68' title='bbox 240 278 329 280; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 86 278 121 294">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 86 278 121 294">
+     <span class='ocr_line' id='line_1_25' title="bbox 86 278 121 294; baseline 0 0"><span class='ocrx_word' id='word_1_69' title='bbox 86 278 121 294; x_wconf 82' lang='eng'><em>800</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 98 300 128 302">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 98 300 128 302">
+     <span class='ocr_line' id='line_1_26' title="bbox 98 300 128 302; baseline 0 306"><span class='ocrx_word' id='word_1_70' title='bbox 98 300 128 302; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 183 142 185 324">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 183 142 185 324">
+     <span class='ocr_line' id='line_1_27' title="bbox 183 142 185 324; baseline 0 284"><span class='ocrx_word' id='word_1_71' title='bbox 183 142 185 324; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 185 323 265 325">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 185 323 265 325">
+     <span class='ocr_line' id='line_1_28' title="bbox 185 323 265 325; baseline 0 283"><span class='ocrx_word' id='word_1_72' title='bbox 185 323 265 325; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 126 232 128 370">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 126 232 128 370">
+     <span class='ocr_line' id='line_1_29' title="bbox 126 232 128 370; baseline 0 238"><span class='ocrx_word' id='word_1_73' title='bbox 126 232 128 370; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 22 336 57 352">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 22 336 57 352">
+     <span class='ocr_line' id='line_1_30' title="bbox 22 336 57 352; baseline 0 0"><span class='ocrx_word' id='word_1_74' title='bbox 22 336 57 352; x_wconf 84' lang='eng'><em>979</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 26 356 97 358">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 26 356 97 358">
+     <span class='ocr_line' id='line_1_31' title="bbox 26 356 97 358; baseline 0 250"><span class='ocrx_word' id='word_1_75' title='bbox 26 356 97 358; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 98 301 100 414">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 98 301 100 414">
+     <span class='ocr_line' id='line_1_32' title="bbox 98 301 100 414; baseline 0 194"><span class='ocrx_word' id='word_1_76' title='bbox 98 301 100 414; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 24 356 26 492">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 24 356 26 492">
+     <span class='ocr_line' id='line_1_33' title="bbox 24 356 26 492; baseline 0 116"><span class='ocrx_word' id='word_1_77' title='bbox 24 356 26 492; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 43 457 48 548">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 43 457 48 548">
+     <span class='ocr_line' id='line_1_34' title="bbox 43 457 48 548; baseline 0 60"><span class='ocrx_word' id='word_1_78' title='bbox 43 457 48 548; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 0 423 2 592">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 0 423 2 592">
+     <span class='ocr_line' id='line_1_35' title="bbox 0 423 2 592; baseline 0 16"><span class='ocrx_word' id='word_1_79' title='bbox 0 423 2 592; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-000.pbm.png
new file mode 100644
index 00000000..6af14390
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-000.pbm.png.hocr
new file mode 100644
index 00000000..59b1a821
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-000.pbm.png.hocr
@@ -0,0 +1,76 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002915-0-000.pbm.png"; bbox 0 0 994 800; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 103 8 993 711">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 103 8 993 711">
+     <span class='ocr_line' id='line_1_1' title="bbox 122 8 606 38; baseline 0 -7"><span class='ocrx_word' id='word_1_1' title='bbox 122 22 146 38; x_wconf 71' lang='eng'><em>96</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 160 10 184 31; x_wconf 91' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 194 10 323 38; x_wconf 81' lang='eng' dir='ltr'><em>gallinarum</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 331 10 387 32; x_wconf 89' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 398 9 474 31; x_wconf 84' lang='eng' dir='ltr'><em>6291T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 483 8 606 36; x_wconf 79' lang='eng'><em>(088191)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 103 56 605 84; baseline -0.002 -4"><span class='ocrx_word' id='word_1_7' title='bbox 103 60 139 75; x_wconf 80' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 162 58 185 79; x_wconf 88' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 196 58 316 80; x_wconf 83' lang='eng' dir='ltr'><em>saeculare</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 326 58 386 80; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 397 57 473 79; x_wconf 80' lang='eng' dir='ltr'><em>6531T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 482 56 605 84; x_wconf 87' lang='eng' dir='ltr'><em>(D89328)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 162 104 587 134; baseline 0 -7"><span class='ocrx_word' id='word_1_13' title='bbox 162 106 185 127; x_wconf 90' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 195 106 304 134; x_wconf 89' lang='eng' dir='ltr'><em>pullorum</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 313 106 368 128; x_wconf 89' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 381 104 587 132; x_wconf 58' lang='eng' dir='ltr'><em>1214T(D86196)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 124 152 573 180; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 124 154 148 175; x_wconf 92' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 159 154 251 176; x_wconf 85' lang='eng' dir='ltr'><em>biﬁdum</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 260 154 335 176; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 345 155 422 176; x_wconf 83' lang='eng'><em>29521</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 429 153 438 166; x_wconf 78' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_22' title='bbox 447 152 573 180; x_wconf 90' lang='eng' dir='ltr'><em>(M84777)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 141 200 876 230; baseline -0.001 -6"><span class='ocrx_word' id='word_1_23' title='bbox 141 202 164 223; x_wconf 89' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 176 202 398 230; x_wconf 78' lang='eng' dir='ltr'><em>thermacidophilum</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 407 202 487 230; x_wconf 88' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 497 202 614 230; x_wconf 82' lang='eng' dir='ltr'><em>porcinum</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 625 201 712 223; x_wconf 78' lang='eng' dir='ltr'><em>P3-14T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 721 200 876 228; x_wconf 89' lang='eng' dir='ltr'>(AY148470)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 189 248 712 278; baseline 0 -7"><span class='ocrx_word' id='word_1_29' title='bbox 189 250 213 271; x_wconf 94' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 225 250 394 278; x_wconf 84' lang='eng' dir='ltr'><em>thermophilum</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 403 250 478 272; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 488 249 581 271; x_wconf 85' lang='eng' dir='ltr'><em>25525T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 590 248 712 276; x_wconf 91' lang='eng' dir='ltr'>(U10151)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 162 296 993 326; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 162 298 185 320; x_wconf 91' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 197 298 435 326; x_wconf 77' lang='eng' dir='ltr'><em>thermoacidophi/um</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 444 298 525 326; x_wconf 89' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 537 298 774 326; x_wconf 76' lang='eng' dir='ltr'><em>thermoacidophi/um</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 784 297 826 320; x_wconf 78' lang='eng' dir='ltr'><em>36T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 835 296 993 324; x_wconf 85' lang='eng' dir='ltr'><em>(ABO16246)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 131 344 518 372; baseline 0 -4"><span class='ocrx_word' id='word_1_40' title='bbox 131 347 154 368; x_wconf 88' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 166 347 235 368; x_wconf 90' lang='eng' dir='ltr'><em>boum</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 244 346 299 368; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 312 344 518 372; x_wconf 72' lang='eng' dir='ltr'><em>1211T(D86190)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 137 392 661 420; baseline 0 -4"><span class='ocrx_word' id='word_1_44' title='bbox 137 395 161 416; x_wconf 92' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 172 395 300 416; x_wconf 87' lang='eng' dir='ltr'><em>asteroides</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 310 394 395 416; x_wconf 90' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_47' title='bbox 407 394 500 416; x_wconf 87' lang='eng' dir='ltr'><em>24607T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 509 392 661 420; x_wconf 90' lang='eng' dir='ltr'><em>(EF187235)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 147 440 658 470; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 147 443 171 464; x_wconf 92' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 182 442 336 470; x_wconf 85' lang='eng' dir='ltr'><em>coryneforme</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 345 442 420 464; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 431 444 490 464; x_wconf 86' lang='eng'>2591</span> <span class='ocrx_word' id='word_1_53' title='bbox 500 442 523 464; x_wconf 86' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 532 440 658 468; x_wconf 88' lang='eng' dir='ltr'><em>(M58733)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 174 488 597 516; baseline 0 -4"><span class='ocrx_word' id='word_1_55' title='bbox 174 491 199 512; x_wconf 90' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 210 491 294 512; x_wconf 90' lang='eng' dir='ltr'><strong><em>bombi</em></strong></span> <span class='ocrx_word' id='word_1_57' title='bbox 303 490 431 512; x_wconf 66' lang='eng' dir='ltr'><em>BluCl/TPT</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 441 489 501 516; x_wconf 93' lang='eng' dir='ltr'>(EU1</span> <span class='ocrx_word' id='word_1_59' title='bbox 508 488 597 516; x_wconf 86' lang='eng'><em>27549)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 147 536 637 564; baseline 0 -4"><span class='ocrx_word' id='word_1_60' title='bbox 147 539 171 560; x_wconf 93' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 183 539 334 560; x_wconf 82' lang='eng' dir='ltr'><em>tsurumiense</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 343 536 637 564; x_wconf 69' lang='eng' dir='ltr'><em>OMB115T(A3241106)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 191 585 826 612; baseline 0 -4"><span class='ocrx_word' id='word_1_63' title='bbox 191 587 366 609; x_wconf 82' lang='eng' dir='ltr'><em>Parascardovia</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 376 587 519 609; x_wconf 81' lang='eng' dir='ltr'><em>dentico/ens</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 530 586 590 609; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 603 586 694 608; x_wconf 88' lang='eng' dir='ltr'><em>10105T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 703 585 826 612; x_wconf 85' lang='eng' dir='ltr'><em>(D89331)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 232 633 784 663; baseline -0.002 -6"><span class='ocrx_word' id='word_1_68' title='bbox 232 635 355 657; x_wconf 78' lang='eng' dir='ltr'><em>Scardovia</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 364 635 477 663; x_wconf 83' lang='eng' dir='ltr'><em>inopinata</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 487 635 548 657; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 561 634 652 656; x_wconf 91' lang='eng' dir='ltr'><em>10107T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 661 633 784 661; x_wconf 86' lang='eng' dir='ltr'><em>(D89332)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 202 681 709 711; baseline 0 -7"><span class='ocrx_word' id='word_1_73' title='bbox 202 683 372 705; x_wconf 83' lang='eng' dir='ltr'><em>Aeriscardovia</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 382 683 495 711; x_wconf 84' lang='eng' dir='ltr'><em>aerophila</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 504 682 546 704; x_wconf 90' lang='eng' dir='ltr'><em>T6T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 555 681 609 708; x_wconf 95' lang='eng' dir='ltr'>(AY1</span> <span class='ocrx_word' id='word_1_77' title='bbox 618 681 709 708; x_wconf 90' lang='eng'>74107)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 94 729 699 786">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 94 729 699 786">
+     <span class='ocr_line' id='line_1_16' title="bbox 117 729 699 759; baseline -0.002 -6"><span class='ocrx_word' id='word_1_78' title='bbox 117 731 261 753; x_wconf 84' lang='eng' dir='ltr'><em>Gardnerella</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 272 731 378 759; x_wconf 80' lang='eng' dir='ltr'><em>vaginal/s</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 386 731 461 753; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 473 730 564 752; x_wconf 90' lang='eng' dir='ltr'><em>14018T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 574 729 699 757; x_wconf 87' lang='eng' dir='ltr'><em>(M58744)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 94 770 119 786; baseline -0.04 0"><span class='ocrx_word' id='word_1_83' title='bbox 94 770 119 786; x_wconf 86' lang='eng'><em>0.1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 0 53 223 747">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 0 53 223 747">
+     <span class='ocr_line' id='line_1_18' title="bbox 42 53 160 194; baseline 0 0"><span class='ocrx_word' id='word_1_84' title='bbox 42 53 160 194; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 31 194 180 293; baseline 0 -48"><span class='ocrx_word' id='word_1_85' title='bbox 31 194 180 293; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 0 293 154 341; baseline 0 -11"><span class='ocrx_word' id='word_1_86' title='bbox 0 293 154 341; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 0 341 147 485; baseline 0 -51"><span class='ocrx_word' id='word_1_87' title='bbox 0 341 147 485; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 0 485 171 530; baseline 0 0"><span class='ocrx_word' id='word_1_88' title='bbox 0 485 171 530; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 0 530 223 666; baseline 0 -88"><span class='ocrx_word' id='word_1_89' title='bbox 0 530 223 666; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 0 666 202 747; baseline 0 0"><span class='ocrx_word' id='word_1_90' title='bbox 0 666 202 747; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-001.pbm.png
new file mode 100644
index 00000000..a36da84c
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-001.pbm.png.hocr
new file mode 100644
index 00000000..b371853b
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002915-0-001.pbm.png.hocr
@@ -0,0 +1,93 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002915-0-001.pbm.png"; bbox 0 0 1065 691; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 89 11 1064 690">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 156 11 622 41">
+     <span class='ocr_line' id='line_1_1' title="bbox 156 11 622 41; baseline 0 -7"><span class='ocrx_word' id='word_1_1' title='bbox 156 14 179 34; x_wconf 88' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 189 14 315 41; x_wconf 84' lang='eng' dir='ltr'><em>gallinarum</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 323 13 377 35; x_wconf 90' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 388 15 447 35; x_wconf 85' lang='eng'><em>6291</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 454 13 463 25; x_wconf 70' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_6' title='bbox 471 11 622 39; x_wconf 85' lang='eng' dir='ltr'><em>(AY004279)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 140 61 587 90">
+     <span class='ocr_line' id='line_1_2' title="bbox 140 61 587 90; baseline -0.002 -5"><span class='ocrx_word' id='word_1_7' title='bbox 140 64 163 84; x_wconf 88' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 173 64 279 90; x_wconf 89' lang='eng' dir='ltr'><em>pullorum</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 288 63 342 85; x_wconf 94' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 355 63 427 84; x_wconf 77' lang='eng' dir='ltr'><em>1214T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 436 61 587 89; x_wconf 85' lang='eng' dir='ltr'><em>(AYOO4278)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 149 111 581 139">
+     <span class='ocr_line' id='line_1_3' title="bbox 149 111 581 139; baseline 0 -5"><span class='ocrx_word' id='word_1_12' title='bbox 149 114 172 134; x_wconf 87' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 184 113 273 134; x_wconf 83' lang='eng' dir='ltr'><em>bifidum</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 282 113 336 135; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 349 113 421 134; x_wconf 78' lang='eng' dir='ltr'><em>1255T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 430 111 581 139; x_wconf 77' lang='eng' dir='ltr'><em>(AYOO4280)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 143 161 862 238">
+     <span class='ocr_line' id='line_1_4' title="bbox 143 161 862 190; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 143 164 166 184; x_wconf 90' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 178 164 395 190; x_wconf 78' lang='eng' dir='ltr'><em>thermacidophi/um</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 404 164 482 190; x_wconf 87' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 492 164 606 190; x_wconf 83' lang='eng' dir='ltr'><em>porcinum</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 617 162 702 184; x_wconf 89' lang='eng' dir='ltr'><em>P3-14T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 711 161 862 188; x_wconf 87' lang='eng' dir='ltr'><em>(AY166561)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 170 211 580 238; baseline 0 -4"><span class='ocrx_word' id='word_1_23' title='bbox 170 213 193 234; x_wconf 87' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 204 213 272 234; x_wconf 83' lang='eng' dir='ltr'><em>boum</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 281 213 335 234; x_wconf 89' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 348 211 580 238; x_wconf 66' lang='eng' dir='ltr'><em>1211T(AYOO4285)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 152 261 1064 340">
+     <span class='ocr_line' id='line_1_6' title="bbox 152 261 1064 290; baseline 0 -6"><span class='ocrx_word' id='word_1_27' title='bbox 152 263 176 284; x_wconf 92' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 188 263 420 290; x_wconf 81' lang='eng' dir='ltr'><em>thermoacidophi/um</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 429 263 507 290; x_wconf 86' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 519 263 751 290; x_wconf 79' lang='eng' dir='ltr'><em>thermoacidophi/um</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 760 263 796 284; x_wconf 86' lang='eng' dir='ltr'><em>AS</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 809 262 905 284; x_wconf 85' lang='eng' dir='ltr'><em>1.2282T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 913 261 1064 288; x_wconf 83' lang='eng' dir='ltr'><em>(AY004276)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 153 311 660 340; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 153 314 176 334; x_wconf 92' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 188 314 353 340; x_wconf 79' lang='eng' dir='ltr'><em>thermophilum</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 361 313 415 335; x_wconf 92' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 428 315 435 334; x_wconf 94' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 444 313 500 334; x_wconf 86' lang='eng' dir='ltr'><em>207T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 509 311 660 338; x_wconf 88' lang='eng' dir='ltr'><em>(AF240567)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 176 361 669 391">
+     <span class='ocr_line' id='line_1_8' title="bbox 176 361 669 391; baseline 0 -7"><span class='ocrx_word' id='word_1_40' title='bbox 176 364 199 384; x_wconf 89' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 211 363 362 391; x_wconf 81' lang='eng' dir='ltr'><em>coryneforme</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 370 363 424 384; x_wconf 92' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 435 364 477 384; x_wconf 88' lang='eng'><em>581</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 485 362 509 384; x_wconf 69' lang='eng' dir='ltr'><em>QT</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 518 361 669 388; x_wconf 83' lang='eng' dir='ltr'><em>(AY004275)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 159 411 596 438">
+     <span class='ocr_line' id='line_1_9' title="bbox 159 411 596 438; baseline 0 -4"><span class='ocrx_word' id='word_1_46' title='bbox 159 413 182 434; x_wconf 93' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 193 413 289 434; x_wconf 82' lang='eng' dir='ltr'><em>ind/cum</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 298 413 351 434; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 364 412 437 434; x_wconf 84' lang='eng' dir='ltr'><em>1302T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 445 411 596 438; x_wconf 84' lang='eng' dir='ltr'><em>(AF240574)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 164 461 630 488">
+     <span class='ocr_line' id='line_1_10' title="bbox 164 461 630 488; baseline 0 -4"><span class='ocrx_word' id='word_1_51' title='bbox 164 463 187 484; x_wconf 90' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 197 463 323 484; x_wconf 83' lang='eng' dir='ltr'><em>asteroides</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 331 463 385 484; x_wconf 93' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 396 462 470 484; x_wconf 85' lang='eng' dir='ltr'><em>8230T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 479 461 630 488; x_wconf 82' lang='eng' dir='ltr'><em>(AF240570)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 226 511 641 538">
+     <span class='ocr_line' id='line_1_11' title="bbox 226 511 641 538; baseline 0 -4"><span class='ocrx_word' id='word_1_56' title='bbox 226 513 251 534; x_wconf 89' lang='eng' dir='ltr'><em>B.</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 262 513 344 534; x_wconf 90' lang='eng' dir='ltr'><strong><em>bombi</em></strong></span> <span class='ocrx_word' id='word_1_58' title='bbox 353 512 479 534; x_wconf 73' lang='eng' dir='ltr'><em>BluCl/TPT</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 488 511 641 538; x_wconf 83' lang='eng' dir='ltr'><em>(EU869281)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 89 561 794 690">
+     <span class='ocr_line' id='line_1_12' title="bbox 188 561 794 590; baseline 0 -7"><span class='ocrx_word' id='word_1_60' title='bbox 188 563 354 584; x_wconf 82' lang='eng' dir='ltr'><em>Aeriscardov/a</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 363 563 465 590; x_wconf 81' lang='eng' dir='ltr'><em>aeriphi/a</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 475 563 533 584; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 545 564 570 583; x_wconf 86' lang='eng'>21</span> <span class='ocrx_word' id='word_1_64' title='bbox 579 562 635 584; x_wconf 90' lang='eng' dir='ltr'><em>773T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 644 561 794 588; x_wconf 87' lang='eng' dir='ltr'><em>(AY339131)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 89 611 745 638; baseline 0 -4"><span class='ocrx_word' id='word_1_66' title='bbox 89 613 260 634; x_wconf 84' lang='eng' dir='ltr'><em>Parascardovia</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 270 613 410 634; x_wconf 84' lang='eng' dir='ltr'><em>dentico/ens</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 420 613 479 634; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 491 614 571 634; x_wconf 92' lang='eng'>10105</span> <span class='ocrx_word' id='word_1_70' title='bbox 577 612 586 624; x_wconf 71' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_71' title='bbox 594 611 745 638; x_wconf 85' lang='eng' dir='ltr'><em>(AF240565)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 182 661 779 690; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 182 663 323 684; x_wconf 83' lang='eng' dir='ltr'><em>Gardnere/Ia</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 334 663 437 690; x_wconf 86' lang='eng' dir='ltr'><em>vagina/is</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 446 663 519 684; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 530 664 588 684; x_wconf 91' lang='eng'>1401</span> <span class='ocrx_word' id='word_1_76' title='bbox 596 662 620 684; x_wconf 77' lang='eng' dir='ltr'><em>BT</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 629 661 779 688; x_wconf 86' lang='eng' dir='ltr'><em>(AF240579)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 17 222 679">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 0 17 222 679">
+     <span class='ocr_line' id='line_1_15' title="bbox 98 17 151 56; baseline 0 -9"><span class='ocrx_word' id='word_1_78' title='bbox 98 17 151 56; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 94 56 145 153; baseline -0.118 0"><span class='ocrx_word' id='word_1_79' title='bbox 94 56 145 153; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 31 153 168 304; baseline 0.022 -57"><span class='ocrx_word' id='word_1_80' title='bbox 31 153 168 304; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 31 304 172 406; baseline 0 -8"><span class='ocrx_word' id='word_1_81' title='bbox 31 304 172 406; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 0 406 222 547; baseline 0 -46"><span class='ocrx_word' id='word_1_82' title='bbox 0 406 222 547; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 0 547 188 651; baseline 0.032 -53"><span class='ocrx_word' id='word_1_83' title='bbox 0 547 188 651; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 0 651 178 679; baseline 0 12"><span class='ocrx_word' id='word_1_84' title='bbox 0 651 178 679; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002931-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002931-0-000.pbm.png
new file mode 100644
index 00000000..b2910e71
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002931-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002931-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002931-0-000.pbm.png.hocr
new file mode 100644
index 00000000..4d7a9ab3
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.002931-0-000.pbm.png.hocr
@@ -0,0 +1,110 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.002931-0-000.pbm.png"; bbox 0 0 1124 1272; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 145 3 1123 314">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 145 3 1123 314">
+     <span class='ocr_line' id='line_1_1' title="bbox 311 3 865 30; baseline 0 -4"><span class='ocrx_word' id='word_1_1' title='bbox 311 5 480 26; x_wconf 74' lang='eng' dir='ltr'><em>GraCi/ibaclllus</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 490 6 636 26; x_wconf 83' lang='eng' dir='ltr'><em>haloto/erans</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 656 3 705 26; x_wconf 92' lang='eng' dir='ltr'><em>NNT</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 716 3 865 30; x_wconf 82' lang='eng' dir='ltr'>(AF036922)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 230 59 999 94; baseline 0 -11"><span class='ocrx_word' id='word_1_5' title='bbox 230 74 275 94; x_wconf 69' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 404 62 552 83; x_wconf 84' lang='eng' dir='ltr'><em>Halobac/llus</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 563 62 684 89; x_wconf 77' lang='eng' dir='ltr'><em>halophl/us</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 702 62 789 83; x_wconf 90' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 799 59 872 83; x_wconf 74' lang='eng' dir='ltr'><em>9251T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 883 60 999 87; x_wconf 85' lang='eng' dir='ltr'>(X62174)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 281 69 783 144; baseline -0.002 -4"><span class='ocrx_word' id='word_1_11' title='bbox 281 69 477 140; x_wconf 59' lang='eng' dir='ltr'><em>L—l-lal;3bazcillus</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 487 119 570 140; x_wconf 75' lang='eng' dir='ltr'><em>literal/s</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 586 116 655 140; x_wconf 88' lang='eng' dir='ltr'><em>SL—4T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 667 117 783 144; x_wconf 87' lang='eng' dir='ltr'><em>(X94558)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 145 173 1123 207; baseline 0 -11"><span class='ocrx_word' id='word_1_15' title='bbox 145 188 175 207; x_wconf 79' lang='eng'><em>74</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 453 176 612 197; x_wconf 83' lang='eng' dir='ltr'><em>Alkalibacillus</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 622 176 805 202; x_wconf 83' lang='eng' dir='ltr'><em>ha/oalkaliphilus</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 823 176 882 197; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 892 173 965 196; x_wconf 82' lang='eng' dir='ltr'><em>5271T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 979 174 1123 201; x_wconf 82' lang='eng' dir='ltr'>(AJ238041)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 301 230 927 264; baseline 0 -11"><span class='ocrx_word' id='word_1_21' title='bbox 301 245 346 264; x_wconf 76' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 426 233 521 253; x_wconf 86' lang='eng' dir='ltr'><em>Bacillus</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 531 233 615 253; x_wconf 82' lang='eng' dir='ltr'><em>subtllis</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 628 233 709 253; x_wconf 91' lang='eng' dir='ltr'><em>NCDO</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 721 230 796 253; x_wconf 82' lang='eng' dir='ltr'><em>1769T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 810 230 927 257; x_wconf 88' lang='eng' dir='ltr'>(X60646)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 350 239 946 314; baseline -0.002 -3"><span class='ocrx_word' id='word_1_27' title='bbox 350 239 406 300; x_wconf 84' lang='eng' dir='ltr'>I:</span> <span class='ocrx_word' id='word_1_28' title='bbox 430 290 525 311; x_wconf 71' lang='eng' dir='ltr'><em>Bacillus</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 534 289 687 311; x_wconf 73' lang='eng' dir='ltr'><em>lichenilormls</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 702 289 760 311; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 772 286 815 310; x_wconf 79' lang='eng' dir='ltr'><em>13T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 829 288 946 314; x_wconf 88' lang='eng' dir='ltr'>(X68416)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 90 338 1040 373">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 90 338 1040 373">
+     <span class='ocr_line' id='line_1_7' title="bbox 90 338 1040 373; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 90 338 115 358; x_wconf 74' lang='eng'>71</span> <span class='ocrx_word' id='word_1_34' title='bbox 501 347 644 373; x_wconf 85' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 653 347 779 373; x_wconf 79' lang='eng' dir='ltr'><em>salexigens</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 797 344 907 368; x_wconf 84' lang='eng' dir='ltr'><em>C-20MoT</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 924 344 1040 371; x_wconf 87' lang='eng' dir='ltr'>(Y11603)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 207 349 479 389">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 207 349 479 389">
+     <span class='ocr_line' id='line_1_8' title="bbox 207 349 479 389; baseline 0 883"><span class='ocrx_word' id='word_1_38' title='bbox 207 349 479 389; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 176 400 785 435">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 176 400 785 435">
+     <span class='ocr_line' id='line_1_9' title="bbox 176 400 785 435; baseline 0 -11"><span class='ocrx_word' id='word_1_39' title='bbox 176 416 206 435; x_wconf 78' lang='eng'>55</span> <span class='ocrx_word' id='word_1_40' title='bbox 230 415 275 435; x_wconf 72' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 309 404 451 430; x_wconf 81' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 461 404 529 424; x_wconf 81' lang='eng' dir='ltr'><em>olivae</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 548 400 613 430; x_wconf 64' lang='eng' dir='ltr'><em>E308T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 626 401 785 428; x_wconf 83' lang='eng' dir='ltr'>(DQ139839)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 278 410 283 499">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 278 410 283 499">
+     <span class='ocr_line' id='line_1_10' title="bbox 278 410 283 499; baseline 0 773"><span class='ocrx_word' id='word_1_45' title='bbox 278 410 283 499; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 109 457 1002 727">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 109 457 1002 727">
+     <span class='ocr_line' id='line_1_11' title="bbox 309 457 838 487; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 309 460 451 487; x_wconf 80' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 461 460 552 481; x_wconf 82' lang='eng' dir='ltr'><em>salarius</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 572 457 675 481; x_wconf 56' lang='eng' dir='ltr'><em>SA»Vb1T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 685 458 838 485; x_wconf 86' lang='eng' dir='ltr'>(AB197851)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 284 468 839 544; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 284 468 288 527; x_wconf 79' lang='eng' dir='ltr'>I</span> <span class='ocrx_word' id='word_1_51' title='bbox 312 517 454 544; x_wconf 80' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 464 517 606 538; x_wconf 80' lang='eng' dir='ltr'><em>marlsmortui</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 621 514 678 538; x_wconf 83' lang='eng' dir='ltr'><em>123T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 695 515 839 542; x_wconf 84' lang='eng' dir='ltr'>(AJ009793)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 109 564 939 601; baseline 0 -7"><span class='ocrx_word' id='word_1_55' title='bbox 109 564 135 583; x_wconf 73' lang='eng'><em>5‘</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 362 574 505 601; x_wconf 84' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 513 574 605 601; x_wconf 82' lang='eng' dir='ltr'><em>proomii</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 621 574 677 595; x_wconf 86' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 690 571 781 594; x_wconf 84' lang='eng' dir='ltr'><em>1237oT</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 794 572 939 599; x_wconf 85' lang='eng' dir='ltr'>(AJO12667)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 212 580 1002 670; baseline -0.001 -18"><span class='ocrx_word' id='word_1_61' title='bbox 212 580 336 670; x_wconf 43' lang='eng'><em>86?</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 359 631 502 658; x_wconf 83' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 510 631 688 658; x_wconf 82' lang='eng' dir='ltr'><em>pantothenticus</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 706 631 787 652; x_wconf 92' lang='eng' dir='ltr'><em>NCDO</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 799 628 872 651; x_wconf 88' lang='eng' dir='ltr'><em>1765T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 886 629 1002 656; x_wconf 86' lang='eng' dir='ltr'>(X60627)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 161 638 984 727; baseline 0 -19"><span class='ocrx_word' id='word_1_67' title='bbox 161 700 191 719; x_wconf 71' lang='eng'><em>87</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 261 638 343 727; x_wconf 62' lang='eng'>991:</span> <span class='ocrx_word' id='word_1_69' title='bbox 375 688 518 715; x_wconf 81' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 527 688 681 709; x_wconf 80' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 700 685 984 713; x_wconf 72' lang='eng' dir='ltr'>DSW—1OT(AY822043)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 295 695 965 828">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 295 695 965 828">
+     <span class='ocr_line' id='line_1_16' title="bbox 295 695 944 771; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 295 695 349 753; x_wconf 67' lang='eng'><em>100&#39;</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 369 745 511 771; x_wconf 82' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 521 745 650 771; x_wconf 82' lang='eng' dir='ltr'><em>chiguensls</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 669 742 782 766; x_wconf 72' lang='eng' dir='ltr'>NTU1O1T</span> <span class='ocrx_word' id='word_1_76' title='bbox 796 742 944 769; x_wconf 89' lang='eng' dir='ltr'>(EF101168)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 400 798 965 828; baseline 0 -6"><span class='ocrx_word' id='word_1_77' title='bbox 400 802 543 828; x_wconf 81' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 552 802 674 828; x_wconf 85' lang='eng' dir='ltr'><em>halophilus</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 693 798 794 822; x_wconf 78' lang='eng' dir='ltr'><em>5B73CT</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 811 799 965 826; x_wconf 73' lang='eng' dir='ltr'>(ABQ43851)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 258 913 1029 954">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 258 853 1029 942">
+     <span class='ocr_line' id='line_1_18' title="bbox 258 853 1029 890; baseline 0 -11"><span class='ocrx_word' id='word_1_81' title='bbox 258 870 304 890; x_wconf 74' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 418 856 608 885; x_wconf 88' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 618 856 742 879; x_wconf 86' lang='eng' dir='ltr'><em>arcticus</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 758 856 805 879; x_wconf 88' lang='eng' dir='ltr'><em>Hal</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 820 853 846 879; x_wconf 93' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 864 853 1029 884; x_wconf 85' lang='eng' dir='ltr'><em>(EF675742)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 366 913 984 942; baseline 0 -6"><span class='ocrx_word' id='word_1_87' title='bbox 366 916 508 942; x_wconf 73' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 518 916 642 942; x_wconf 81' lang='eng' dir='ltr'><em>necropolis</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 661 915 717 936; x_wconf 87' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 730 913 823 936; x_wconf 83' lang='eng' dir='ltr'><em>19488T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 840 913 984 940; x_wconf 75' lang='eng' dir='ltr'>(N315056)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 117 932 1000 999">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 117 932 1000 999">
+     <span class='ocr_line' id='line_1_20' title="bbox 117 932 148 951; baseline 0 0"><span class='ocrx_word' id='word_1_92' title='bbox 117 932 148 951; x_wconf 82' lang='eng'>53</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 294 959 1000 999; baseline 0 -6"><span class='ocrx_word' id='word_1_93' title='bbox 294 959 320 978; x_wconf 75' lang='eng'>91</span> <span class='ocrx_word' id='word_1_94' title='bbox 353 972 495 999; x_wconf 74' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 505 972 658 993; x_wconf 81' lang='eng' dir='ltr'><em>carmonensis</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 679 972 736 993; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 748 969 839 993; x_wconf 79' lang='eng' dir='ltr'><em>20964T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 856 970 1000 997; x_wconf 84' lang='eng' dir='ltr'>(AJ316302)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 312 1026 1031 1169">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 312 1026 1031 1169">
+     <span class='ocr_line' id='line_1_22' title="bbox 337 1026 940 1056; baseline -0.002 -6"><span class='ocrx_word' id='word_1_99' title='bbox 337 1029 480 1056; x_wconf 77' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 489 1029 593 1050; x_wconf 87' lang='eng' dir='ltr'><em>kekensis</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 612 1026 771 1056; x_wconf 91' lang='eng' dir='ltr'><em>YIM—kkny16T</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 788 1027 841 1054; x_wconf 93' lang='eng' dir='ltr'>(AY1</span> <span class='ocrx_word' id='word_1_103' title='bbox 851 1027 940 1054; x_wconf 80' lang='eng'>21439)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 312 1083 1031 1111; baseline 0.003 -8"><span class='ocrx_word' id='word_1_104' title='bbox 312 1083 454 1109; x_wconf 83' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 464 1083 661 1103; x_wconf 75' lang='eng' dir='ltr'><em>halodenitrificans</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 681 1086 756 1107; x_wconf 85' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 766 1083 861 1106; x_wconf 79' lang='eng' dir='ltr'><em>49067T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 878 1084 1031 1111; x_wconf 82' lang='eng' dir='ltr'>(AB021186)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 312 1140 900 1169; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 312 1143 454 1169; x_wconf 78' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 464 1143 579 1163; x_wconf 84' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 599 1140 732 1163; x_wconf 79' lang='eng' dir='ltr'><em>BH30097T</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 749 1141 869 1168; x_wconf 87' lang='eng' dir='ltr'>(AY61601</span> <span class='ocrx_word' id='word_1_113' title='bbox 878 1141 900 1167; x_wconf 87' lang='eng'>2)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 44 1220 98 1239">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 44 1220 98 1239">
+     <span class='ocr_line' id='line_1_25' title="bbox 44 1220 98 1239; baseline 0 0"><span class='ocrx_word' id='word_1_114' title='bbox 44 1220 98 1239; x_wconf 85' lang='eng'>0.02</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003046-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003046-0-000.pbm.png
new file mode 100644
index 00000000..23a0962a
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003046-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003046-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003046-0-000.pbm.png.hocr
new file mode 100644
index 00000000..aa1a3326
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003046-0-000.pbm.png.hocr
@@ -0,0 +1,96 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003046-0-000.pbm.png"; bbox 0 0 1183 1228; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 55 2 1182 1227">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 55 2 1182 1227">
+     <span class='ocr_line' id='line_1_1' title="bbox 491 2 1054 31; baseline 0 -5"><span class='ocrx_word' id='word_1_1' title='bbox 491 10 531 27; x_wconf 87' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 552 4 577 26; x_wconf 92' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 589 4 759 26; x_wconf 82' lang='eng' dir='ltr'><em>mumbaiensis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 769 2 1054 31; x_wconf 50' lang='eng' dir='ltr'><em>CON—17(DQOO3135)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 302 33 994 67; baseline 0 -5"><span class='ocrx_word' id='word_1_5' title='bbox 302 33 329 50; x_wconf 66' lang='eng'><em>42</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 552 41 577 62; x_wconf 92' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 589 40 649 62; x_wconf 86' lang='eng' dir='ltr'><em>ficus</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 659 38 994 67; x_wconf 57' lang='eng' dir='ltr'><em>CC—FR2—1OT(AY941086)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 55 73 899 105; baseline 0.001 -8"><span class='ocrx_word' id='word_1_9' title='bbox 55 87 191 104; x_wconf 51' lang='eng'><em>,—.</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 273 73 297 90; x_wconf 70' lang='eng'>41</span> <span class='ocrx_word' id='word_1_11' title='bbox 471 77 495 98; x_wconf 92' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 506 77 601 105; x_wconf 83' lang='eng' dir='ltr'><em>grand/s</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 613 76 675 99; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 686 74 899 103; x_wconf 69' lang='eng' dir='ltr'><em>3963T(Y11329)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 98 110 1025 139; baseline 0.001 -5"><span class='ocrx_word' id='word_1_15' title='bbox 98 111 145 129; x_wconf 69' lang='eng'><em>0-09</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 521 113 546 134; x_wconf 90' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 558 113 710 135; x_wconf 85' lang='eng' dir='ltr'><em>radiodurans</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 721 112 783 135; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 796 112 891 135; x_wconf 78' lang='eng' dir='ltr'><em>20539T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 901 110 939 139; x_wconf 89' lang='eng' dir='ltr'>(Y1</span> <span class='ocrx_word' id='word_1_21' title='bbox 950 110 1025 139; x_wconf 85' lang='eng'>1332)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 254 137 872 175; baseline 0.006 -8"><span class='ocrx_word' id='word_1_22' title='bbox 254 137 281 155; x_wconf 73' lang='eng'><em>48</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 349 151 375 168; x_wconf 72' lang='eng'><em>87</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 479 149 504 170; x_wconf 92' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 516 149 608 171; x_wconf 85' lang='eng' dir='ltr'><em>indicus</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 617 146 872 175; x_wconf 68' lang='eng' dir='ltr'><em>Wt/1aT(AJ549111)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 432 183 857 212; baseline 0 -5"><span class='ocrx_word' id='word_1_27' title='bbox 432 185 457 207; x_wconf 93' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 469 185 637 207; x_wconf 79' lang='eng' dir='ltr'><em>desert/VCD1</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 648 184 689 207; x_wconf 90' lang='eng' dir='ltr'><em>15T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 699 183 857 212; x_wconf 87' lang='eng' dir='ltr'><em>(AY876378)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 227 219 975 249; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 227 229 253 246; x_wconf 76' lang='eng'>27</span> <span class='ocrx_word' id='word_1_32' title='bbox 300 232 325 249; x_wconf 80' lang='eng'>73</span> <span class='ocrx_word' id='word_1_33' title='bbox 479 221 504 243; x_wconf 97' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 516 221 701 243; x_wconf 80' lang='eng' dir='ltr'><em>hohokamensis</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 712 220 805 243; x_wconf 87' lang='eng' dir='ltr'><em>KR-40T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 815 219 975 248; x_wconf 84' lang='eng' dir='ltr'><em>(AY743256)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 374 255 950 286; baseline 0 -7"><span class='ocrx_word' id='word_1_37' title='bbox 374 255 401 273; x_wconf 75' lang='eng'><em>95</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 413 265 462 266; x_wconf 38' lang='eng' dir='ltr'><em>i</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 472 257 497 279; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 509 257 659 286; x_wconf 83' lang='eng' dir='ltr'><em>navajonesis</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 670 258 730 279; x_wconf 92' lang='eng' dir='ltr'>KR—1</span> <span class='ocrx_word' id='word_1_42' title='bbox 740 256 781 279; x_wconf 79' lang='eng' dir='ltr'><em>14T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 791 255 950 284; x_wconf 87' lang='eng' dir='ltr'><em>(AY743259)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 531 291 1035 323; baseline 0 -7"><span class='ocrx_word' id='word_1_44' title='bbox 531 294 556 316; x_wconf 95' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 565 294 726 323; x_wconf 80' lang='eng' dir='ltr'><em>yunweiensis</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 736 294 784 316; x_wconf 93' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 796 293 856 316; x_wconf 90' lang='eng' dir='ltr'><em>007T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 866 291 1035 320; x_wconf 84' lang='eng' dir='ltr'><em>(D0344634)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 506 328 956 358; baseline 0 -6"><span class='ocrx_word' id='word_1_49' title='bbox 506 330 531 352; x_wconf 93' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 543 330 665 358; x_wconf 86' lang='eng' dir='ltr'><em>hopiensis</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 676 329 787 352; x_wconf 65' lang='eng' dir='ltr'><em>KFl-140T</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 797 328 956 356; x_wconf 86' lang='eng' dir='ltr'><em>(AY743262)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 504 364 1179 394; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 504 372 531 389; x_wconf 83' lang='eng'>39</span> <span class='ocrx_word' id='word_1_54' title='bbox 640 366 665 388; x_wconf 96' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 677 366 851 394; x_wconf 82' lang='eng' dir='ltr'><em>rad/opugnans</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 861 366 939 389; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 951 364 1179 393; x_wconf 50' lang='eng' dir='ltr'><em>191727(Y11334)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 602 400 1024 429; baseline 0 -5"><span class='ocrx_word' id='word_1_58' title='bbox 602 402 627 424; x_wconf 95' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 639 402 757 424; x_wconf 84' lang='eng' dir='ltr'><em>marmoris</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 767 401 861 424; x_wconf 86' lang='eng' dir='ltr'><em>AA—63T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 870 400 1024 429; x_wconf 88' lang='eng' dir='ltr'><em>(AJ585986)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 493 436 1037 467; baseline 0.006 -9"><span class='ocrx_word' id='word_1_62' title='bbox 493 441 519 458; x_wconf 81' lang='eng'>99</span> <span class='ocrx_word' id='word_1_63' title='bbox 629 439 654 460; x_wconf 92' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 666 438 752 467; x_wconf 84' lang='eng' dir='ltr'><em>frigens</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 761 438 873 461; x_wconf 70' lang='eng' dir='ltr'><em>AA—692T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 883 436 1037 465; x_wconf 86' lang='eng' dir='ltr'><em>(AJ585981)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 149 472 1069 501; baseline 0.001 -5"><span class='ocrx_word' id='word_1_67' title='bbox 149 483 171 500; x_wconf 76' lang='eng'>21</span> <span class='ocrx_word' id='word_1_68' title='bbox 532 474 558 492; x_wconf 72' lang='eng'><em>56</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 627 475 652 496; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 664 475 765 497; x_wconf 80' lang='eng' dir='ltr'><em>saxicola</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 775 474 905 496; x_wconf 89' lang='eng' dir='ltr'><em>AA-1444T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 915 472 1069 501; x_wconf 84' lang='eng' dir='ltr'><em>(AJ585984)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 491 508 867 539; baseline 0.003 -7"><span class='ocrx_word' id='word_1_73' title='bbox 491 511 516 532; x_wconf 95' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 528 510 733 539; x_wconf 73' lang='eng' dir='ltr'><em>murrayiALT—1bT</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 743 508 867 537; x_wconf 83' lang='eng' dir='ltr'><em>(Y13041)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 250 545 959 575; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 250 558 277 575; x_wconf 75' lang='eng'><em>80</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 518 547 542 569; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 553 547 719 575; x_wconf 84' lang='eng' dir='ltr'><em>geotherma/is</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 728 546 825 569; x_wconf 63' lang='eng' dir='ltr'><em>ACE-3aT</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 835 545 959 574; x_wconf 87' lang='eng' dir='ltr'>(Y13038)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 321 581 998 612; baseline 0.006 -10"><span class='ocrx_word' id='word_1_81' title='bbox 321 584 348 602; x_wconf 89' lang='eng'><em>80</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 543 583 568 605; x_wconf 97' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 579 583 725 612; x_wconf 85' lang='eng' dir='ltr'><em>apachensis</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 736 582 829 606; x_wconf 80' lang='eng' dir='ltr'><em>KR-36T</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 838 581 998 610; x_wconf 86' lang='eng' dir='ltr'><em>(AY743264)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 466 617 1113 648; baseline 0.002 -8"><span class='ocrx_word' id='word_1_86' title='bbox 466 623 506 640; x_wconf 89' lang='eng'>100</span> <span class='ocrx_word' id='word_1_87' title='bbox 598 620 623 641; x_wconf 95' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 633 620 798 648; x_wconf 80' lang='eng' dir='ltr'><em>proteolyticus</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 809 620 871 642; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 883 619 979 642; x_wconf 78' lang='eng' dir='ltr'><em>20540T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 989 617 1027 646; x_wconf 92' lang='eng' dir='ltr'>(Y1</span> <span class='ocrx_word' id='word_1_92' title='bbox 1037 617 1113 646; x_wconf 85' lang='eng'>1331)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 113 649 933 683; baseline 0.001 -6"><span class='ocrx_word' id='word_1_93' title='bbox 113 652 140 670; x_wconf 85' lang='eng'><em>40</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 352 649 391 666; x_wconf 78' lang='eng'><em>‘00</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 574 656 601 677; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 611 656 691 683; x_wconf 87' lang='eng' dir='ltr'><em>piscis</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 701 655 758 678; x_wconf 77' lang='eng' dir='ltr'><em>saxT</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 768 653 933 682; x_wconf 82' lang='eng' dir='ltr'><em>(D0683348)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 513 690 1005 720; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 513 692 538 714; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 550 692 690 720; x_wconf 83' lang='eng' dir='ltr'><em>radiophi/us</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 702 692 764 714; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 776 693 855 714; x_wconf 83' lang='eng'>20551</span> <span class='ocrx_word' id='word_1_103' title='bbox 863 691 871 703; x_wconf 54' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 881 690 920 718; x_wconf 91' lang='eng' dir='ltr'>(Y1</span> <span class='ocrx_word' id='word_1_105' title='bbox 930 690 1005 718; x_wconf 86' lang='eng'>1333)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 496 726 1058 755; baseline 0 -5"><span class='ocrx_word' id='word_1_106' title='bbox 496 728 521 750; x_wconf 96' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 533 728 672 750; x_wconf 85' lang='eng' dir='ltr'><em>radiomo/lis</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 683 727 890 750; x_wconf 86' lang='eng' dir='ltr'><em>PO-O4-20-132T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 901 726 1058 755; x_wconf 87' lang='eng' dir='ltr'><em>(EF635404)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 357 762 1071 791; baseline 0 -5"><span class='ocrx_word' id='word_1_110' title='bbox 357 772 384 789; x_wconf 83' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 518 764 543 786; x_wconf 96' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 555 764 685 786; x_wconf 77' lang='eng' dir='ltr'><em>c/aud/onis</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 696 763 904 787; x_wconf 75' lang='eng' dir='ltr'><em>PO—04—19—125T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 914 762 1071 791; x_wconf 88' lang='eng' dir='ltr'><em>(EF635406)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 412 798 1001 827; baseline 0 -5"><span class='ocrx_word' id='word_1_115' title='bbox 412 799 439 816; x_wconf 82' lang='eng'><em>92</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 521 801 546 822; x_wconf 88' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 557 801 680 822; x_wconf 81' lang='eng' dir='ltr'><em>altitudinis</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 691 800 834 822; x_wconf 86' lang='eng' dir='ltr'><em>ME-o4-32T</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 844 798 1001 827; x_wconf 86' lang='eng' dir='ltr'><em>(EF635407)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 418 834 867 863; baseline 0 -5"><span class='ocrx_word' id='word_1_120' title='bbox 418 837 443 858; x_wconf 93' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 455 837 595 859; x_wconf 85' lang='eng' dir='ltr'><em>sonorensis</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 606 836 699 859; x_wconf 89' lang='eng' dir='ltr'><em>KR-87T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 709 834 867 863; x_wconf 82' lang='eng' dir='ltr'><em>(AY743283)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 56 862 968 901; baseline 0.001 -8"><span class='ocrx_word' id='word_1_124' title='bbox 56 862 83 880; x_wconf 70' lang='eng'>36</span> <span class='ocrx_word' id='word_1_125' title='bbox 491 873 516 894; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 528 873 698 901; x_wconf 84' lang='eng' dir='ltr'><em>maricopensis</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 709 872 799 895; x_wconf 73' lang='eng' dir='ltr'><em>LB-34T</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 809 871 968 899; x_wconf 87' lang='eng' dir='ltr'>(AY743274)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 95 907 970 942; baseline 0 -11"><span class='ocrx_word' id='word_1_129' title='bbox 95 924 122 942; x_wconf 72' lang='eng'>34</span> <span class='ocrx_word' id='word_1_130' title='bbox 479 910 504 931; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 514 909 681 938; x_wconf 82' lang='eng' dir='ltr'><em>peraridi/itoris</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 692 908 802 931; x_wconf 79' lang='eng' dir='ltr'><em>KR—200T</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 812 907 970 936; x_wconf 88' lang='eng' dir='ltr'><em>(EF141348)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 154 943 947 976; baseline 0 -9"><span class='ocrx_word' id='word_1_134' title='bbox 154 959 180 976; x_wconf 72' lang='eng'><em>69</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 506 946 531 967; x_wconf 97' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 541 946 656 974; x_wconf 84' lang='eng' dir='ltr'><em>pimensis</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 667 945 778 968; x_wconf 78' lang='eng' dir='ltr'><em>KR—235T</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 788 943 947 972; x_wconf 85' lang='eng' dir='ltr'><em>(AY743277)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 194 979 1042 1010; baseline 0 -7"><span class='ocrx_word' id='word_1_139' title='bbox 194 991 220 1008; x_wconf 73' lang='eng'><em>62</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 551 982 576 1003; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 585 982 751 1010; x_wconf 83' lang='eng' dir='ltr'><em>yavapaiensis</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 762 981 873 1004; x_wconf 77' lang='eng' dir='ltr'><em>KR-236T</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 882 979 1042 1008; x_wconf 83' lang='eng' dir='ltr'><em>(AY743279)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 230 1015 1074 1046; baseline 0.001 -7"><span class='ocrx_word' id='word_1_144' title='bbox 230 1015 257 1033; x_wconf 74' lang='eng'><em>60</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 568 1018 593 1039; x_wconf 96' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 604 1018 784 1046; x_wconf 82' lang='eng' dir='ltr'><em>papagonensis</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 795 1017 906 1040; x_wconf 88' lang='eng' dir='ltr'><em>KR-241T</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 915 1015 1074 1044; x_wconf 88' lang='eng' dir='ltr'><em>(AY743280)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 445 1052 1007 1083; baseline 0 -7"><span class='ocrx_word' id='word_1_149' title='bbox 445 1066 485 1083; x_wconf 70' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 536 1054 561 1076; x_wconf 96' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 573 1061 658 1076; x_wconf 89' lang='eng' dir='ltr'><em>roseus</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 667 1053 834 1076; x_wconf 78' lang='eng' dir='ltr'><em>TDMA-uv51T</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 844 1052 1007 1080; x_wconf 75' lang='eng' dir='ltr'><em>(ABQ64136)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 595 1088 1162 1119; baseline 0 -7"><span class='ocrx_word' id='word_1_154' title='bbox 595 1090 620 1112; x_wconf 93' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 633 1090 819 1119; x_wconf 82' lang='eng' dir='ltr'><em>cellulosilyticus</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 829 1091 874 1112; x_wconf 87' lang='eng'><em>551</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 884 1089 983 1112; x_wconf 76' lang='eng' dir='ltr'><em>161-15T</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 993 1088 1162 1117; x_wconf 83' lang='eng' dir='ltr'><em>(D0883809)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 481 1124 1053 1153; baseline 0 -5"><span class='ocrx_word' id='word_1_159' title='bbox 481 1127 507 1145; x_wconf 91' lang='eng'><em>75</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 519 1138 546 1139; x_wconf 0' lang='eng'><em></em></span> <span class='ocrx_word' id='word_1_161' title='bbox 555 1126 580 1148; x_wconf 96' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 592 1126 733 1148; x_wconf 78' lang='eng' dir='ltr'><em>misasens/s</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 742 1125 880 1148; x_wconf 86' lang='eng' dir='ltr'><em>TDMA-25T</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 890 1124 1053 1153; x_wconf 90' lang='eng' dir='ltr'><em>(AB264135)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 533 1160 1103 1191; baseline 0 -7"><span class='ocrx_word' id='word_1_165' title='bbox 533 1163 558 1184; x_wconf 94' lang='eng' dir='ltr'><em>D.</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 569 1163 735 1191; x_wconf 83' lang='eng' dir='ltr'><em>alpinitundrae</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 746 1161 936 1184; x_wconf 86' lang='eng' dir='ltr'><em>ME—O4—04—52T</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 946 1160 1103 1189; x_wconf 84' lang='eng' dir='ltr'><em>(EF635408)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 638 1196 1182 1227; baseline 0 -6"><span class='ocrx_word' id='word_1_169' title='bbox 638 1199 746 1227; x_wconf 80' lang='eng' dir='ltr'><em>Truepera</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 756 1199 896 1221; x_wconf 81' lang='eng' dir='ltr'><em>radiovictr/X</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 905 1198 1003 1221; x_wconf 85' lang='eng' dir='ltr'><em>RO-24T</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 1013 1196 1182 1225; x_wconf 82' lang='eng' dir='ltr'>(D0022076)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 246 353 303 409">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 246 353 303 409">
+     <span class='ocr_line' id='line_1_35' title="bbox 246 353 271 371; baseline 0.04 -1"><span class='ocrx_word' id='word_1_173' title='bbox 246 353 271 371; x_wconf 84' lang='eng'>16</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 276 392 303 409; baseline 0 0"><span class='ocrx_word' id='word_1_174' title='bbox 276 392 303 409; x_wconf 86' lang='eng'>46</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003053-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003053-0-000.pbm.png
new file mode 100644
index 00000000..757c0a22
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003053-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003053-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003053-0-000.pbm.png.hocr
new file mode 100644
index 00000000..d5b7da62
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003053-0-000.pbm.png.hocr
@@ -0,0 +1,163 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003053-0-000.pbm.png"; bbox 0 0 1243 1493; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 184 4 1243 1490">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 184 4 235 22">
+     <span class='ocr_line' id='line_1_1' title="bbox 184 4 235 22; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 184 4 214 22; x_wconf 89' lang='eng'>0.1</span> <span class='ocrx_word' id='word_1_2' title='bbox 221 4 235 22; x_wconf 88' lang='eng'>0</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 406 36 1163 278">
+     <span class='ocr_line' id='line_1_2' title="bbox 406 36 1163 67; baseline 0 -5"><span class='ocrx_word' id='word_1_3' title='bbox 406 49 422 67; x_wconf 75' lang='eng'><strong><em>.</em></strong></span> <span class='ocrx_word' id='word_1_4' title='bbox 442 39 654 62; x_wconf 84' lang='eng' dir='ltr'><em>Allochromatium</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 665 39 851 62; x_wconf 84' lang='eng' dir='ltr'><em>minutissimum</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 863 39 928 62; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 942 36 1163 66; x_wconf 70' lang='eng' dir='ltr'>1376T(Y12369)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 439 78 1109 108; baseline -0.001 -4"><span class='ocrx_word' id='word_1_8' title='bbox 439 81 651 104; x_wconf 87' lang='eng' dir='ltr'><em>Allochromatium</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 664 81 774 104; x_wconf 87' lang='eng' dir='ltr'><em>vinosum</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 785 80 851 104; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 865 79 927 103; x_wconf 90' lang='eng' dir='ltr'><em>180T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 937 78 1000 108; x_wconf 93' lang='eng' dir='ltr'><em>(FM1</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1010 78 1109 108; x_wconf 86' lang='eng'>78268)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 500 120 1145 152; baseline 0 -7"><span class='ocrx_word' id='word_1_14' title='bbox 500 123 712 146; x_wconf 82' lang='eng' dir='ltr'><em>Al/ochromatium</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 724 123 854 152; x_wconf 76' lang='eng' dir='ltr'><em>warming/&#39;1&#39;</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 864 122 928 146; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 942 124 950 145; x_wconf 97' lang='eng'>1</span> <span class='ocrx_word' id='word_1_18' title='bbox 960 121 1004 145; x_wconf 84' lang='eng' dir='ltr'><em>73T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1014 120 1145 150; x_wconf 88' lang='eng' dir='ltr'>(Y12365)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 461 162 1083 192; baseline 0 -5"><span class='ocrx_word' id='word_1_20' title='bbox 461 165 673 187; x_wconf 85' lang='eng' dir='ltr'><em>Allochromatium</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 684 165 790 187; x_wconf 85' lang='eng' dir='ltr'><em>renukae</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 800 163 897 187; x_wconf 89' lang='eng' dir='ltr'><em>JA136T</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 907 162 1083 192; x_wconf 86' lang='eng' dir='ltr'>(AM399029)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 460 204 1030 236; baseline 0 -7"><span class='ocrx_word' id='word_1_24' title='bbox 460 206 591 236; x_wconf 86' lang='eng' dir='ltr'><em>Thiocystis</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 600 206 738 236; x_wconf 82' lang='eng' dir='ltr'><em>gelatinosa</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 750 206 814 229; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 827 207 855 229; x_wconf 92' lang='eng'>21</span> <span class='ocrx_word' id='word_1_28' title='bbox 864 205 890 229; x_wconf 69' lang='eng' dir='ltr'>ST</span> <span class='ocrx_word' id='word_1_29' title='bbox 900 204 940 234; x_wconf 93' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 951 207 996 229; x_wconf 89' lang='eng'>131</span> <span class='ocrx_word' id='word_1_31' title='bbox 1006 204 1030 234; x_wconf 92' lang='eng'><em>7)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 462 245 973 278; baseline 0 -7"><span class='ocrx_word' id='word_1_32' title='bbox 462 248 594 278; x_wconf 83' lang='eng' dir='ltr'><em>Thiocystis</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 604 248 682 271; x_wconf 80' lang='eng' dir='ltr'><em>minor</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 691 248 756 271; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 770 249 778 271; x_wconf 98' lang='eng'>1</span> <span class='ocrx_word' id='word_1_36' title='bbox 788 247 833 271; x_wconf 84' lang='eng' dir='ltr'><em>78T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 842 246 882 276; x_wconf 94' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 892 245 973 276; x_wconf 89' lang='eng'>2372)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 440 288 1076 445">
+     <span class='ocr_line' id='line_1_8' title="bbox 459 288 1003 320; baseline 0 -7"><span class='ocrx_word' id='word_1_39' title='bbox 459 290 591 320; x_wconf 83' lang='eng' dir='ltr'><em>Thiocystis</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 602 290 710 313; x_wconf 85' lang='eng' dir='ltr'><em>vio/acea</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 722 289 787 313; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 799 288 863 313; x_wconf 90' lang='eng' dir='ltr'><em>207T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 873 288 913 317; x_wconf 91' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 923 288 1003 317; x_wconf 90' lang='eng'>1315)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 486 329 1034 359; baseline 0 -4"><span class='ocrx_word' id='word_1_45' title='bbox 486 332 650 355; x_wconf 80' lang='eng' dir='ltr'><em>Chromatium</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 661 332 742 355; x_wconf 84' lang='eng' dir='ltr'><em>okeni/</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 752 332 817 355; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 831 331 893 355; x_wconf 87' lang='eng' dir='ltr'><em>169T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 903 329 1034 359; x_wconf 93' lang='eng' dir='ltr'>(Y12376)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 440 371 1076 403; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 440 374 574 403; x_wconf 88' lang='eng' dir='ltr'><em>Thiocapsa</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 585 374 783 403; x_wconf 84' lang='eng' dir='ltr'><em>roseopersicina</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 793 374 858 397; x_wconf 93' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 871 375 899 397; x_wconf 96' lang='eng'>21</span> <span class='ocrx_word' id='word_1_54' title='bbox 909 371 1076 401; x_wconf 73' lang='eng' dir='ltr'>7T(Y12364)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 446 413 999 445; baseline -0.002 -6"><span class='ocrx_word' id='word_1_55' title='bbox 446 416 580 445; x_wconf 87' lang='eng' dir='ltr'><em>Thiocapsa</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 591 423 664 439; x_wconf 85' lang='eng' dir='ltr'><em>rosea</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 675 415 740 439; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 753 413 999 443; x_wconf 76' lang='eng' dir='ltr'>235T(FM178269)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 385 455 1236 778">
+     <span class='ocr_line' id='line_1_12' title="bbox 446 455 1034 487; baseline 0 -7"><span class='ocrx_word' id='word_1_59' title='bbox 446 458 580 487; x_wconf 85' lang='eng' dir='ltr'><em>Thiocapsa</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 591 458 680 480; x_wconf 83' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 692 457 757 481; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 769 456 852 480; x_wconf 84' lang='eng' dir='ltr'><em>5653T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 862 455 925 485; x_wconf 93' lang='eng' dir='ltr'><em>(FM1</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 935 455 1034 485; x_wconf 87' lang='eng'>78270)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 517 497 1236 529; baseline 0 -7"><span class='ocrx_word' id='word_1_65' title='bbox 517 499 721 529; x_wconf 85' lang='eng' dir='ltr'><em>Thio/amprovum</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 731 499 884 529; x_wconf 80' lang='eng' dir='ltr'><em>pedioforme</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 895 499 960 522; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 972 498 1055 522; x_wconf 90' lang='eng' dir='ltr'><em>3802T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1065 497 1128 527; x_wconf 88' lang='eng' dir='ltr'><em>(FM1</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1138 497 1236 527; x_wconf 89' lang='eng'>78271)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 443 539 934 571; baseline 0 -7"><span class='ocrx_word' id='word_1_71' title='bbox 443 541 563 564; x_wconf 82' lang='eng' dir='ltr'><em>Thiobaca</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 575 541 677 571; x_wconf 84' lang='eng' dir='ltr'><em>trueperi</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 686 540 763 564; x_wconf 89' lang='eng' dir='ltr'><em>BCHT</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 773 539 934 569; x_wconf 90' lang='eng' dir='ltr'>(AJ404006)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 407 581 1128 613; baseline 0 -7"><span class='ocrx_word' id='word_1_75' title='bbox 407 583 640 606; x_wconf 85' lang='eng' dir='ltr'><em>Thiorhodococcus</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 650 583 872 613; x_wconf 82' lang='eng' dir='ltr'><em>mannito/iphagus</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 882 581 945 606; x_wconf 89' lang='eng' dir='ltr'><em>WST</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 955 581 1019 610; x_wconf 94' lang='eng' dir='ltr'><em>(FM1</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1029 581 1128 611; x_wconf 88' lang='eng'>78272)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 407 622 1055 652; baseline 0 -4"><span class='ocrx_word' id='word_1_80' title='bbox 407 625 640 648; x_wconf 87' lang='eng' dir='ltr'><em>Thiorhodococcus</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 650 625 727 648; x_wconf 85' lang='eng' dir='ltr'><em>minor</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 736 625 801 648; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 815 626 823 648; x_wconf 92' lang='eng'>1</span> <span class='ocrx_word' id='word_1_84' title='bbox 834 626 879 648; x_wconf 90' lang='eng'>151</span> <span class='ocrx_word' id='word_1_85' title='bbox 887 624 914 648; x_wconf 88' lang='eng' dir='ltr'><em>BT</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 924 623 964 652; x_wconf 95' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 975 622 1055 652; x_wconf 90' lang='eng'>1316)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 388 664 1079 694; baseline 0 -4"><span class='ocrx_word' id='word_1_88' title='bbox 388 667 620 690; x_wconf 83' lang='eng' dir='ltr'><em>Thiorhodococcus</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 631 666 893 690; x_wconf 77' lang='eng' dir='ltr'><em>bheemlic:usJA132T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 903 664 1079 694; x_wconf 91' lang='eng' dir='ltr'>(AM282559)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 385 706 1095 736; baseline -0.001 -4"><span class='ocrx_word' id='word_1_91' title='bbox 385 709 617 732; x_wconf 85' lang='eng' dir='ltr'><em>Thiorhodococcus</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 628 709 726 732; x_wconf 90' lang='eng' dir='ltr'><em>drewsii</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 735 708 800 732; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 814 707 913 731; x_wconf 81' lang='eng' dir='ltr'><em>15006T</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 923 706 986 736; x_wconf 94' lang='eng' dir='ltr'><em>(FM1</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 996 706 1095 736; x_wconf 85' lang='eng'>78273)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 407 748 1117 778; baseline -0.001 -4"><span class='ocrx_word' id='word_1_97' title='bbox 407 751 640 774; x_wconf 86' lang='eng' dir='ltr'><em>Thiorhodococcus</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 650 751 824 774; x_wconf 84' lang='eng' dir='ltr'><em>kakinadensis</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 833 749 931 774; x_wconf 92' lang='eng' dir='ltr'><em>JA13OT</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 941 748 1117 778; x_wconf 85' lang='eng' dir='ltr'>(AM282561)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 367 790 1015 822">
+     <span class='ocr_line' id='line_1_20' title="bbox 367 790 1015 822; baseline 0 -7"><span class='ocrx_word' id='word_1_101' title='bbox 367 805 381 822; x_wconf 78' lang='eng' dir='ltr'><strong><em>o</em></strong></span> <span class='ocrx_word' id='word_1_102' title='bbox 405 793 622 815; x_wconf 83' lang='eng' dir='ltr'><em>Marichromatium</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 632 793 721 822; x_wconf 84' lang='eng' dir='ltr'><em>gracile</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 733 792 798 815; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 811 791 874 815; x_wconf 89' lang='eng' dir='ltr'><em>203T</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 884 790 1015 820; x_wconf 86' lang='eng' dir='ltr'>(X93473)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 248 832 1243 1490">
+     <span class='ocr_line' id='line_1_21' title="bbox 362 832 1132 864; baseline 0 -7"><span class='ocrx_word' id='word_1_107' title='bbox 362 840 377 857; x_wconf 78' lang='eng' dir='ltr'><strong>o</strong></span> <span class='ocrx_word' id='word_1_108' title='bbox 408 834 625 857; x_wconf 81' lang='eng' dir='ltr'><em>Marichromatium</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 634 837 789 864; x_wconf 87' lang='eng' dir='ltr'><em>purpuratum</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 801 834 866 857; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 880 835 888 857; x_wconf 95' lang='eng'>1</span> <span class='ocrx_word' id='word_1_112' title='bbox 897 833 961 857; x_wconf 87' lang='eng' dir='ltr'><em>591T</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 971 832 1132 862; x_wconf 87' lang='eng' dir='ltr'>(AJ224439)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 405 874 1017 904; baseline 0 -5"><span class='ocrx_word' id='word_1_114' title='bbox 405 876 623 899; x_wconf 85' lang='eng' dir='ltr'><em>Marichromatium</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 633 876 739 899; x_wconf 79' lang='eng' dir='ltr'><em>ind/cum</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 749 875 847 899; x_wconf 88' lang='eng' dir='ltr'><em>JA100T</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 856 874 1017 904; x_wconf 86' lang='eng' dir='ltr'>(AJ543328)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 411 916 1096 946; baseline 0 -5"><span class='ocrx_word' id='word_1_118' title='bbox 411 918 628 941; x_wconf 80' lang='eng' dir='ltr'><em>Mar/chromatium</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 638 918 803 941; x_wconf 81' lang='eng' dir='ltr'><em>bheem/icum</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 812 918 856 941; x_wconf 87' lang='eng' dir='ltr'>JA1</span> <span class='ocrx_word' id='word_1_121' title='bbox 866 917 910 941; x_wconf 88' lang='eng' dir='ltr'><em>24T</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 920 916 1096 946; x_wconf 89' lang='eng' dir='ltr'>(AM180952)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 389 957 999 990; baseline 0 -7"><span class='ocrx_word' id='word_1_123' title='bbox 389 960 610 983; x_wconf 83' lang='eng' dir='ltr'><em>Ha/ochromatium</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 619 960 764 990; x_wconf 81' lang='eng' dir='ltr'><em>glycol/cum</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 776 959 858 983; x_wconf 88' lang='eng' dir='ltr'><em>6340T</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 868 957 999 988; x_wconf 90' lang='eng' dir='ltr'>(X93472)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 402 999 1009 1032; baseline 0 -7"><span class='ocrx_word' id='word_1_127' title='bbox 402 1002 624 1025; x_wconf 83' lang='eng' dir='ltr'><em>Ha/ochromatium</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 635 1002 775 1032; x_wconf 81' lang='eng' dir='ltr'><em>sa/eXigens</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 786 1003 833 1025; x_wconf 88' lang='eng'><em>631</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 842 1000 868 1025; x_wconf 88' lang='eng' dir='ltr'><em>OT</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 878 999 1009 1029; x_wconf 87' lang='eng' dir='ltr'>(X98597)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 378 1041 1001 1071; baseline -0.002 -4"><span class='ocrx_word' id='word_1_132' title='bbox 378 1044 599 1067; x_wconf 82' lang='eng' dir='ltr'><em>Halochromatium</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 610 1051 709 1067; x_wconf 88' lang='eng' dir='ltr'><em>roseum</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 719 1042 816 1067; x_wconf 92' lang='eng' dir='ltr'><em>JA134T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 826 1041 1001 1071; x_wconf 90' lang='eng' dir='ltr'>(AM283535)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 355 1083 975 1125; baseline 0 -17"><span class='ocrx_word' id='word_1_136' title='bbox 355 1086 576 1125; x_wconf 48' lang='eng' dir='ltr'><em>Mghiohalocapsa</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 587 1086 686 1108; x_wconf 83' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 697 1084 793 1109; x_wconf 84' lang='eng' dir='ltr'><em>JA142T</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 803 1083 975 1113; x_wconf 86' lang='eng' dir='ltr'>(AM491592)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 382 1125 1049 1157; baseline 0 -7"><span class='ocrx_word' id='word_1_140' title='bbox 382 1127 574 1157; x_wconf 83' lang='eng' dir='ltr'><em>Thiohalocapsa</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 585 1127 705 1157; x_wconf 82' lang='eng' dir='ltr'><em>halophi/a</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 717 1127 782 1150; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 794 1126 877 1150; x_wconf 81' lang='eng' dir='ltr'><em>6210T</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 887 1125 1049 1155; x_wconf 87' lang='eng' dir='ltr'>(AJ002796)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 399 1167 969 1199; baseline 0 -7"><span class='ocrx_word' id='word_1_145' title='bbox 399 1169 552 1192; x_wconf 79' lang='eng' dir='ltr'><em>Thiococcus</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 561 1169 678 1199; x_wconf 79' lang='eng' dir='ltr'><em>pfennigii</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 687 1169 752 1192; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 765 1168 828 1192; x_wconf 90' lang='eng' dir='ltr'><em>226T</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 838 1167 969 1197; x_wconf 89' lang='eng' dir='ltr'>(Y12373)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 402 1209 979 1239; baseline 0 -5"><span class='ocrx_word' id='word_1_150' title='bbox 402 1211 608 1234; x_wconf 83' lang='eng' dir='ltr'><em>Thiof/avicoccus</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 618 1211 714 1234; x_wconf 81' lang='eng' dir='ltr'><em>mobi/is</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 724 1210 807 1234; x_wconf 80' lang='eng' dir='ltr'><em>8321T</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 817 1209 979 1239; x_wconf 89' lang='eng' dir='ltr'>(AJ010126)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 501 1250 1100 1281; baseline 0 -5"><span class='ocrx_word' id='word_1_154' title='bbox 501 1253 722 1276; x_wconf 84' lang='eng' dir='ltr'><em>Thioa/ka/icoccus</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 733 1253 853 1276; x_wconf 83' lang='eng' dir='ltr'><em>limnaeus</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 862 1252 929 1276; x_wconf 90' lang='eng' dir='ltr'><em>A26T</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 939 1250 1100 1281; x_wconf 91' lang='eng' dir='ltr'>(AJ277023)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 424 1292 1128 1322; baseline 0 -4"><span class='ocrx_word' id='word_1_158' title='bbox 424 1295 689 1318; x_wconf 80' lang='eng' dir='ltr'><em>Rhabdochromatium</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 700 1295 815 1318; x_wconf 84' lang='eng' dir='ltr'><em>marinum</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 827 1295 892 1318; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 904 1293 987 1318; x_wconf 90' lang='eng' dir='ltr'><em>5261T</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 997 1292 1128 1322; x_wconf 88' lang='eng' dir='ltr'>(X84316)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 388 1334 1096 1367; baseline 0 -8"><span class='ocrx_word' id='word_1_163' title='bbox 388 1337 596 1360; x_wconf 87' lang='eng' dir='ltr'><em>Thiorhodovibrio</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 609 1337 787 1367; x_wconf 88' lang='eng' dir='ltr'><em>Winogradskyi</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 795 1336 861 1360; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 873 1335 955 1359; x_wconf 83' lang='eng' dir='ltr'><em>6702T</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 965 1334 1005 1364; x_wconf 95' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 1015 1334 1096 1364; x_wconf 88' lang='eng'>2368)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 479 1376 1243 1408; baseline -0.001 -6"><span class='ocrx_word' id='word_1_169' title='bbox 479 1379 734 1408; x_wconf 79' lang='eng' dir='ltr'><em>Ectothiorhodospira</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 744 1379 946 1408; x_wconf 85' lang='eng' dir='ltr'><em>shaposhnikovii</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 955 1378 1020 1402; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 1033 1377 1096 1401; x_wconf 88' lang='eng' dir='ltr'><em>243T</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 1106 1376 1189 1406; x_wconf 87' lang='eng' dir='ltr'>(M591</span> <span class='ocrx_word' id='word_1_174' title='bbox 1198 1376 1243 1406; x_wconf 87' lang='eng'><em>51)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 576 1418 1135 1450; baseline 0 -7"><span class='ocrx_word' id='word_1_175' title='bbox 576 1421 782 1450; x_wconf 85' lang='eng' dir='ltr'><em>Ha/orhodospira</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 793 1421 913 1450; x_wconf 85' lang='eng' dir='ltr'><em>ha/ophila</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 924 1419 988 1443; x_wconf 84' lang='eng' dir='ltr'><em>SL1T</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 998 1418 1135 1448; x_wconf 87' lang='eng' dir='ltr'>(M26630)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 248 1460 808 1490; baseline 0 -5"><span class='ocrx_word' id='word_1_179' title='bbox 248 1462 404 1485; x_wconf 82' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 416 1462 464 1485; x_wconf 84' lang='eng' dir='ltr'><em>co/i</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 471 1462 560 1485; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 576 1461 668 1485; x_wconf 92' lang='eng' dir='ltr'><em>11775T</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 678 1460 808 1490; x_wconf 91' lang='eng' dir='ltr'>(X80725)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 49 566 1479">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 0 49 566 1479">
+     <span class='ocr_line' id='line_1_37' title="bbox 327 49 406 82; baseline 0 1411"><span class='ocrx_word' id='word_1_184' title='bbox 327 49 406 82; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 327 82 439 123; baseline 0 1370"><span class='ocrx_word' id='word_1_185' title='bbox 327 82 439 123; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 308 123 492 207; baseline 0 -39"><span class='ocrx_word' id='word_1_186' title='bbox 308 123 492 207; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 308 207 453 252; baseline 0 1241"><span class='ocrx_word' id='word_1_187' title='bbox 308 207 453 252; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 308 252 450 294; baseline 0 1199"><span class='ocrx_word' id='word_1_188' title='bbox 308 252 450 294; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 286 294 475 355; baseline 0 -19"><span class='ocrx_word' id='word_1_189' title='bbox 286 294 475 355; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 286 355 440 419; baseline 0 -45"><span class='ocrx_word' id='word_1_190' title='bbox 286 355 440 419; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 286 419 434 461; baseline 0 1032"><span class='ocrx_word' id='word_1_191' title='bbox 286 419 434 461; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 287 461 505 523; baseline 0 0"><span class='ocrx_word' id='word_1_192' title='bbox 287 461 505 523; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 275 523 443 565; baseline 0 -20"><span class='ocrx_word' id='word_1_193' title='bbox 275 523 443 565; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 275 565 407 649; baseline 0 -20"><span class='ocrx_word' id='word_1_194' title='bbox 275 565 407 649; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 275 649 388 709; baseline 0 -42"><span class='ocrx_word' id='word_1_195' title='bbox 275 649 388 709; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 275 709 395 793; baseline 0 -19"><span class='ocrx_word' id='word_1_196' title='bbox 275 709 395 793; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 275 793 313 838; baseline 0 655"><span class='ocrx_word' id='word_1_197' title='bbox 275 793 313 838; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 275 838 362 880; baseline 0 613"><span class='ocrx_word' id='word_1_198' title='bbox 275 838 362 880; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 234 880 400 961; baseline 0 -20"><span class='ocrx_word' id='word_1_199' title='bbox 234 880 400 961; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 234 961 392 1026; baseline 0 0"><span class='ocrx_word' id='word_1_200' title='bbox 234 961 392 1026; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 234 1026 378 1062; baseline 0 0"><span class='ocrx_word' id='word_1_201' title='bbox 234 1026 378 1062; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 234 1062 355 1086; baseline 0 407"><span class='ocrx_word' id='word_1_202' title='bbox 234 1062 355 1086; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 234 1086 382 1173; baseline 0 0"><span class='ocrx_word' id='word_1_203' title='bbox 234 1086 382 1173; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 234 1173 390 1215; baseline 0 278"><span class='ocrx_word' id='word_1_204' title='bbox 234 1173 390 1215; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 234 1215 489 1296; baseline 0 -42"><span class='ocrx_word' id='word_1_205' title='bbox 234 1215 489 1296; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 0 1296 415 1337; baseline 0 -19"><span class='ocrx_word' id='word_1_206' title='bbox 0 1296 415 1337; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 0 1337 388 1383; baseline 0 110"><span class='ocrx_word' id='word_1_207' title='bbox 0 1337 388 1383; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 0 1383 479 1424; baseline 0 69"><span class='ocrx_word' id='word_1_208' title='bbox 0 1383 479 1424; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 0 1424 566 1479; baseline 0 -34"><span class='ocrx_word' id='word_1_209' title='bbox 0 1424 566 1479; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003061-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003061-0-000.pbm.png
new file mode 100644
index 00000000..654bf000
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003061-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003061-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003061-0-000.pbm.png.hocr
new file mode 100644
index 00000000..11a604ef
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003061-0-000.pbm.png.hocr
@@ -0,0 +1,240 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003061-0-000.pbm.png"; bbox 0 0 1539 1104; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 605 2 1263 221">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 605 2 1263 221">
+     <span class='ocr_line' id='line_1_1' title="bbox 625 2 1263 32; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 625 4 779 26; x_wconf 83' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 784 4 950 32; x_wconf 81' lang='eng' dir='ltr'><em>panaciterrae</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 960 4 1024 26; x_wconf 89' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 1036 2 1097 26; x_wconf 91' lang='eng' dir='ltr'><em>042T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 1108 4 1263 32; x_wconf 81' lang='eng' dir='ltr'>(ABZ45368)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 623 40 1236 70; baseline 0 -6"><span class='ocrx_word' id='word_1_6' title='bbox 623 42 776 64; x_wconf 83' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 783 42 913 70; x_wconf 89' lang='eng' dir='ltr'><em>heparinus</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 924 42 986 64; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 997 40 1075 64; x_wconf 82' lang='eng' dir='ltr'><em>2366T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 1085 42 1236 70; x_wconf 89' lang='eng' dir='ltr'><em>(AJ438172)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 620 77 1238 108; baseline -0.002 -6"><span class='ocrx_word' id='word_1_11' title='bbox 620 80 774 102; x_wconf 84' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 781 79 901 102; x_wconf 83' lang='eng' dir='ltr'><em>africanus</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 911 79 973 102; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 987 77 1079 102; x_wconf 81' lang='eng' dir='ltr'><em>12126T</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1087 79 1238 108; x_wconf 82' lang='eng' dir='ltr'><em>(AJ438171)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 613 118 1179 148; baseline -0.002 -5"><span class='ocrx_word' id='word_1_16' title='bbox 613 121 766 143; x_wconf 82' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 774 121 845 143; x_wconf 82' lang='eng' dir='ltr'><em>caeni</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 853 120 915 143; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 926 118 1020 143; x_wconf 81' lang='eng' dir='ltr'><em>22862T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1028 120 1179 148; x_wconf 87' lang='eng' dir='ltr'><em>(AJ786798)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 605 153 1233 183; baseline 0 -6"><span class='ocrx_word' id='word_1_21' title='bbox 605 155 758 177; x_wconf 83' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 765 155 921 183; x_wconf 86' lang='eng' dir='ltr'><em>ginsengisoli</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 930 155 994 177; x_wconf 88' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 1008 153 1067 177; x_wconf 93' lang='eng' dir='ltr'><em>104T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1077 155 1233 183; x_wconf 91' lang='eng' dir='ltr'><em>(AB245371)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 651 191 1175 221; baseline 0 -6"><span class='ocrx_word' id='word_1_26' title='bbox 651 193 805 215; x_wconf 84' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 811 193 904 215; x_wconf 89' lang='eng' dir='ltr'><em>insulae</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 916 191 1010 215; x_wconf 82' lang='eng' dir='ltr'><em>DS—39T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1021 193 1175 221; x_wconf 86' lang='eng' dir='ltr'>(EF100697)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 580 229 1285 298">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 580 229 1285 298">
+     <span class='ocr_line' id='line_1_7' title="bbox 580 229 1285 265; baseline 0 -6"><span class='ocrx_word' id='word_1_30' title='bbox 580 229 621 249; x_wconf 69' lang='eng'>100</span> <span class='ocrx_word' id='word_1_31' title='bbox 642 237 880 265; x_wconf 84' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 890 237 1042 259; x_wconf 77' lang='eng' dir='ltr'><em>antarcticum</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 1052 237 1123 259; x_wconf 90' lang='eng' dir='ltr'>6B1Y</span> <span class='ocrx_word' id='word_1_34' title='bbox 1134 237 1285 265; x_wconf 89' lang='eng' dir='ltr'><em>(AJ576248)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 640 268 1238 298; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 640 270 793 292; x_wconf 82' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 799 270 900 298; x_wconf 87' lang='eng' dir='ltr'><em>piscium</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 911 270 974 292; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 987 268 1079 292; x_wconf 82' lang='eng' dir='ltr'><em>11725T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1087 270 1238 298; x_wconf 87' lang='eng' dir='ltr'><em>(AJ438174)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 516 304 1308 568">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 516 304 1308 568">
+     <span class='ocr_line' id='line_1_9' title="bbox 516 304 1265 334; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 516 313 543 332; x_wconf 82' lang='eng'>99</span> <span class='ocrx_word' id='word_1_41' title='bbox 625 307 779 329; x_wconf 83' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 786 307 925 334; x_wconf 86' lang='eng' dir='ltr'><em>cryoconitis</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 936 306 998 329; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1012 304 1104 329; x_wconf 83' lang='eng' dir='ltr'><em>14825T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1114 306 1265 334; x_wconf 88' lang='eng' dir='ltr'>(AJ438170)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 553 344 1273 374; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 553 348 581 368; x_wconf 87' lang='eng'>98</span> <span class='ocrx_word' id='word_1_47' title='bbox 654 346 808 368; x_wconf 86' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 815 346 986 374; x_wconf 87' lang='eng' dir='ltr'><em>hima/ayensis</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 997 346 1056 368; x_wconf 89' lang='eng' dir='ltr'><em>HHS</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1067 344 1112 368; x_wconf 91' lang='eng' dir='ltr'><em>22T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 1122 346 1273 374; x_wconf 87' lang='eng' dir='ltr'><em>(AJ583425)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 664 381 1216 412; baseline 0 -6"><span class='ocrx_word' id='word_1_52' title='bbox 664 384 817 406; x_wconf 78' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 824 384 932 411; x_wconf 76' lang='eng' dir='ltr'><em>aquatilis</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 940 381 1044 406; x_wconf 92' lang='eng' dir='ltr'><em>AR107T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 1054 384 1216 412; x_wconf 86' lang='eng' dir='ltr'><em>(AM114396)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 647 421 1213 451; baseline 0 -6"><span class='ocrx_word' id='word_1_56' title='bbox 647 423 801 445; x_wconf 88' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 808 429 896 445; x_wconf 86' lang='eng' dir='ltr'><em>roseus</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 906 421 1041 445; x_wconf 89' lang='eng' dir='ltr'><em>CL—GP80T</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 1052 423 1116 451; x_wconf 83' lang='eng' dir='ltr'><em>(DQ1</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 1125 423 1213 451; x_wconf 85' lang='eng'><em>12353)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 528 435 1271 514; baseline 0 -31"><span class='ocrx_word' id='word_1_61' title='bbox 528 435 841 514; x_wconf 42' lang='eng' dir='ltr'><em>ELEPedobacter</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 848 461 1003 483; x_wconf 87' lang='eng' dir='ltr'><em>suwonensis</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 1014 459 1100 483; x_wconf 81' lang='eng' dir='ltr'><em>15—52T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1111 461 1271 489; x_wconf 82' lang='eng' dir='ltr'>(DQOQ7274)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 573 498 1308 529; baseline -0.001 -6"><span class='ocrx_word' id='word_1_65' title='bbox 573 501 600 520; x_wconf 84' lang='eng'><em>68</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 695 501 848 523; x_wconf 85' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 855 501 1031 523; x_wconf 87' lang='eng' dir='ltr'><em>sandarakinus</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1042 498 1137 523; x_wconf 90' lang='eng' dir='ltr'><em>DS—27T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1147 500 1308 529; x_wconf 87' lang='eng' dir='ltr'>(DQ235228)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 622 538 1215 568; baseline 0 -6"><span class='ocrx_word' id='word_1_70' title='bbox 622 540 786 562; x_wconf 86' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 794 540 927 568; x_wconf 89' lang='eng' dir='ltr'><em>composti</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 934 538 1045 562; x_wconf 90' lang='eng' dir='ltr'><em>TR6-06T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1055 540 1215 568; x_wconf 77' lang='eng' dir='ltr'>(A8267720)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 589 574 1144 642">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 589 574 1144 642">
+     <span class='ocr_line' id='line_1_16' title="bbox 589 574 1099 605; baseline 0 -7"><span class='ocrx_word' id='word_1_74' title='bbox 589 576 743 598; x_wconf 82' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 749 576 828 598; x_wconf 83' lang='eng' dir='ltr'><em>lentus</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 838 574 934 598; x_wconf 89' lang='eng' dir='ltr'><em>DS—40T</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 944 576 1099 605; x_wconf 81' lang='eng' dir='ltr'><em>(EF446146)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 608 612 1144 642; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 608 614 761 636; x_wconf 83' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 768 614 872 636; x_wconf 87' lang='eng' dir='ltr'><em>terrico/a</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 884 612 979 636; x_wconf 90' lang='eng' dir='ltr'><em>DS—45T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 989 614 1144 642; x_wconf 88' lang='eng' dir='ltr'><em>(EF446147)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 395 17 618 552">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 395 17 618 552">
+     <span class='ocr_line' id='line_1_18' title="bbox 465 17 618 211; baseline 0 -48"><span class='ocrx_word' id='word_1_82' title='bbox 465 17 618 211; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 395 211 521 396; baseline 0 -113"><span class='ocrx_word' id='word_1_83' title='bbox 395 211 521 396; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 395 396 528 552; baseline 0 552"><span class='ocrx_word' id='word_1_84' title='bbox 395 396 528 552; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 46 83 108 107">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 46 83 108 107">
+     <span class='ocr_line' id='line_1_21' title="bbox 46 83 108 107; baseline 0 0"><span class='ocrx_word' id='word_1_85' title='bbox 46 83 108 107; x_wconf 89' lang='eng'><em>0.02</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 515 207 517 303">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 515 207 517 303">
+     <span class='ocr_line' id='line_1_22' title="bbox 515 207 517 303; baseline 0 801"><span class='ocrx_word' id='word_1_86' title='bbox 515 207 517 303; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 365 394 393 414">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 365 394 393 414">
+     <span class='ocr_line' id='line_1_23' title="bbox 365 394 393 414; baseline 0 0"><span class='ocrx_word' id='word_1_87' title='bbox 365 394 393 414; x_wconf 88' lang='eng'>66</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 368 431 528 433">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 368 431 528 433">
+     <span class='ocr_line' id='line_1_24' title="bbox 368 431 528 433; baseline 0 671"><span class='ocrx_word' id='word_1_88' title='bbox 368 431 528 433; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 526 398 528 467">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 526 398 528 467">
+     <span class='ocr_line' id='line_1_25' title="bbox 526 398 528 467; baseline 0 637"><span class='ocrx_word' id='word_1_89' title='bbox 526 398 528 467; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 332 494 359 514">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 332 494 359 514">
+     <span class='ocr_line' id='line_1_26' title="bbox 332 494 359 514; baseline 0.037 -1"><span class='ocrx_word' id='word_1_90' title='bbox 332 494 359 514; x_wconf 89' lang='eng'><em>74</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 491 587 582 590">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 491 587 582 590">
+     <span class='ocr_line' id='line_1_27' title="bbox 491 587 582 590; baseline 0 514"><span class='ocrx_word' id='word_1_91' title='bbox 491 587 582 590; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 368 431 370 608">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 368 431 370 608">
+     <span class='ocr_line' id='line_1_28' title="bbox 368 431 370 608; baseline 0 496"><span class='ocrx_word' id='word_1_92' title='bbox 368 431 370 608; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 368 606 492 608">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 368 606 492 608">
+     <span class='ocr_line' id='line_1_29' title="bbox 368 606 492 608; baseline 0 496"><span class='ocrx_word' id='word_1_93' title='bbox 368 606 492 608; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 490 588 492 628">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 490 588 492 628">
+     <span class='ocr_line' id='line_1_30' title="bbox 490 588 492 628; baseline 0 476"><span class='ocrx_word' id='word_1_94' title='bbox 490 588 492 628; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 492 626 605 628">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 492 626 605 628">
+     <span class='ocr_line' id='line_1_31' title="bbox 492 626 605 628; baseline 0 476"><span class='ocrx_word' id='word_1_95' title='bbox 492 626 605 628; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 436 615 477 635">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 436 615 477 635">
+     <span class='ocr_line' id='line_1_32' title="bbox 436 615 477 635; baseline 0 0"><span class='ocrx_word' id='word_1_96' title='bbox 436 615 477 635; x_wconf 91' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 2 633 302 635">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 2 633 302 635">
+     <span class='ocr_line' id='line_1_33' title="bbox 2 633 302 635; baseline 0 469"><span class='ocrx_word' id='word_1_97' title='bbox 2 633 302 635; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 2 633 4 1085">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 2 633 4 1085">
+     <span class='ocr_line' id='line_1_34' title="bbox 2 633 4 1085; baseline 0 19"><span class='ocrx_word' id='word_1_98' title='bbox 2 633 4 1085; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 349 649 1534 1058">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 446 649 1534 793">
+     <span class='ocr_line' id='line_1_35' title="bbox 608 649 1201 680; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 608 652 761 674; x_wconf 82' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 768 652 861 674; x_wconf 82' lang='eng' dir='ltr'><em>saltans</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 872 652 935 674; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 948 649 1040 674; x_wconf 91' lang='eng' dir='ltr'><em>12145T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 1050 652 1201 680; x_wconf 87' lang='eng' dir='ltr'><em>(AJ438173)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 506 687 1438 718; baseline 0 -7"><span class='ocrx_word' id='word_1_104' title='bbox 506 694 534 713; x_wconf 87' lang='eng'>83</span> <span class='ocrx_word' id='word_1_105' title='bbox 918 689 1059 712; x_wconf 89' lang='eng' dir='ltr'><em>Olivibacter</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 1066 690 1171 712; x_wconf 84' lang='eng' dir='ltr'><em>sitiensis</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 1179 687 1267 712; x_wconf 89' lang='eng' dir='ltr'><em>AW-6T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1277 689 1438 718; x_wconf 85' lang='eng' dir='ltr'><em>(DQ421387)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 446 702 1392 755; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 446 725 474 745; x_wconf 85' lang='eng'><em>93</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 485 702 994 755; x_wconf 53' lang='eng' dir='ltr'><em>mbacmr</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 1001 727 1128 749; x_wconf 85' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 1137 725 1220 755; x_wconf 81' lang='eng' dir='ltr'><em>Jip14T</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 1230 727 1392 755; x_wconf 78' lang='eng' dir='ltr'><em>(D0680836)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 485 751 1534 793; baseline 0 -6"><span class='ocrx_word' id='word_1_114' title='bbox 485 751 1068 793; x_wconf 82' lang='eng' dir='ltr'><em>|—Pseudosphingobacterium</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1079 765 1238 787; x_wconf 84' lang='eng' dir='ltr'><em>domesticum</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 1249 763 1363 787; x_wconf 83' lang='eng' dir='ltr'><em>DC—186T</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1373 765 1534 793; x_wconf 92' lang='eng' dir='ltr'>(AM407725)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 349 799 1405 1047">
+     <span class='ocr_line' id='line_1_39' title="bbox 533 799 1380 830; baseline 0 -7"><span class='ocrx_word' id='word_1_118' title='bbox 533 810 574 830; x_wconf 73' lang='eng'>100</span> <span class='ocrx_word' id='word_1_119' title='bbox 679 801 916 829; x_wconf 81' lang='eng' dir='ltr'><em>Sphingobacter/um</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 927 801 1095 829; x_wconf 87' lang='eng' dir='ltr'><em>daejeonense</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 1105 799 1216 823; x_wconf 90' lang='eng' dir='ltr'><em>TR6—04T</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 1224 801 1380 829; x_wconf 87' lang='eng' dir='ltr'><em>(AB249372)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 349 836 1366 866; baseline 0.001 -7"><span class='ocrx_word' id='word_1_123' title='bbox 349 845 376 864; x_wconf 80' lang='eng'><em>97</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 473 840 500 859; x_wconf 85' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 681 838 918 866; x_wconf 86' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 928 839 1030 861; x_wconf 87' lang='eng' dir='ltr'><em>mizutaii</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 1039 838 1102 861; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 1115 836 1366 866; x_wconf 78' lang='eng' dir='ltr'><em>11724T(AJ438175)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 684 876 1310 907; baseline -0.002 -6"><span class='ocrx_word' id='word_1_129' title='bbox 684 878 921 907; x_wconf 84' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 931 878 1051 906; x_wconf 80' lang='eng' dir='ltr'><em>composti</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 1058 876 1145 900; x_wconf 91' lang='eng' dir='ltr'><em>4M24T</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 1155 878 1310 907; x_wconf 89' lang='eng' dir='ltr'><em>(EF122436)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 681 916 1389 944; baseline 0 -6"><span class='ocrx_word' id='word_1_133' title='bbox 681 916 919 944; x_wconf 84' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 929 916 1080 944; x_wconf 84' lang='eng' dir='ltr'><em>spiritivorum</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 1091 916 1154 938; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 1165 916 1229 938; x_wconf 90' lang='eng'>2582</span> <span class='ocrx_word' id='word_1_137' title='bbox 1238 916 1389 944; x_wconf 88' lang='eng' dir='ltr'><em>(AJ459411)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 687 952 1377 982; baseline 0 -6"><span class='ocrx_word' id='word_1_138' title='bbox 687 954 925 982; x_wconf 85' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 935 954 1037 976; x_wconf 86' lang='eng' dir='ltr'><em>faecium</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 1048 954 1111 976; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 1124 952 1216 976; x_wconf 79' lang='eng' dir='ltr'><em>11690T</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 1226 954 1377 982; x_wconf 86' lang='eng' dir='ltr'><em>(AJ438176)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 401 969 1405 1047; baseline 0 -33"><span class='ocrx_word' id='word_1_143' title='bbox 401 979 425 999; x_wconf 63' lang='eng'><em>71</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 440 969 888 1047; x_wconf 47' lang='eng' dir='ltr'><em>@hiﬂgobacterium</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 898 992 1065 1020; x_wconf 86' lang='eng' dir='ltr'><em>thalpophilum</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 1076 992 1139 1014; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 1152 990 1244 1014; x_wconf 80' lang='eng' dir='ltr'><em>11723T</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 1254 992 1405 1020; x_wconf 87' lang='eng' dir='ltr'><em>(AJ438177)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 513 1027 1390 1058">
+     <span class='ocr_line' id='line_1_45' title="bbox 513 1027 1390 1058; baseline -0.001 -6"><span class='ocrx_word' id='word_1_149' title='bbox 513 1036 540 1056; x_wconf 82' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 665 1029 903 1057; x_wconf 85' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 913 1030 1057 1052; x_wconf 85' lang='eng' dir='ltr'><em>multivorum</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 1069 1030 1118 1051; x_wconf 94' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 1131 1027 1223 1052; x_wconf 89' lang='eng' dir='ltr'><em>14316T</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 1233 1029 1390 1058; x_wconf 87' lang='eng' dir='ltr'>(AB100738)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 916 1067 1495 1097">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 916 1067 1495 1097">
+     <span class='ocr_line' id='line_1_46' title="bbox 916 1067 1495 1097; baseline 0 -6"><span class='ocrx_word' id='word_1_155' title='bbox 916 1069 1072 1091; x_wconf 82' lang='eng' dir='ltr'><em>Bacteroides</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 1082 1069 1167 1097; x_wconf 87' lang='eng' dir='ltr'><em>fragilis</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 1178 1069 1240 1091; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 1251 1067 1329 1091; x_wconf 89' lang='eng' dir='ltr'><em>2151T</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 1339 1069 1495 1097; x_wconf 81' lang='eng' dir='ltr'>(A8050106)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 300 521 302 749">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 300 521 302 749">
+     <span class='ocr_line' id='line_1_47' title="bbox 300 521 302 749; baseline 0 355"><span class='ocrx_word' id='word_1_160' title='bbox 300 521 302 749; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 301 747 487 751">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 301 747 487 751">
+     <span class='ocr_line' id='line_1_48' title="bbox 301 747 487 751; baseline 0 353"><span class='ocrx_word' id='word_1_161' title='bbox 301 747 487 751; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 316 667 318 834">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 316 667 318 834">
+     <span class='ocr_line' id='line_1_49' title="bbox 316 667 318 834; baseline 0 270"><span class='ocrx_word' id='word_1_162' title='bbox 316 667 318 834; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 316 832 392 834">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 316 832 392 834">
+     <span class='ocr_line' id='line_1_50' title="bbox 316 832 392 834; baseline 0 270"><span class='ocrx_word' id='word_1_163' title='bbox 316 832 392 834; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 390 749 392 915">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 390 749 392 915">
+     <span class='ocr_line' id='line_1_51' title="bbox 390 749 392 915; baseline 0 189"><span class='ocrx_word' id='word_1_164' title='bbox 390 749 392 915; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 438 931 440 1000">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 438 931 440 1000">
+     <span class='ocr_line' id='line_1_52' title="bbox 438 931 440 1000; baseline 0 104"><span class='ocrx_word' id='word_1_165' title='bbox 438 931 440 1000; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 2 1083 907 1085">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 2 1083 907 1085">
+     <span class='ocr_line' id='line_1_53' title="bbox 2 1083 907 1085; baseline 0 19"><span class='ocrx_word' id='word_1_166' title='bbox 2 1083 907 1085; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-000.pbm.png
new file mode 100644
index 00000000..a3cd7289
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-000.pbm.png.hocr
new file mode 100644
index 00000000..9b003787
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-000.pbm.png.hocr
@@ -0,0 +1,309 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003087-0-000.pbm.png"; bbox 0 0 1183 966; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 256 5 888 303">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 284 5 861 124">
+     <span class='ocr_line' id='line_1_1' title="bbox 361 5 861 34; baseline -0.002 -5"><span class='ocrx_word' id='word_1_1' title='bbox 361 7 433 29; x_wconf 84' lang='eng' dir='ltr'>Clone</span> <span class='ocrx_word' id='word_1_2' title='bbox 443 7 677 34; x_wconf 84' lang='eng' dir='ltr'>SWPT5_aaaO4e11</span> <span class='ocrx_word' id='word_1_3' title='bbox 692 8 700 15; x_wconf 78' lang='eng'><strong><em>*</em></strong></span> <span class='ocrx_word' id='word_1_4' title='bbox 710 5 861 33; x_wconf 84' lang='eng' dir='ltr'>(EF100091)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 295 46 849 87; baseline 0 -18"><span class='ocrx_word' id='word_1_5' title='bbox 295 72 331 87; x_wconf 68' lang='eng'>836</span> <span class='ocrx_word' id='word_1_6' title='bbox 366 48 438 69; x_wconf 86' lang='eng' dir='ltr'>Clone</span> <span class='ocrx_word' id='word_1_7' title='bbox 449 48 670 76; x_wconf 81' lang='eng' dir='ltr'>obob2_aaa03g05</span> <span class='ocrx_word' id='word_1_8' title='bbox 680 48 688 56; x_wconf 73' lang='eng'>*</span> <span class='ocrx_word' id='word_1_9' title='bbox 698 46 849 73; x_wconf 83' lang='eng' dir='ltr'>(EF096493)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 284 85 752 124; baseline 0 -14"><span class='ocrx_word' id='word_1_10' title='bbox 284 108 332 124; x_wconf 62' lang='eng'><strong>#661</strong></span> <span class='ocrx_word' id='word_1_11' title='bbox 347 98 355 100; x_wconf 76' lang='eng'>&#39;</span> <span class='ocrx_word' id='word_1_12' title='bbox 368 88 443 110; x_wconf 85' lang='eng' dir='ltr'>Strain</span> <span class='ocrx_word' id='word_1_13' title='bbox 455 88 498 110; x_wconf 71' lang='eng' dir='ltr'>M11</span> <span class='ocrx_word' id='word_1_14' title='bbox 507 88 554 110; x_wconf 69' lang='eng' dir='ltr'>BET</span> <span class='ocrx_word' id='word_1_15' title='bbox 563 85 752 114; x_wconf 61' lang='eng' dir='ltr'>&#39;(AM747811)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 256 126 759 156">
+     <span class='ocr_line' id='line_1_4' title="bbox 256 126 759 156; baseline -0.002 -6"><span class='ocrx_word' id='word_1_16' title='bbox 256 132 292 146; x_wconf 79' lang='eng'>999</span> <span class='ocrx_word' id='word_1_17' title='bbox 347 139 360 140; x_wconf 48' lang='eng'><em>’</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 374 128 446 150; x_wconf 82' lang='eng' dir='ltr'>Clone</span> <span class='ocrx_word' id='word_1_19' title='bbox 457 128 575 156; x_wconf 82' lang='eng' dir='ltr'>C16_E16</span> <span class='ocrx_word' id='word_1_20' title='bbox 586 129 594 137; x_wconf 56' lang='eng'><strong>*</strong></span> <span class='ocrx_word' id='word_1_21' title='bbox 605 126 759 154; x_wconf 75' lang='eng' dir='ltr'>(AYQQQQQO)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 338 169 888 198">
+     <span class='ocr_line' id='line_1_5' title="bbox 338 169 888 198; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 338 179 362 181; x_wconf 85' lang='eng'>—</span> <span class='ocrx_word' id='word_1_23' title='bbox 378 171 450 192; x_wconf 88' lang='eng' dir='ltr'>Clone</span> <span class='ocrx_word' id='word_1_24' title='bbox 460 171 708 198; x_wconf 81' lang='eng' dir='ltr'>SWPT12_aaaO4fO4</span> <span class='ocrx_word' id='word_1_25' title='bbox 718 171 726 179; x_wconf 77' lang='eng'>*</span> <span class='ocrx_word' id='word_1_26' title='bbox 737 169 888 197; x_wconf 86' lang='eng' dir='ltr'>(EF098044)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 296 208 772 303">
+     <span class='ocr_line' id='line_1_6' title="bbox 296 208 772 303; baseline 0 -72"><span class='ocrx_word' id='word_1_27' title='bbox 296 219 360 303; x_wconf 38' lang='eng'>#9:?</span> <span class='ocrx_word' id='word_1_28' title='bbox 374 210 446 231; x_wconf 84' lang='eng' dir='ltr'>Clone</span> <span class='ocrx_word' id='word_1_29' title='bbox 457 210 581 237; x_wconf 84' lang='eng' dir='ltr'>M3_f06_3</span> <span class='ocrx_word' id='word_1_30' title='bbox 592 210 600 219; x_wconf 79' lang='eng'><strong><em>*</em></strong></span> <span class='ocrx_word' id='word_1_31' title='bbox 611 208 772 235; x_wconf 83' lang='eng' dir='ltr'>(DOO15649)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 285 30 335 46">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 285 30 335 46">
+     <span class='ocr_line' id='line_1_7' title="bbox 285 30 335 46; baseline 0 0"><span class='ocrx_word' id='word_1_32' title='bbox 285 30 335 46; x_wconf 74' lang='eng'>#885</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 299 128 338 130">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 299 128 338 130">
+     <span class='ocr_line' id='line_1_8' title="bbox 299 128 338 130; baseline 0 836"><span class='ocrx_word' id='word_1_33' title='bbox 299 128 338 130; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 336 77 338 181">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 336 77 338 181">
+     <span class='ocr_line' id='line_1_9' title="bbox 336 77 338 181; baseline 0 785"><span class='ocrx_word' id='word_1_34' title='bbox 336 77 338 181; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 260 199 300 201">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 260 199 300 201">
+     <span class='ocr_line' id='line_1_10' title="bbox 260 199 300 201; baseline 0 765"><span class='ocrx_word' id='word_1_35' title='bbox 260 199 300 201; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 205 194 256 209">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 205 194 256 209">
+     <span class='ocr_line' id='line_1_11' title="bbox 205 194 256 209; baseline 0 0"><span class='ocrx_word' id='word_1_36' title='bbox 205 194 256 209; x_wconf 73' lang='eng'>#999</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 299 128 300 272">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 299 128 300 272">
+     <span class='ocr_line' id='line_1_12' title="bbox 299 128 300 272; baseline 0 694"><span class='ocrx_word' id='word_1_37' title='bbox 299 128 300 272; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 367 250 849 317">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 367 250 849 317">
+     <span class='ocr_line' id='line_1_13' title="bbox 371 250 849 279; baseline 0 -7"><span class='ocrx_word' id='word_1_38' title='bbox 371 251 443 273; x_wconf 88' lang='eng' dir='ltr'>Clone</span> <span class='ocrx_word' id='word_1_39' title='bbox 454 252 677 279; x_wconf 85' lang='eng' dir='ltr'>RL176_aah44cO5</span> <span class='ocrx_word' id='word_1_40' title='bbox 688 250 849 277; x_wconf 84' lang='eng' dir='ltr'>(DO793846)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 367 290 724 317; baseline 0 -4"><span class='ocrx_word' id='word_1_41' title='bbox 367 292 488 313; x_wconf 83' lang='eng' dir='ltr'>Bacterium</span> <span class='ocrx_word' id='word_1_42' title='bbox 501 292 533 313; x_wconf 89' lang='eng' dir='ltr'>B7</span> <span class='ocrx_word' id='word_1_43' title='bbox 544 292 552 300; x_wconf 78' lang='eng'><strong>*</strong></span> <span class='ocrx_word' id='word_1_44' title='bbox 562 290 724 317; x_wconf 86' lang='eng' dir='ltr'>(DO789120)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 214 331 903 425">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 214 331 903 416">
+     <span class='ocr_line' id='line_1_15' title="bbox 288 331 903 372; baseline -0.002 -17"><span class='ocrx_word' id='word_1_45' title='bbox 288 357 320 372; x_wconf 63' lang='eng' dir='ltr'>7B1</span> <span class='ocrx_word' id='word_1_46' title='bbox 346 334 561 355; x_wconf 78' lang='eng' dir='ltr'>Asaccharobacter</span> <span class='ocrx_word' id='word_1_47' title='bbox 568 334 656 355; x_wconf 80' lang='eng' dir='ltr'>ce/afus</span> <span class='ocrx_word' id='word_1_48' title='bbox 663 334 737 355; x_wconf 78' lang='eng' dir='ltr'>doOST</span> <span class='ocrx_word' id='word_1_49' title='bbox 747 331 854 359; x_wconf 79' lang='eng' dir='ltr'>(A82661</span> <span class='ocrx_word' id='word_1_50' title='bbox 862 331 903 359; x_wconf 85' lang='eng'>02)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 214 400 278 416; baseline 0 0"><span class='ocrx_word' id='word_1_51' title='bbox 214 400 278 416; x_wconf 74' lang='eng'>#1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 271 279 335 295">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 271 279 335 295">
+     <span class='ocr_line' id='line_1_17' title="bbox 271 279 335 295; baseline 0 0"><span class='ocrx_word' id='word_1_52' title='bbox 271 279 335 295; x_wconf 80' lang='eng'>#1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 190 296 262 298">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 190 296 262 298">
+     <span class='ocr_line' id='line_1_18' title="bbox 190 296 262 298; baseline 0 668"><span class='ocrx_word' id='word_1_53' title='bbox 190 296 262 298; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 120 291 184 307">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 120 291 184 307">
+     <span class='ocr_line' id='line_1_19' title="bbox 120 291 184 307; baseline 0 0"><span class='ocrx_word' id='word_1_54' title='bbox 120 291 184 307; x_wconf 78' lang='eng'>#1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 249 372 1180 888">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 249 372 1180 888">
+     <span class='ocr_line' id='line_1_20' title="bbox 347 372 958 402; baseline -0.002 -6"><span class='ocrx_word' id='word_1_55' title='bbox 347 375 509 396; x_wconf 73' lang='eng' dir='ltr'>Adlercreuz‘ZIla</span> <span class='ocrx_word' id='word_1_56' title='bbox 519 375 680 402; x_wconf 78' lang='eng' dir='ltr'>equalifac/ens</span> <span class='ocrx_word' id='word_1_57' title='bbox 688 375 710 396; x_wconf 91' lang='eng' dir='ltr'>FJ</span> <span class='ocrx_word' id='word_1_58' title='bbox 714 374 792 396; x_wconf 75' lang='eng' dir='ltr'>C—BQT</span> <span class='ocrx_word' id='word_1_59' title='bbox 801 372 958 400; x_wconf 78' lang='eng' dir='ltr'>(A8306661)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 356 412 1062 442; baseline -0.001 -6"><span class='ocrx_word' id='word_1_60' title='bbox 356 415 440 436; x_wconf 89' lang='eng' dir='ltr'>Human</span> <span class='ocrx_word' id='word_1_61' title='bbox 453 415 557 436; x_wconf 68' lang='eng' dir='ltr'>intestinal</span> <span class='ocrx_word' id='word_1_62' title='bbox 568 415 688 436; x_wconf 84' lang='eng' dir='ltr'>bacterium</span> <span class='ocrx_word' id='word_1_63' title='bbox 698 414 897 442; x_wconf 84' lang='eng' dir='ltr'>SNU—Julong732</span> <span class='ocrx_word' id='word_1_64' title='bbox 908 412 1062 440; x_wconf 88' lang='eng' dir='ltr'>(AY310748)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 359 454 935 483; baseline -0.002 -6"><span class='ocrx_word' id='word_1_65' title='bbox 359 456 498 483; x_wconf 63' lang='eng' dir='ltr'>Eggedhe/la</span> <span class='ocrx_word' id='word_1_66' title='bbox 506 456 565 477; x_wconf 74' lang='eng' dir='ltr'><em>lenfa</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 572 455 769 477; x_wconf 82' lang='eng' dir='ltr'>SECO—Mt75m2</span> <span class='ocrx_word' id='word_1_68' title='bbox 781 454 935 481; x_wconf 85' lang='eng' dir='ltr'>(AY937880)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 347 494 866 523; baseline 0 -6"><span class='ocrx_word' id='word_1_69' title='bbox 347 496 486 523; x_wconf 71' lang='eng' dir='ltr'>Eggertheﬂa</span> <span class='ocrx_word' id='word_1_70' title='bbox 495 496 593 517; x_wconf 52' lang='eng' dir='ltr'>s/nensﬂs</span> <span class='ocrx_word' id='word_1_71' title='bbox 602 496 702 517; x_wconf 70' lang='eng' dir='ltr'>HKU14T</span> <span class='ocrx_word' id='word_1_72' title='bbox 712 494 866 521; x_wconf 85' lang='eng' dir='ltr'>(AY321958)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 350 535 958 564; baseline -0.002 -6"><span class='ocrx_word' id='word_1_73' title='bbox 350 537 489 564; x_wconf 74' lang='eng' dir='ltr'>Eggerthe/la</span> <span class='ocrx_word' id='word_1_74' title='bbox 498 537 685 564; x_wconf 66' lang='eng' dir='ltr'>hongkongenS/Ls</span> <span class='ocrx_word' id='word_1_75' title='bbox 693 537 794 558; x_wconf 80' lang='eng' dir='ltr'>HKU1OT</span> <span class='ocrx_word' id='word_1_76' title='bbox 803 535 926 562; x_wconf 83' lang='eng' dir='ltr'>(AY28851</span> <span class='ocrx_word' id='word_1_77' title='bbox 936 535 958 562; x_wconf 92' lang='eng'>7)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 360 575 972 603; baseline 0 -5"><span class='ocrx_word' id='word_1_78' title='bbox 360 577 572 598; x_wconf 64' lang='eng' dir='ltr'>Den/Yrobacter/ijm</span> <span class='ocrx_word' id='word_1_79' title='bbox 580 577 726 598; x_wconf 69' lang='eng' dir='ltr'>detox/ﬁcans</span> <span class='ocrx_word' id='word_1_80' title='bbox 734 577 842 598; x_wconf 74' lang='eng' dir='ltr'>NPOH1T</span> <span class='ocrx_word' id='word_1_81' title='bbox 851 575 876 603; x_wconf 93' lang='eng' dir='ltr'>(U</span> <span class='ocrx_word' id='word_1_82' title='bbox 881 575 972 603; x_wconf 83' lang='eng'>43492)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 334 616 873 645; baseline 0 -6"><span class='ocrx_word' id='word_1_83' title='bbox 334 618 421 639; x_wconf 61' lang='eng' dir='ltr'>S/ac/(I&#39;a</span> <span class='ocrx_word' id='word_1_84' title='bbox 431 618 507 645; x_wconf 77' lang='eng' dir='ltr'><em>eX/gua</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 515 618 592 639; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_86' title='bbox 604 619 712 639; x_wconf 78' lang='eng' dir='ltr'>700122T</span> <span class='ocrx_word' id='word_1_87' title='bbox 722 616 873 643; x_wconf 86' lang='eng' dir='ltr'>(AF101240)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 372 655 1008 686; baseline 0 -7"><span class='ocrx_word' id='word_1_88' title='bbox 372 658 577 686; x_wconf 65' lang='eng' dir='ltr'>C/yptobacz‘er/ijm</span> <span class='ocrx_word' id='word_1_89' title='bbox 586 661 671 679; x_wconf 79' lang='eng' dir='ltr'><em>cum/m</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 679 658 738 679; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_91' title='bbox 752 659 826 679; x_wconf 89' lang='eng'>15641</span> <span class='ocrx_word' id='word_1_92' title='bbox 833 658 842 671; x_wconf 62' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_93' title='bbox 852 655 1008 683; x_wconf 86' lang='eng' dir='ltr'>(ABO19260)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 378 696 1006 724; baseline -0.002 -4"><span class='ocrx_word' id='word_1_94' title='bbox 378 698 502 720; x_wconf 66' lang='eng' dir='ltr'>Co/ﬂhse/la</span> <span class='ocrx_word' id='word_1_95' title='bbox 510 699 653 720; x_wconf 78' lang='eng' dir='ltr'>aerofac/ens</span> <span class='ocrx_word' id='word_1_96' title='bbox 659 698 737 720; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_97' title='bbox 748 699 840 719; x_wconf 78' lang='eng' dir='ltr'>25986T</span> <span class='ocrx_word' id='word_1_98' title='bbox 849 696 923 724; x_wconf 78' lang='eng' dir='ltr'>(A801</span> <span class='ocrx_word' id='word_1_99' title='bbox 933 696 1006 724; x_wconf 86' lang='eng'>1816)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 320 738 947 767; baseline 0 -6"><span class='ocrx_word' id='word_1_100' title='bbox 320 740 510 761; x_wconf 74' lang='eng' dir='ltr'>Cor/bbacter/um</span> <span class='ocrx_word' id='word_1_101' title='bbox 517 740 647 767; x_wconf 80' lang='eng' dir='ltr'>g/amerans</span> <span class='ocrx_word' id='word_1_102' title='bbox 655 740 714 761; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_103' title='bbox 726 741 818 761; x_wconf 79' lang='eng' dir='ltr'>20642T</span> <span class='ocrx_word' id='word_1_104' title='bbox 828 738 947 765; x_wconf 84' lang='eng' dir='ltr'>(X79048)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 351 779 898 808; baseline 0 -6"><span class='ocrx_word' id='word_1_105' title='bbox 351 781 487 808; x_wconf 80' lang='eng' dir='ltr'><em>Atapob/um</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 495 781 600 802; x_wconf 79' lang='eng' dir='ltr'>m/nutum</span> <span class='ocrx_word' id='word_1_107' title='bbox 608 781 683 802; x_wconf 91' lang='eng' dir='ltr'>NCFB</span> <span class='ocrx_word' id='word_1_108' title='bbox 695 781 770 802; x_wconf 84' lang='eng' dir='ltr'>2751T</span> <span class='ocrx_word' id='word_1_109' title='bbox 779 779 898 806; x_wconf 88' lang='eng' dir='ltr'>(X67148)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 249 819 746 847; baseline -0.002 -4"><span class='ocrx_word' id='word_1_110' title='bbox 249 821 362 843; x_wconf 78' lang='eng' dir='ltr'>O/sene/la</span> <span class='ocrx_word' id='word_1_111' title='bbox 371 821 481 843; x_wconf 74' lang='eng' dir='ltr'>u/iATCC</span> <span class='ocrx_word' id='word_1_112' title='bbox 492 822 584 842; x_wconf 75' lang='eng' dir='ltr'>49627T</span> <span class='ocrx_word' id='word_1_113' title='bbox 594 819 746 847; x_wconf 74' lang='eng' dir='ltr'>(AF292373)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 593 860 1180 888; baseline 0 -5"><span class='ocrx_word' id='word_1_114' title='bbox 593 862 748 883; x_wconf 72' lang='eng' dir='ltr'>Eubaoler/i/m</span> <span class='ocrx_word' id='word_1_115' title='bbox 756 862 857 883; x_wconf 73' lang='eng' dir='ltr'>//&#39;mosum</span> <span class='ocrx_word' id='word_1_116' title='bbox 864 862 942 883; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_117' title='bbox 952 862 1028 883; x_wconf 80' lang='eng' dir='ltr'>8486T</span> <span class='ocrx_word' id='word_1_118' title='bbox 1037 863 1045 871; x_wconf 78' lang='eng'>*</span> <span class='ocrx_word' id='word_1_119' title='bbox 1055 860 1180 888; x_wconf 82' lang='eng' dir='ltr'>(M59120)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 145 401 181 416">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 145 401 181 416">
+     <span class='ocr_line' id='line_1_33' title="bbox 145 401 181 416; baseline 0 0"><span class='ocrx_word' id='word_1_120' title='bbox 145 401 181 416; x_wconf 85' lang='eng'>316</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 260 465 343 466">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 260 465 343 466">
+     <span class='ocr_line' id='line_1_34' title="bbox 260 465 343 466; baseline 0 500"><span class='ocrx_word' id='word_1_121' title='bbox 260 465 343 466; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 221 485 260 486">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 221 485 260 486">
+     <span class='ocr_line' id='line_1_35' title="bbox 221 485 260 486; baseline 0 480"><span class='ocrx_word' id='word_1_122' title='bbox 221 485 260 486; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 145 496 189 498">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 145 496 189 498">
+     <span class='ocr_line' id='line_1_36' title="bbox 145 496 189 498; baseline 0 468"><span class='ocrx_word' id='word_1_123' title='bbox 145 496 189 498; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 258 199 263 507">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 258 199 263 507">
+     <span class='ocr_line' id='line_1_37' title="bbox 258 199 263 507; baseline 0 459"><span class='ocrx_word' id='word_1_124' title='bbox 258 199 263 507; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 190 296 191 517">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 190 296 191 517">
+     <span class='ocr_line' id='line_1_38' title="bbox 190 296 191 517; baseline 0 449"><span class='ocrx_word' id='word_1_125' title='bbox 190 296 191 517; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 190 296 192 517">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 190 296 192 517">
+     <span class='ocr_line' id='line_1_39' title="bbox 190 296 192 517; baseline 0 449"><span class='ocrx_word' id='word_1_126' title='bbox 190 296 192 517; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 103 492 139 507">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 103 492 139 507">
+     <span class='ocr_line' id='line_1_40' title="bbox 103 492 139 507; baseline 0 0"><span class='ocrx_word' id='word_1_127' title='bbox 103 492 139 507; x_wconf 81' lang='eng'>995</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 260 505 330 507">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 260 505 330 507">
+     <span class='ocr_line' id='line_1_41' title="bbox 260 505 330 507; baseline 0 459"><span class='ocrx_word' id='word_1_128' title='bbox 260 505 330 507; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 190 515 222 517">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 190 515 222 517">
+     <span class='ocr_line' id='line_1_42' title="bbox 190 515 222 517; baseline 0 449"><span class='ocrx_word' id='word_1_129' title='bbox 190 515 222 517; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 221 485 222 547">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 221 485 222 547">
+     <span class='ocr_line' id='line_1_43' title="bbox 221 485 222 547; baseline 0 419"><span class='ocrx_word' id='word_1_130' title='bbox 221 485 222 547; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 118 572 147 574">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 118 572 147 574">
+     <span class='ocr_line' id='line_1_44' title="bbox 118 572 147 574; baseline 0 392"><span class='ocrx_word' id='word_1_131' title='bbox 118 572 147 574; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 61 564 111 580">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 61 564 111 580">
+     <span class='ocr_line' id='line_1_45' title="bbox 61 564 111 580; baseline 0 0"><span class='ocrx_word' id='word_1_132' title='bbox 61 564 111 580; x_wconf 81' lang='eng'>#815</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 145 496 147 650">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 145 496 147 650">
+     <span class='ocr_line' id='line_1_46' title="bbox 145 496 147 650; baseline 0 316"><span class='ocrx_word' id='word_1_133' title='bbox 145 496 147 650; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 67 651 120 652">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 67 651 120 652">
+     <span class='ocr_line' id='line_1_47' title="bbox 67 651 120 652; baseline 0 314"><span class='ocrx_word' id='word_1_134' title='bbox 67 651 120 652; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 152 628 154 670">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 152 628 154 670">
+     <span class='ocr_line' id='line_1_48' title="bbox 152 628 154 670; baseline 0 296"><span class='ocrx_word' id='word_1_135' title='bbox 152 628 154 670; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 9 640 207 659">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 9 640 207 659">
+     <span class='ocr_line' id='line_1_49' title="bbox 9 640 207 659; baseline 0 -4"><span class='ocrx_word' id='word_1_136' title='bbox 9 644 61 659; x_wconf 68' lang='eng'>#950</span> <span class='ocrx_word' id='word_1_137' title='bbox 157 640 207 655; x_wconf 80' lang='eng'>#492</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 118 572 120 731">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 118 572 120 731">
+     <span class='ocr_line' id='line_1_50' title="bbox 118 572 120 731; baseline 0 235"><span class='ocrx_word' id='word_1_138' title='bbox 118 572 120 731; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 118 729 190 731">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 118 729 190 731">
+     <span class='ocr_line' id='line_1_51' title="bbox 118 729 190 731; baseline 0 235"><span class='ocrx_word' id='word_1_139' title='bbox 118 729 190 731; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 188 296 194 751">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 188 296 194 751">
+     <span class='ocr_line' id='line_1_52' title="bbox 188 296 194 751; baseline 0 215"><span class='ocrx_word' id='word_1_140' title='bbox 188 296 194 751; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 195 722 259 738">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 195 722 259 738">
+     <span class='ocr_line' id='line_1_53' title="bbox 195 722 259 738; baseline 0 0"><span class='ocrx_word' id='word_1_141' title='bbox 195 722 259 738; x_wconf 81' lang='eng'>#1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 67 811 131 812">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 67 811 131 812">
+     <span class='ocr_line' id='line_1_54' title="bbox 67 811 131 812; baseline 0 154"><span class='ocrx_word' id='word_1_142' title='bbox 67 811 131 812; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 129 791 131 833">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 129 791 131 833">
+     <span class='ocr_line' id='line_1_55' title="bbox 129 791 131 833; baseline 0 133"><span class='ocrx_word' id='word_1_143' title='bbox 129 791 131 833; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 134 804 185 819">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 134 804 185 819">
+     <span class='ocr_line' id='line_1_56' title="bbox 134 804 185 819; baseline 0 0"><span class='ocrx_word' id='word_1_144' title='bbox 134 804 185 819; x_wconf 73' lang='eng'>#893</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 131 831 231 833">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 131 831 231 833">
+     <span class='ocr_line' id='line_1_57' title="bbox 131 831 231 833; baseline 0 133"><span class='ocrx_word' id='word_1_145' title='bbox 131 831 231 833; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 67 651 68 873">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 67 651 68 873">
+     <span class='ocr_line' id='line_1_58' title="bbox 67 651 68 873; baseline 0 93"><span class='ocrx_word' id='word_1_146' title='bbox 67 651 68 873; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 67 872 578 873">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 67 872 578 873">
+     <span class='ocr_line' id='line_1_59' title="bbox 67 872 578 873; baseline 0 93"><span class='ocrx_word' id='word_1_147' title='bbox 67 872 578 873; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 236 941 268 961">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 236 941 268 961">
+     <span class='ocr_line' id='line_1_60' title="bbox 236 941 268 961; baseline 0 0"><span class='ocrx_word' id='word_1_148' title='bbox 236 941 268 961; x_wconf 93' lang='eng'>0.1</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-001.pbm.png
new file mode 100644
index 00000000..991173be
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-001.pbm.png.hocr
new file mode 100644
index 00000000..584a1a00
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003087-0-001.pbm.png.hocr
@@ -0,0 +1,108 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003087-0-001.pbm.png"; bbox 0 0 947 562; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 10 3 430 65">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 10 3 430 65">
+     <span class='ocr_line' id='line_1_1' title="bbox 200 3 358 29; baseline 0 -7"><span class='ocrx_word' id='word_1_1' title='bbox 200 3 358 29; x_wconf 81' lang='eng' dir='ltr'><em>Heterogeneity</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 10 46 430 65; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 10 46 53 65; x_wconf 84' lang='eng'><em>250</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 103 46 146 65; x_wconf 83' lang='eng'><em>200</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 202 46 245 65; x_wconf 84' lang='eng'><em>150</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 303 46 345 65; x_wconf 90' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 402 46 430 65; x_wconf 89' lang='eng'><em>50</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 513 46 525 65">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 513 46 525 65">
+     <span class='ocr_line' id='line_1_3' title="bbox 513 46 525 65; textangle 90"><span class='ocrx_word' id='word_1_7' title='bbox 513 46 525 65; x_wconf 86' lang='eng' dir='ltr'>O</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 5 80 523 92">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 5 80 523 92">
+     <span class='ocr_line' id='line_1_4' title="bbox 5 80 523 92; baseline 0 470"><span class='ocrx_word' id='word_1_8' title='bbox 5 80 523 92; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 449 105 451 150">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 449 105 451 150">
+     <span class='ocr_line' id='line_1_5' title="bbox 449 105 451 150; baseline 0 936"><span class='ocrx_word' id='word_1_9' title='bbox 449 105 451 150; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 571 136 766 162">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 571 136 766 162">
+     <span class='ocr_line' id='line_1_6' title="bbox 571 136 766 162; baseline -0.005 0"><span class='ocrx_word' id='word_1_10' title='bbox 571 138 648 162; x_wconf 86' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 661 136 766 162; x_wconf 81' lang='eng' dir='ltr'><em>Mt1BBT</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 173 136 175 262">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 173 136 175 262">
+     <span class='ocr_line' id='line_1_7' title="bbox 173 136 175 262; baseline 0 300"><span class='ocrx_word' id='word_1_12' title='bbox 173 136 175 262; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 570 233 912 295">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 570 233 912 295">
+     <span class='ocr_line' id='line_1_8' title="bbox 570 233 912 256; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 570 233 808 256; x_wconf 76' lang='eng' dir='ltr'><em>Asacoharobacter</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 815 233 912 256; x_wconf 78' lang='eng' dir='ltr'><em>ce/atus</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 572 268 754 295; baseline 0.005 -1"><span class='ocrx_word' id='word_1_15' title='bbox 572 271 612 295; x_wconf 86' lang='eng' dir='ltr'><em>DS</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 616 272 638 294; x_wconf 94' lang='eng' dir='ltr'>M</span> <span class='ocrx_word' id='word_1_17' title='bbox 653 273 660 294; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 669 272 684 295; x_wconf 92' lang='eng'>8</span> <span class='ocrx_word' id='word_1_19' title='bbox 689 272 722 295; x_wconf 92' lang='eng'><em>78</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 726 268 754 295; x_wconf 89' lang='eng' dir='ltr'><em>5T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 173 260 444 262">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 173 260 444 262">
+     <span class='ocr_line' id='line_1_10' title="bbox 173 260 444 262; baseline 0 300"><span class='ocrx_word' id='word_1_21' title='bbox 173 260 444 262; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 442 232 444 283">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 442 232 444 283">
+     <span class='ocr_line' id='line_1_11' title="bbox 442 232 444 283; baseline 0 279"><span class='ocrx_word' id='word_1_22' title='bbox 442 232 444 283; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 572 344 943 405">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 572 344 943 405">
+     <span class='ocr_line' id='line_1_12' title="bbox 573 344 943 374; baseline 0.003 -8"><span class='ocrx_word' id='word_1_23' title='bbox 573 344 726 374; x_wconf 82' lang='eng' dir='ltr'><em>Eggen‘he/la</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 736 344 943 374; x_wconf 83' lang='eng' dir='ltr'><em>hongkongens/s</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 572 379 754 405; baseline 0 0"><span class='ocrx_word' id='word_1_25' title='bbox 572 382 638 405; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 653 384 660 405; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 669 383 698 405; x_wconf 89' lang='eng'><em>61</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 706 379 754 405; x_wconf 76' lang='eng' dir='ltr'><em>OST</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 572 456 801 518">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 572 456 801 518">
+     <span class='ocr_line' id='line_1_14' title="bbox 573 456 801 486; baseline 0 -7"><span class='ocrx_word' id='word_1_29' title='bbox 573 456 726 486; x_wconf 78' lang='eng' dir='ltr'><em>Eggert/Ie/Ia</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 736 456 801 479; x_wconf 79' lang='eng' dir='ltr'><em>/enl‘a</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 572 492 735 518; baseline 0 0"><span class='ocrx_word' id='word_1_31' title='bbox 572 494 612 518; x_wconf 87' lang='eng' dir='ltr'><em>DS</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 616 495 638 518; x_wconf 95' lang='eng' dir='ltr'>M</span> <span class='ocrx_word' id='word_1_33' title='bbox 651 496 665 518; x_wconf 87' lang='eng'>2</span> <span class='ocrx_word' id='word_1_34' title='bbox 670 492 735 518; x_wconf 81' lang='eng' dir='ltr'><em>243T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 343 373 345 509">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 343 373 345 509">
+     <span class='ocr_line' id='line_1_16' title="bbox 343 373 345 509; baseline 0 53"><span class='ocrx_word' id='word_1_35' title='bbox 343 373 345 509; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 345 103 555 535">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 345 103 555 535">
+     <span class='ocr_line' id='line_1_17' title="bbox 345 103 555 535; textangle 90"><span class='ocrx_word' id='word_1_36' title='bbox 345 103 555 535; x_wconf 38' lang='eng' dir='ltr'>ﬂee</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 5 546 520 548">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 5 546 520 548">
+     <span class='ocr_line' id='line_1_18' title="bbox 5 546 520 548; baseline 0 14"><span class='ocrx_word' id='word_1_37' title='bbox 5 546 520 548; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003145-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003145-0-000.pbm.png
new file mode 100644
index 00000000..7bf0d82d
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003145-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003145-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003145-0-000.pbm.png.hocr
new file mode 100644
index 00000000..9a1e9625
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003145-0-000.pbm.png.hocr
@@ -0,0 +1,163 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003145-0-000.pbm.png"; bbox 0 0 971 828; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 19 4 709 57">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 19 4 709 57">
+     <span class='ocr_line' id='line_1_1' title="bbox 19 4 85 24; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 19 4 85 24; x_wconf 88' lang='eng'>0.005</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 266 28 709 57; baseline 0 -6"><span class='ocrx_word' id='word_1_2' title='bbox 266 28 297 51; x_wconf 90' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 310 28 415 57; x_wconf 86' lang='eng' dir='ltr'><em>a/gicola</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 427 28 536 51; x_wconf 83' lang='eng' dir='ltr'><em>DG893T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 543 28 659 57; x_wconf 89' lang='eng' dir='ltr'>(AY2581</span> <span class='ocrx_word' id='word_1_6' title='bbox 669 28 709 57; x_wconf 93' lang='eng'>10)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 182 68 964 826">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 262 68 746 98">
+     <span class='ocr_line' id='line_1_3' title="bbox 262 68 746 98; baseline 0 -7"><span class='ocrx_word' id='word_1_7' title='bbox 262 69 293 91; x_wconf 92' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 306 69 443 98; x_wconf 88' lang='eng' dir='ltr'><em>salsuginis</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 453 68 574 92; x_wconf 85' lang='eng' dir='ltr'><em>SD—14BT</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 582 68 746 98; x_wconf 88' lang='eng' dir='ltr'>(EF028328)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 233 110 719 139">
+     <span class='ocr_line' id='line_1_4' title="bbox 233 110 719 139; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 233 110 263 133; x_wconf 91' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 276 110 408 133; x_wconf 86' lang='eng' dir='ltr'><em>ﬂavimaris</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 418 110 542 133; x_wconf 90' lang='eng' dir='ltr'><em>SW-145T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 553 110 719 139; x_wconf 87' lang='eng' dir='ltr'>(AY517632)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 204 150 658 180">
+     <span class='ocr_line' id='line_1_5' title="bbox 204 150 658 180; baseline 0 -7"><span class='ocrx_word' id='word_1_15' title='bbox 204 150 234 173; x_wconf 90' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 247 150 383 180; x_wconf 80' lang='eng' dir='ltr'><em>lipolyticus</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 393 150 485 173; x_wconf 84' lang='eng' dir='ltr'><em>SM19T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 493 150 658 180; x_wconf 87' lang='eng' dir='ltr'><em>(AY147906)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 276 190 721 220">
+     <span class='ocr_line' id='line_1_6' title="bbox 276 190 721 220; baseline 0.002 -7"><span class='ocrx_word' id='word_1_19' title='bbox 276 191 306 213; x_wconf 90' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 319 191 470 214; x_wconf 87' lang='eng' dir='ltr'><em>sediminum</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 482 191 549 214; x_wconf 80' lang='eng' dir='ltr'><em>R65T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 560 190 721 220; x_wconf 85' lang='eng' dir='ltr'><em>(AJ609270)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 331 231 789 260">
+     <span class='ocr_line' id='line_1_7' title="bbox 331 231 789 260; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 331 231 361 254; x_wconf 95' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 375 231 509 254; x_wconf 84' lang='eng' dir='ltr'><em>maritimus</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 519 231 561 254; x_wconf 88' lang='eng' dir='ltr'><em>CK</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 571 231 617 254; x_wconf 88' lang='eng' dir='ltr'><em>47T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 629 231 789 260; x_wconf 84' lang='eng' dir='ltr'><em>(AJ704395)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 397 271 858 301">
+     <span class='ocr_line' id='line_1_8' title="bbox 397 271 858 301; baseline 0 -7"><span class='ocrx_word' id='word_1_28' title='bbox 397 271 427 294; x_wconf 96' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 440 271 571 301; x_wconf 86' lang='eng' dir='ltr'><em>salicampi</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 581 271 683 294; x_wconf 91' lang='eng' dir='ltr'><em>ISL-40T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 694 271 858 301; x_wconf 85' lang='eng' dir='ltr'>(EF486354)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 185 312 775 342">
+     <span class='ocr_line' id='line_1_9' title="bbox 185 312 775 342; baseline 0 -7"><span class='ocrx_word' id='word_1_32' title='bbox 185 312 216 335; x_wconf 96' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 229 312 408 341; x_wconf 87' lang='eng' dir='ltr'><em>gudaonensis</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 418 312 597 335; x_wconf 77' lang='eng' dir='ltr'><em>SLO14BB1AT</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 605 312 775 342; x_wconf 89' lang='eng' dir='ltr'><em>(DQ414419)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 292 352 774 382">
+     <span class='ocr_line' id='line_1_10' title="bbox 292 352 774 382; baseline -0.002 -6"><span class='ocrx_word' id='word_1_36' title='bbox 292 353 322 375; x_wconf 97' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 335 353 500 382; x_wconf 88' lang='eng' dir='ltr'><em>bryozoorum</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 511 352 567 376; x_wconf 90' lang='eng'>50—1</span> <span class='ocrx_word' id='word_1_39' title='bbox 576 352 602 375; x_wconf 95' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 613 352 774 382; x_wconf 87' lang='eng' dir='ltr'><em>(AJ609271)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 245 393 847 422">
+     <span class='ocr_line' id='line_1_11' title="bbox 245 393 847 422; baseline 0 -6"><span class='ocrx_word' id='word_1_41' title='bbox 245 393 275 416; x_wconf 98' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 288 393 489 422; x_wconf 89' lang='eng' dir='ltr'><em>segnicrescens</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 499 393 569 416; x_wconf 80' lang='eng'>8801</span> <span class='ocrx_word' id='word_1_44' title='bbox 578 393 587 416; x_wconf 86' lang='eng'>1</span> <span class='ocrx_word' id='word_1_45' title='bbox 595 393 671 416; x_wconf 91' lang='eng' dir='ltr'><em>B1-4T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 683 393 847 422; x_wconf 88' lang='eng' dir='ltr'>(EF157832)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 230 433 709 463">
+     <span class='ocr_line' id='line_1_12' title="bbox 230 433 709 463; baseline 0 -7"><span class='ocrx_word' id='word_1_47' title='bbox 230 433 261 456; x_wconf 98' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 273 433 408 456; x_wconf 85' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 419 433 527 456; x_wconf 91' lang='eng' dir='ltr'><em>DD-M3T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 539 433 709 463; x_wconf 86' lang='eng' dir='ltr'>(DQ325514)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 245 471 808 501">
+     <span class='ocr_line' id='line_1_13' title="bbox 245 471 808 501; baseline 0 -6"><span class='ocrx_word' id='word_1_51' title='bbox 245 472 276 495; x_wconf 96' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 288 472 501 495; x_wconf 89' lang='eng' dir='ltr'><em>santoriniensis</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 513 471 630 495; x_wconf 92' lang='eng' dir='ltr'><em>NKSG1T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 641 472 808 501; x_wconf 88' lang='eng' dir='ltr'><em>(EU496088)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 212 514 671 543">
+     <span class='ocr_line' id='line_1_14' title="bbox 212 514 671 543; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 212 514 242 537; x_wconf 97' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 255 514 372 543; x_wconf 85' lang='eng' dir='ltr'><em>pelagius</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 383 514 489 537; x_wconf 80' lang='eng' dir='ltr'><em>H8225T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 500 514 671 543; x_wconf 90' lang='eng' dir='ltr'><em>(DQ458821)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 182 554 964 624">
+     <span class='ocr_line' id='line_1_15' title="bbox 182 554 964 584; baseline 0 -7"><span class='ocrx_word' id='word_1_59' title='bbox 182 557 223 577; x_wconf 85' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 270 554 300 577; x_wconf 98' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 313 554 626 584; x_wconf 83' lang='eng' dir='ltr'><em>hydrocarbonoclasticus</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 635 554 720 577; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 730 554 830 577; x_wconf 87' lang='eng' dir='ltr'><em>49840T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 837 554 964 584; x_wconf 90' lang='eng' dir='ltr'>(X67022)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 239 594 668 624; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 239 595 269 618; x_wconf 98' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 282 595 420 624; x_wconf 86' lang='eng' dir='ltr'><em>aquaeolei</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 427 595 496 618; x_wconf 90' lang='eng' dir='ltr'><em>VT8T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 508 594 668 624; x_wconf 84' lang='eng' dir='ltr'>(AJOOO726)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 387 635 903 665">
+     <span class='ocr_line' id='line_1_17' title="bbox 387 635 903 665; baseline 0 -6"><span class='ocrx_word' id='word_1_69' title='bbox 387 635 417 658; x_wconf 98' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 431 635 591 664; x_wconf 86' lang='eng' dir='ltr'><em>daepoensis</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 602 635 725 659; x_wconf 88' lang='eng' dir='ltr'><em>SW—156T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 737 635 903 665; x_wconf 87' lang='eng' dir='ltr'><em>(AY517633)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 379 675 814 705">
+     <span class='ocr_line' id='line_1_18' title="bbox 379 675 814 705; baseline 0 -6"><span class='ocrx_word' id='word_1_73' title='bbox 379 676 409 699; x_wconf 98' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 424 675 553 699; x_wconf 88' lang='eng' dir='ltr'><em>viniﬁrmus</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 565 676 632 699; x_wconf 91' lang='eng' dir='ltr'><em>FB1T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 643 675 814 705; x_wconf 84' lang='eng' dir='ltr'>(DQ235263)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 236 716 962 826">
+     <span class='ocr_line' id='line_1_19' title="bbox 409 716 933 746; baseline 0 -7"><span class='ocrx_word' id='word_1_77' title='bbox 409 716 440 739; x_wconf 98' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 453 716 583 739; x_wconf 83' lang='eng' dir='ltr'><em>excel/ens</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 595 716 663 739; x_wconf 93' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 675 716 756 739; x_wconf 83' lang='eng' dir='ltr'><em>3809T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 767 716 933 746; x_wconf 90' lang='eng' dir='ltr'>(AY180101)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 261 756 962 786; baseline 0.006 -10"><span class='ocrx_word' id='word_1_82' title='bbox 261 756 288 776; x_wconf 90' lang='eng'>57</span> <span class='ocrx_word' id='word_1_83' title='bbox 531 756 561 779; x_wconf 97' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 574 756 671 780; x_wconf 87' lang='eng' dir='ltr'><em>litoralis</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 681 756 787 780; x_wconf 89' lang='eng' dir='ltr'><em>SW—45T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 799 756 962 786; x_wconf 87' lang='eng' dir='ltr'><em>(AF479689)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 236 797 702 826; baseline 0 -6"><span class='ocrx_word' id='word_1_87' title='bbox 236 797 266 820; x_wconf 99' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 279 797 420 820; x_wconf 77' lang='eng' dir='ltr'><em>Iutaoensis</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 430 797 530 820; x_wconf 91' lang='eng' dir='ltr'><em>T5054T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 538 797 702 826; x_wconf 88' lang='eng' dir='ltr'>(AF288157)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 0 38 409 786">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 0 38 409 786">
+     <span class='ocr_line' id='line_1_22' title="bbox 58 38 261 113; baseline 0 0"><span class='ocrx_word' id='word_1_91' title='bbox 58 38 261 113; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 58 113 231 135; baseline 0 693"><span class='ocrx_word' id='word_1_92' title='bbox 58 113 231 135; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 58 135 204 153; baseline 0 675"><span class='ocrx_word' id='word_1_93' title='bbox 58 135 204 153; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 21 153 204 195; baseline 0 633"><span class='ocrx_word' id='word_1_94' title='bbox 21 153 204 195; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 21 195 276 235; baseline 0 593"><span class='ocrx_word' id='word_1_95' title='bbox 21 195 276 235; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 21 235 331 274; baseline 0 554"><span class='ocrx_word' id='word_1_96' title='bbox 21 235 331 274; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 21 274 392 297; baseline 0 531"><span class='ocrx_word' id='word_1_97' title='bbox 21 274 392 297; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 21 297 185 316; baseline 0 512"><span class='ocrx_word' id='word_1_98' title='bbox 21 297 185 316; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 0 316 288 379; baseline 0 -22"><span class='ocrx_word' id='word_1_99' title='bbox 0 316 288 379; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 0 379 245 478; baseline 0 -42"><span class='ocrx_word' id='word_1_100' title='bbox 0 379 245 478; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 0 478 242 557; baseline 0 -57"><span class='ocrx_word' id='word_1_101' title='bbox 0 478 242 557; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 0 557 236 599; baseline 0 0"><span class='ocrx_word' id='word_1_102' title='bbox 0 557 236 599; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 0 599 385 660; baseline 0 0"><span class='ocrx_word' id='word_1_103' title='bbox 0 599 385 660; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 0 660 379 680; baseline 0 148"><span class='ocrx_word' id='word_1_104' title='bbox 0 660 379 680; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 0 680 379 720; baseline 0 108"><span class='ocrx_word' id='word_1_105' title='bbox 0 680 379 720; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 0 720 404 746; baseline 0 82"><span class='ocrx_word' id='word_1_106' title='bbox 0 720 404 746; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 0 746 409 786; baseline 0 -25"><span class='ocrx_word' id='word_1_107' title='bbox 0 746 261 786; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_108' title='bbox 288 746 409 761; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 223 557 268 587">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 223 557 268 587">
+     <span class='ocr_line' id='line_1_39' title="bbox 223 557 268 587; baseline 0 -8"><span class='ocrx_word' id='word_1_109' title='bbox 223 557 268 587; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 0 761 525 812">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 0 761 525 812">
+     <span class='ocr_line' id='line_1_40' title="bbox 290 761 525 783; baseline 0 45"><span class='ocrx_word' id='word_1_110' title='bbox 290 761 525 783; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 0 786 232 812; baseline 0 16"><span class='ocrx_word' id='word_1_111' title='bbox 0 786 232 812; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003152-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003152-0-001.pbm.png
new file mode 100644
index 00000000..75030ed3
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003152-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003152-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003152-0-001.pbm.png.hocr
new file mode 100644
index 00000000..1b9d0da9
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003152-0-001.pbm.png.hocr
@@ -0,0 +1,114 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003152-0-001.pbm.png"; bbox 0 0 1479 1433; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 1 1067 48 1087">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 1 1067 48 1087">
+     <span class='ocr_line' id='line_1_1' title="bbox 1 1067 48 1087; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 1 1067 48 1087; x_wconf 89' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 81 1 137 21">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 81 1 137 21">
+     <span class='ocr_line' id='line_1_2' title="bbox 81 1 137 21; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 81 1 137 21; x_wconf 91' lang='eng'><em>0.05</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 288 22 1478 1431">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 288 22 1478 1431">
+     <span class='ocr_line' id='line_1_3' title="bbox 465 22 1386 60; baseline 0 -9"><span class='ocrx_word' id='word_1_3' title='bbox 465 40 513 60; x_wconf 67' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 583 25 803 51; x_wconf 85' lang='eng' dir='ltr'><em>Chelativorans</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 816 25 1044 59; x_wconf 91' lang='eng' dir='ltr'><em>oligotrophicus</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1058 22 1177 51; x_wconf 96' lang='eng' dir='ltr'><em>LPM-4T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1190 22 1386 56; x_wconf 89' lang='eng' dir='ltr'>(EF457242)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 481 63 1415 100; baseline 0.001 -9"><span class='ocrx_word' id='word_1_8' title='bbox 481 70 512 91; x_wconf 85' lang='eng'><em>56</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 548 66 768 93; x_wconf 85' lang='eng' dir='ltr'><em>Che/ativorans</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 781 66 1008 100; x_wconf 88' lang='eng' dir='ltr'><em>multitrophicus</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1020 66 1096 92; x_wconf 94' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1111 63 1415 98; x_wconf 74' lang='eng' dir='ltr'>9103T(EF457243)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 541 106 878 142; baseline 0 -7"><span class='ocrx_word' id='word_1_13' title='bbox 541 108 632 135; x_wconf 86' lang='eng' dir='ltr'><em>BNC1</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 652 106 878 142; x_wconf 79' lang='eng' dir='ltr'>(NC_008254)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 600 147 1382 181; baseline 0.001 -6"><span class='ocrx_word' id='word_1_15' title='bbox 600 150 795 176; x_wconf 80' lang='eng' dir='ltr'><em>Aminobacter</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 804 150 996 176; x_wconf 84' lang='eng' dir='ltr'><em>aminovorans</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1009 150 1082 176; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1097 147 1189 176; x_wconf 90' lang='eng' dir='ltr'><em>7048T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1201 147 1280 181; x_wconf 74' lang='eng' dir='ltr'>(A101</span> <span class='ocrx_word' id='word_1_20' title='bbox 1293 151 1301 175; x_wconf 98' lang='eng'>1</span> <span class='ocrx_word' id='word_1_21' title='bbox 1313 147 1382 181; x_wconf 96' lang='eng'>759)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 547 184 1369 222; baseline 0 -5"><span class='ocrx_word' id='word_1_22' title='bbox 547 184 578 205; x_wconf 73' lang='eng'>69</span> <span class='ocrx_word' id='word_1_23' title='bbox 600 192 795 217; x_wconf 86' lang='eng' dir='ltr'><em>Aminobacter</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 804 192 996 217; x_wconf 78' lang='eng' dir='ltr'><em>aminovorans</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1009 191 1082 217; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1096 193 1175 217; x_wconf 93' lang='eng'>6450</span> <span class='ocrx_word' id='word_1_27' title='bbox 1187 189 1267 222; x_wconf 89' lang='eng' dir='ltr'>(AJ01</span> <span class='ocrx_word' id='word_1_28' title='bbox 1280 189 1369 222; x_wconf 91' lang='eng'>1762)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 538 230 1272 264; baseline 0.001 -7"><span class='ocrx_word' id='word_1_29' title='bbox 538 237 569 257; x_wconf 91' lang='eng'>64</span> <span class='ocrx_word' id='word_1_30' title='bbox 614 233 808 259; x_wconf 83' lang='eng' dir='ltr'><em>Aminobacter</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 819 233 957 259; x_wconf 85' lang='eng' dir='ltr'><em>ciceronei</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 967 230 1073 258; x_wconf 92' lang='eng' dir='ltr'><em>IMB-1T</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 1085 230 1272 264; x_wconf 86' lang='eng' dir='ltr'>(AF034798)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 516 266 1368 308; baseline 0 -8"><span class='ocrx_word' id='word_1_34' title='bbox 516 266 563 286; x_wconf 71' lang='eng'>100</span> <span class='ocrx_word' id='word_1_35' title='bbox 607 275 802 300; x_wconf 76' lang='eng' dir='ltr'><em>Aminobacter</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 811 275 983 308; x_wconf 80' lang='eng' dir='ltr'><em>aganoens/s</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 995 274 1068 300; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1084 276 1155 300; x_wconf 88' lang='eng'><em>7051</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1164 272 1176 288; x_wconf 69' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_40' title='bbox 1187 272 1267 305; x_wconf 92' lang='eng' dir='ltr'>(AJO1</span> <span class='ocrx_word' id='word_1_41' title='bbox 1279 272 1368 305; x_wconf 88' lang='eng'>1760)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 457 313 1375 350; baseline 0 -8"><span class='ocrx_word' id='word_1_42' title='bbox 457 324 488 345; x_wconf 90' lang='eng'>53</span> <span class='ocrx_word' id='word_1_43' title='bbox 607 316 802 342; x_wconf 79' lang='eng' dir='ltr'><em>Aminobacter</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 812 316 989 350; x_wconf 81' lang='eng' dir='ltr'><em>niigataensis</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1002 316 1075 342; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1090 313 1182 342; x_wconf 90' lang='eng' dir='ltr'><em>7050T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1194 313 1273 347; x_wconf 92' lang='eng' dir='ltr'>(AJO1</span> <span class='ocrx_word' id='word_1_48' title='bbox 1286 318 1294 342; x_wconf 96' lang='eng'>1</span> <span class='ocrx_word' id='word_1_49' title='bbox 1306 314 1375 347; x_wconf 86' lang='eng'>761)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 605 355 1304 389; baseline 0 -5"><span class='ocrx_word' id='word_1_50' title='bbox 605 358 799 384; x_wconf 78' lang='eng' dir='ltr'><em>Aminobacter</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 809 358 966 384; x_wconf 86' lang='eng' dir='ltr'><em>lissarensis</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 978 355 1106 384; x_wconf 80' lang='eng' dir='ltr'><em>CC495T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1117 355 1304 389; x_wconf 92' lang='eng' dir='ltr'>(AF107722)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 547 396 1236 430; baseline 0 -5"><span class='ocrx_word' id='word_1_54' title='bbox 547 400 778 425; x_wconf 79' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 791 400 954 425; x_wconf 85' lang='eng' dir='ltr'><em>chacoense</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 967 396 1043 425; x_wconf 84' lang='eng' dir='ltr'><em>PR5T</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 1055 397 1236 430; x_wconf 90' lang='eng' dir='ltr'>(AJ278249)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 471 434 1199 468; baseline 0 -5"><span class='ocrx_word' id='word_1_58' title='bbox 471 446 499 466; x_wconf 83' lang='eng'>9</span> <span class='ocrx_word' id='word_1_59' title='bbox 539 438 769 463; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 782 438 864 463; x_wconf 84' lang='eng' dir='ltr'><em>Ciceri</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 874 434 1039 463; x_wconf 77' lang='eng' dir='ltr'><em>UPM-Ca7T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1050 435 1199 468; x_wconf 90' lang='eng' dir='ltr'>(U07934)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 534 480 1213 514; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 534 483 765 509; x_wconf 85' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 777 483 822 509; x_wconf 75' lang='eng' dir='ltr'><em>loti</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 831 483 926 509; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 938 480 1053 509; x_wconf 80' lang='eng' dir='ltr'><em>33669T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 1064 480 1213 514; x_wconf 89' lang='eng' dir='ltr'>(D14514)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 453 521 1295 557; baseline 0.002 -9"><span class='ocrx_word' id='word_1_68' title='bbox 453 528 483 548; x_wconf 91' lang='eng'>73</span> <span class='ocrx_word' id='word_1_69' title='bbox 505 524 736 550; x_wconf 81' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 750 527 926 557; x_wconf 79' lang='eng' dir='ltr'><em>temperatum</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 938 521 1097 550; x_wconf 89' lang='eng' dir='ltr'><em>SDWO18T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1108 521 1295 555; x_wconf 88' lang='eng' dir='ltr'>(AF508208)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 505 563 1326 597; baseline 0.001 -6"><span class='ocrx_word' id='word_1_73' title='bbox 505 566 736 592; x_wconf 85' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 748 566 974 592; x_wconf 82' lang='eng' dir='ltr'><em>mediterraneum</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 987 563 1173 592; x_wconf 89' lang='eng' dir='ltr'><em>UPM-Ca36T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1184 563 1326 597; x_wconf 88' lang='eng' dir='ltr'>(L38825)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 597 604 1328 638; baseline 0 -5"><span class='ocrx_word' id='word_1_77' title='bbox 597 608 828 633; x_wconf 85' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 841 608 1039 633; x_wconf 84' lang='eng' dir='ltr'><em>tianshanense</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1050 608 1099 633; x_wconf 96' lang='eng' dir='ltr'><em>A-1</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1110 604 1167 633; x_wconf 91' lang='eng' dir='ltr'><em>BST</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 1179 605 1247 638; x_wconf 92' lang='eng' dir='ltr'>(U71</span> <span class='ocrx_word' id='word_1_82' title='bbox 1256 605 1328 638; x_wconf 89' lang='eng' dir='ltr'>O79)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 436 646 1255 684; baseline 0 -10"><span class='ocrx_word' id='word_1_83' title='bbox 436 673 443 679; x_wconf 83' lang='eng'>_</span> <span class='ocrx_word' id='word_1_84' title='bbox 453 676 459 684; x_wconf 41' lang='eng' dir='ltr'><strong><em>I</em></strong></span> <span class='ocrx_word' id='word_1_85' title='bbox 508 649 738 675; x_wconf 86' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 751 649 860 675; x_wconf 80' lang='eng' dir='ltr'><em>huakuii</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 871 649 967 675; x_wconf 90' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 982 646 1094 675; x_wconf 88' lang='eng' dir='ltr'><em>15243T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 1106 646 1255 680; x_wconf 91' lang='eng' dir='ltr'>(D13431)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 435 681 1294 728; baseline 0 -12"><span class='ocrx_word' id='word_1_90' title='bbox 435 681 472 728; x_wconf 78' lang='eng'>65</span> <span class='ocrx_word' id='word_1_91' title='bbox 523 691 754 716; x_wconf 81' lang='eng' dir='ltr'><em>Mesorhizob/um</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 764 690 923 724; x_wconf 80' lang='eng' dir='ltr'><em>plur/farium</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 936 690 1008 716; x_wconf 85' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1024 692 1033 716; x_wconf 96' lang='eng'>1</span> <span class='ocrx_word' id='word_1_95' title='bbox 1045 687 1137 716; x_wconf 88' lang='eng' dir='ltr'><em>1892T</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 1148 688 1294 721; x_wconf 91' lang='eng' dir='ltr'>(Y14158)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 448 729 1343 767; baseline 0 -9"><span class='ocrx_word' id='word_1_97' title='bbox 448 747 479 767; x_wconf 69' lang='eng'>72</span> <span class='ocrx_word' id='word_1_98' title='bbox 519 733 750 758; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 762 733 974 766; x_wconf 81' lang='eng' dir='ltr'><em>septentriona/e</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 986 729 1145 758; x_wconf 89' lang='eng' dir='ltr'><em>SDW014T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 1156 730 1343 763; x_wconf 91' lang='eng' dir='ltr'>(AF508207)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 288 771 1334 807; baseline 0.008 -16"><span class='ocrx_word' id='word_1_102' title='bbox 288 771 335 792; x_wconf 94' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 503 774 734 800; x_wconf 80' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 746 774 895 807; x_wconf 87' lang='eng' dir='ltr'><em>amorphae</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 906 774 1009 800; x_wconf 91' lang='eng' dir='ltr'><strong>ACCC</strong></span> <span class='ocrx_word' id='word_1_106' title='bbox 1024 771 1136 800; x_wconf 87' lang='eng' dir='ltr'><em>19665T</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 1147 771 1334 805; x_wconf 89' lang='eng' dir='ltr'>(AFO41442)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 650 813 1478 846; baseline 0 -5"><span class='ocrx_word' id='word_1_108' title='bbox 650 816 881 841; x_wconf 86' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 893 816 1006 841; x_wconf 85' lang='eng' dir='ltr'><em>albiziae</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 1018 815 1140 841; x_wconf 93' lang='eng' dir='ltr'>CCBAU</span> <span class='ocrx_word' id='word_1_111' title='bbox 1154 817 1186 841; x_wconf 88' lang='eng'>61</span> <span class='ocrx_word' id='word_1_112' title='bbox 1198 817 1206 841; x_wconf 98' lang='eng'>1</span> <span class='ocrx_word' id='word_1_113' title='bbox 1217 813 1268 841; x_wconf 90' lang='eng' dir='ltr'><em>58T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1280 813 1478 846; x_wconf 80' lang='eng' dir='ltr'>(D0100066)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 688 854 1434 891; baseline 0 -8"><span class='ocrx_word' id='word_1_115' title='bbox 688 857 918 883; x_wconf 81' lang='eng' dir='ltr'><em>Mesorh/zobium</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 932 857 1161 891; x_wconf 80' lang='eng' dir='ltr'><em>thiogangeticum</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 1174 854 1241 883; x_wconf 90' lang='eng' dir='ltr'><em>SJTT</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 1252 854 1434 888; x_wconf 86' lang='eng' dir='ltr'>(AJ864462)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 468 896 1276 930; baseline 0.001 -7"><span class='ocrx_word' id='word_1_119' title='bbox 468 903 499 923; x_wconf 86' lang='eng'>97</span> <span class='ocrx_word' id='word_1_120' title='bbox 567 899 852 925; x_wconf 84' lang='eng' dir='ltr'><em>Pseudaminobacter</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 862 899 970 925; x_wconf 77' lang='eng' dir='ltr'><em>defluvii</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 978 899 1029 924; x_wconf 96' lang='eng' dir='ltr'><em>THI</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 1043 896 1116 925; x_wconf 89' lang='eng' dir='ltr'><em>O51T</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 1127 896 1276 930; x_wconf 88' lang='eng' dir='ltr'>(D32248)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 424 937 1449 974; baseline 0.001 -9"><span class='ocrx_word' id='word_1_125' title='bbox 424 944 454 965; x_wconf 92' lang='eng'>87</span> <span class='ocrx_word' id='word_1_126' title='bbox 606 941 892 966; x_wconf 83' lang='eng' dir='ltr'><em>Pseudam/nobacter</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 901 941 1137 974; x_wconf 75' lang='eng' dir='ltr'><em>salicy/atoxidans</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 1150 941 1210 966; x_wconf 93' lang='eng' dir='ltr'><em>BN1</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 1221 937 1251 966; x_wconf 92' lang='eng' dir='ltr'><em>2T</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 1262 938 1449 972; x_wconf 90' lang='eng' dir='ltr'>(AFO72542)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 500 979 1420 1013; baseline 0.002 -7"><span class='ocrx_word' id='word_1_131' title='bbox 500 986 548 1006; x_wconf 82' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 646 982 846 1008; x_wconf 82' lang='eng' dir='ltr'><em>Def/uvibacter</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 856 982 1014 1008; x_wconf 78' lang='eng' dir='ltr'><em>lusatiensis</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 1027 982 1100 1008; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 1116 984 1124 1007; x_wconf 95' lang='eng'>1</span> <span class='ocrx_word' id='word_1_136' title='bbox 1137 979 1228 1008; x_wconf 87' lang='eng' dir='ltr'><em>1099T</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 1239 979 1420 1013; x_wconf 87' lang='eng' dir='ltr'>(AJ132378)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 613 1021 1342 1057; baseline 0.001 -8"><span class='ocrx_word' id='word_1_138' title='bbox 613 1024 852 1057; x_wconf 87' lang='eng' dir='ltr'><em>Aquamicrobium</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 865 1024 973 1050; x_wconf 80' lang='eng' dir='ltr'><em>def/uvii</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 984 1024 1057 1050; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 1073 1025 1081 1049; x_wconf 97' lang='eng'>1</span> <span class='ocrx_word' id='word_1_142' title='bbox 1094 1021 1185 1050; x_wconf 79' lang='eng' dir='ltr'><em>1603T</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 1196 1021 1342 1055; x_wconf 90' lang='eng' dir='ltr'>(Y15403)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 410 1062 1188 1096; baseline 0 -5"><span class='ocrx_word' id='word_1_144' title='bbox 410 1064 458 1084; x_wconf 70' lang='eng'>100</span> <span class='ocrx_word' id='word_1_145' title='bbox 493 1065 709 1091; x_wconf 81' lang='eng' dir='ltr'><em>Sinorhizobium</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 722 1065 797 1091; x_wconf 80' lang='eng' dir='ltr'><em>fred/i</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 806 1065 900 1091; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 913 1062 1027 1091; x_wconf 79' lang='eng' dir='ltr'><em>35423T</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 1039 1063 1188 1096; x_wconf 92' lang='eng' dir='ltr'>(D14516)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 484 1104 1291 1138; baseline 0 -6"><span class='ocrx_word' id='word_1_150' title='bbox 484 1107 700 1132; x_wconf 78' lang='eng' dir='ltr'><em>S/norhizobium</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 712 1107 896 1132; x_wconf 85' lang='eng' dir='ltr'><em>americanum</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 909 1107 1006 1132; x_wconf 92' lang='eng' dir='ltr'>CFNEI</span> <span class='ocrx_word' id='word_1_153' title='bbox 1022 1104 1093 1132; x_wconf 89' lang='eng' dir='ltr'><em>156T</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 1104 1104 1291 1138; x_wconf 87' lang='eng' dir='ltr'>(AF506513)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 600 1146 1273 1182; baseline 0 -8"><span class='ocrx_word' id='word_1_155' title='bbox 600 1148 823 1182; x_wconf 80' lang='eng' dir='ltr'><em>Agrobacter/um</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 836 1148 1017 1174; x_wconf 79' lang='eng' dir='ltr'><em>tumefaciens</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 1029 1148 1074 1174; x_wconf 90' lang='eng' dir='ltr'>C4</span> <span class='ocrx_word' id='word_1_158' title='bbox 1086 1146 1273 1179; x_wconf 87' lang='eng' dir='ltr'>(AF508093)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 618 1187 1299 1224; baseline 0 -8"><span class='ocrx_word' id='word_1_159' title='bbox 618 1190 776 1216; x_wconf 80' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 787 1190 905 1224; x_wconf 87' lang='eng' dir='ltr'><em>ga/egae</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 916 1190 1011 1216; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 1023 1187 1139 1216; x_wconf 91' lang='eng' dir='ltr'><em>43677T</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 1150 1188 1198 1221; x_wconf 91' lang='eng' dir='ltr'><em>(D1</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 1210 1188 1299 1221; x_wconf 88' lang='eng'>1343)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 473 1228 1256 1265; baseline 0.001 -8"><span class='ocrx_word' id='word_1_165' title='bbox 473 1241 520 1262; x_wconf 83' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 661 1232 820 1258; x_wconf 80' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 834 1232 926 1265; x_wconf 77' lang='eng' dir='ltr'><em>tropici</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 936 1232 1011 1258; x_wconf 91' lang='eng' dir='ltr'><em>CIAT</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 1023 1228 1096 1258; x_wconf 89' lang='eng' dir='ltr'><em>899T</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 1108 1229 1256 1263; x_wconf 90' lang='eng' dir='ltr'>(U89832)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 547 1269 1469 1307; baseline 0 -8"><span class='ocrx_word' id='word_1_171' title='bbox 547 1269 594 1290; x_wconf 74' lang='eng'>100</span> <span class='ocrx_word' id='word_1_172' title='bbox 632 1274 791 1299; x_wconf 78' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 803 1274 1034 1307; x_wconf 82' lang='eng' dir='ltr'><em>leguminosarum</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 1046 1273 1140 1299; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 1156 1270 1268 1299; x_wconf 94' lang='eng' dir='ltr'><em>10004T</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 1279 1271 1469 1304; x_wconf 88' lang='eng' dir='ltr'>(AY509899)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 644 1312 1150 1346; baseline 0.002 -6"><span class='ocrx_word' id='word_1_177' title='bbox 644 1315 803 1341; x_wconf 82' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 815 1315 860 1341; x_wconf 76' lang='eng' dir='ltr'><em>et/i</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 869 1315 936 1341; x_wconf 88' lang='eng' dir='ltr'><em>CFN</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 950 1316 988 1340; x_wconf 82' lang='eng'><em>42</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 1001 1312 1150 1346; x_wconf 80' lang='eng' dir='ltr'>(U28916)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 441 1354 1301 1390; baseline 0 -8"><span class='ocrx_word' id='word_1_182' title='bbox 441 1358 488 1378; x_wconf 89' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 580 1357 765 1390; x_wconf 85' lang='eng' dir='ltr'><em>Azospiri/lum</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 777 1356 916 1390; x_wconf 80' lang='eng' dir='ltr'><em>lipoferum</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 928 1356 1023 1382; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 1036 1358 1135 1382; x_wconf 87' lang='eng'>29707</span> <span class='ocrx_word' id='word_1_187' title='bbox 1148 1354 1301 1387; x_wconf 87' lang='eng' dir='ltr'>(M59061)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 672 1395 1445 1431; baseline 0 -7"><span class='ocrx_word' id='word_1_188' title='bbox 672 1398 857 1431; x_wconf 84' lang='eng' dir='ltr'><em>Azosp/ri/lum</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 870 1398 1023 1424; x_wconf 83' lang='eng' dir='ltr'><em>bras/lense</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 1034 1398 1129 1424; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 1143 1399 1241 1424; x_wconf 89' lang='eng'>29145</span> <span class='ocrx_word' id='word_1_192' title='bbox 1255 1395 1384 1429; x_wconf 89' lang='eng' dir='ltr'>(AY3241</span> <span class='ocrx_word' id='word_1_193' title='bbox 1397 1395 1445 1429; x_wconf 91' lang='eng'><em>10)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 352 421 383 441">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 352 421 383 441">
+     <span class='ocr_line' id='line_1_37' title="bbox 352 421 383 441; baseline 0 0"><span class='ocrx_word' id='word_1_194' title='bbox 352 421 383 441; x_wconf 84' lang='eng'>98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 385 1172 426 1232">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 385 1172 426 1232">
+     <span class='ocr_line' id='line_1_38' title="bbox 385 1172 416 1193; baseline 0 0"><span class='ocrx_word' id='word_1_195' title='bbox 385 1172 416 1193; x_wconf 86' lang='eng'>89</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 394 1212 426 1232; baseline 0 0"><span class='ocrx_word' id='word_1_196' title='bbox 394 1212 426 1232; x_wconf 90' lang='eng'><em>65</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-001.pbm.png
new file mode 100644
index 00000000..d0112c5a
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-001.pbm.png.hocr
new file mode 100644
index 00000000..eaf0bec4
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-001.pbm.png.hocr
@@ -0,0 +1,67 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003160-0-001.pbm.png"; bbox 0 0 1243 581; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 0 718 76">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 0 0 718 75">
+     <span class='ocr_line' id='line_1_1' title="bbox 54 0 656 35; baseline 0 -7"><span class='ocrx_word' id='word_1_1' title='bbox 54 1 139 28; x_wconf 89' lang='eng' dir='ltr'><em>Mass</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 152 1 279 35; x_wconf 90' lang='eng' dir='ltr'><em>spectral</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 293 1 436 35; x_wconf 85' lang='eng' dir='ltr'><em>similarity</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 450 0 491 35; x_wconf 90' lang='eng'><em>(%</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 506 1 656 35; x_wconf 88' lang='eng' dir='ltr'><em>matches)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 0 48 718 75; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 0 48 18 75; x_wconf 93' lang='eng'>0</span> <span class='ocrx_word' id='word_1_7' title='bbox 107 48 143 75; x_wconf 93' lang='eng'><strong>10</strong></span> <span class='ocrx_word' id='word_1_8' title='bbox 220 48 258 75; x_wconf 87' lang='eng'><em>20</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 334 48 372 75; x_wconf 88' lang='eng'>30</span> <span class='ocrx_word' id='word_1_10' title='bbox 447 48 487 75; x_wconf 93' lang='eng' dir='ltr'><em>4O</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 566 48 603 75; x_wconf 91' lang='eng'><em>50</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 679 48 718 75; x_wconf 88' lang='eng'><em>60</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 7 81 707 96">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 7 81 707 96">
+     <span class='ocr_line' id='line_1_3' title="bbox 7 81 707 96; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 7 81 707 96; x_wconf 93' lang='eng' dir='ltr'><em>|—l—l—l—l—l—L</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 759 104 1243 581">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 760 104 1092 135">
+     <span class='ocr_line' id='line_1_4' title="bbox 760 104 1092 135; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 760 108 872 135; x_wconf 93' lang='eng' dir='ltr'>binotii</span> <span class='ocrx_word' id='word_1_15' title='bbox 882 108 941 135; x_wconf 94' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 956 104 1092 135; x_wconf 88' lang='eng' dir='ltr'><em>101303T</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 760 148 1243 581">
+     <span class='ocr_line' id='line_1_5' title="bbox 760 148 1076 176; baseline 0 -1"><span class='ocrx_word' id='word_1_17' title='bbox 760 148 872 176; x_wconf 90' lang='eng' dir='ltr'>binotii</span> <span class='ocrx_word' id='word_1_18' title='bbox 882 148 941 175; x_wconf 94' lang='eng' dir='ltr'><strong>CIP</strong></span> <span class='ocrx_word' id='word_1_19' title='bbox 956 148 1076 176; x_wconf 90' lang='eng'><strong>102116</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 760 185 1147 216; baseline 0 0"><span class='ocrx_word' id='word_1_20' title='bbox 760 189 924 216; x_wconf 89' lang='eng' dir='ltr'><em>aerolatum</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 937 189 995 216; x_wconf 91' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 1012 185 1147 216; x_wconf 83' lang='eng' dir='ltr'><em>107636T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 761 226 1160 257; baseline -0.003 0"><span class='ocrx_word' id='word_1_23' title='bbox 761 229 937 257; x_wconf 89' lang='eng' dir='ltr'><em>thalassium</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 949 229 1008 257; x_wconf 93' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1024 226 1160 257; x_wconf 86' lang='eng' dir='ltr'><em>105728T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 761 266 1153 297; baseline 0 0"><span class='ocrx_word' id='word_1_26' title='bbox 761 271 930 297; x_wconf 86' lang='eng' dir='ltr'><em>testaceum</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 943 270 1001 297; x_wconf 91' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1018 266 1153 297; x_wconf 84' lang='eng' dir='ltr'><em>104324T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 760 307 1087 338; baseline 0 0"><span class='ocrx_word' id='word_1_29' title='bbox 760 318 864 338; x_wconf 88' lang='eng' dir='ltr'><em>aurum</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 877 310 935 338; x_wconf 92' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 952 307 1087 338; x_wconf 87' lang='eng' dir='ltr'><em>103994T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 760 348 1131 379; baseline 0 0"><span class='ocrx_word' id='word_1_32' title='bbox 760 352 908 379; x_wconf 85' lang='eng' dir='ltr'><em>resistens</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 920 351 979 379; x_wconf 93' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 995 348 1131 379; x_wconf 87' lang='eng' dir='ltr'><em>107265T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 760 388 1243 426; baseline 0 -7"><span class='ocrx_word' id='word_1_35' title='bbox 760 392 1019 426; x_wconf 83' lang='eng' dir='ltr'><em>keratano/yticum</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1032 391 1091 419; x_wconf 92' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1108 388 1243 419; x_wconf 87' lang='eng' dir='ltr'><em>103815T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 760 429 1158 459; baseline 0 0"><span class='ocrx_word' id='word_1_38' title='bbox 760 432 935 459; x_wconf 88' lang='eng' dir='ltr'><em>ﬂavescens</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 947 432 1005 459; x_wconf 93' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 1022 429 1158 459; x_wconf 79' lang='eng' dir='ltr'><em>102401T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 760 469 1234 500; baseline 0 0"><span class='ocrx_word' id='word_1_41' title='bbox 760 473 1012 500; x_wconf 88' lang='eng' dir='ltr'><em>laevaniformans</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1024 473 1083 500; x_wconf 95' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1099 469 1234 500; x_wconf 81' lang='eng' dir='ltr'><em>100934T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 760 510 1114 540; baseline 0 0"><span class='ocrx_word' id='word_1_44' title='bbox 760 513 891 540; x_wconf 89' lang='eng' dir='ltr'><em>foliorum</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 904 513 962 540; x_wconf 92' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 979 510 1114 540; x_wconf 83' lang='eng' dir='ltr'><em>107137T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 760 550 1185 581; baseline -0.002 0"><span class='ocrx_word' id='word_1_47' title='bbox 760 554 962 581; x_wconf 89' lang='eng' dir='ltr'><em>halotolerans</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 974 553 1033 581; x_wconf 92' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1050 550 1185 581; x_wconf 89' lang='eng' dir='ltr'><em>108071T</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 707 108 746 580">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 708 108 745 580">
+     <span class='ocr_line' id='line_1_16' title="bbox 708 108 745 580; textangle 90"><span class='ocrx_word' id='word_1_50' title='bbox 708 108 745 580; x_wconf 64' lang='eng'>::::::::::::</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-002.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-002.pbm.png
new file mode 100644
index 00000000..ababf40b
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-002.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-002.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-002.pbm.png.hocr
new file mode 100644
index 00000000..280f53f1
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003160-0-002.pbm.png.hocr
@@ -0,0 +1,152 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003160-0-002.pbm.png"; bbox 0 0 994 1926; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 6 1654 113 1695">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 6 1654 113 1695">
+     <span class='ocr_line' id='line_1_1' title="bbox 37 1654 78 1672; baseline -0.024 0"><span class='ocrx_word' id='word_1_1' title='bbox 37 1654 78 1672; x_wconf 80' lang='eng'>0.01</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 6 1664 113 1695; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 6 1664 113 1695; x_wconf 83' lang='eng'>|—|</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 207 0 954 1027">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 207 0 954 1027">
+     <span class='ocr_line' id='line_1_3' title="bbox 323 0 937 27; baseline 0 -5"><span class='ocrx_word' id='word_1_3' title='bbox 323 3 473 22; x_wconf 78' lang='eng' dir='ltr'>Leucobacter</span> <span class='ocrx_word' id='word_1_4' title='bbox 478 3 610 27; x_wconf 86' lang='eng' dir='ltr'>komagatae</span> <span class='ocrx_word' id='word_1_5' title='bbox 620 2 693 22; x_wconf 87' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_6' title='bbox 705 0 788 22; x_wconf 90' lang='eng' dir='ltr'>15245T</span> <span class='ocrx_word' id='word_1_7' title='bbox 797 3 937 27; x_wconf 87' lang='eng' dir='ltr'>(AB007419)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 207 34 931 62; baseline 0.001 -6"><span class='ocrx_word' id='word_1_8' title='bbox 207 42 232 59; x_wconf 78' lang='eng'>58</span> <span class='ocrx_word' id='word_1_9' title='bbox 451 37 476 56; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_10' title='bbox 488 37 634 57; x_wconf 84' lang='eng' dir='ltr'>haloto/erans</span> <span class='ocrx_word' id='word_1_11' title='bbox 641 37 686 56; x_wconf 93' lang='eng' dir='ltr'>YIM</span> <span class='ocrx_word' id='word_1_12' title='bbox 697 34 782 57; x_wconf 74' lang='eng' dir='ltr'>70130T</span> <span class='ocrx_word' id='word_1_13' title='bbox 791 37 931 62; x_wconf 85' lang='eng' dir='ltr'>(AY376165)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 317 70 734 96; baseline 0.002 -6"><span class='ocrx_word' id='word_1_14' title='bbox 317 71 344 90; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_15' title='bbox 355 71 435 91; x_wconf 85' lang='eng' dir='ltr'>binotii</span> <span class='ocrx_word' id='word_1_16' title='bbox 443 70 485 90; x_wconf 90' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_17' title='bbox 496 71 583 91; x_wconf 86' lang='eng'>102116</span> <span class='ocrx_word' id='word_1_18' title='bbox 592 71 734 96; x_wconf 88' lang='eng' dir='ltr'>(EU600175)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 250 103 748 130; baseline -0.002 -4"><span class='ocrx_word' id='word_1_19' title='bbox 250 109 287 127; x_wconf 86' lang='eng'>100</span> <span class='ocrx_word' id='word_1_20' title='bbox 339 111 350 125; x_wconf 98' lang='eng'>.</span> <span class='ocrx_word' id='word_1_21' title='bbox 361 105 441 125; x_wconf 88' lang='eng' dir='ltr'>binotii</span> <span class='ocrx_word' id='word_1_22' title='bbox 449 105 491 125; x_wconf 92' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_23' title='bbox 502 103 601 125; x_wconf 90' lang='eng' dir='ltr'>101303T</span> <span class='ocrx_word' id='word_1_24' title='bbox 609 105 748 130; x_wconf 85' lang='eng' dir='ltr'>(EF567306)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 239 135 931 165; baseline -0.001 -5"><span class='ocrx_word' id='word_1_25' title='bbox 239 135 264 152; x_wconf 81' lang='eng'>57</span> <span class='ocrx_word' id='word_1_26' title='bbox 323 140 349 159; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_27' title='bbox 361 140 604 165; x_wconf 76' lang='eng' dir='ltr'>trichotheceno/yticum</span> <span class='ocrx_word' id='word_1_28' title='bbox 614 140 687 160; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_29' title='bbox 699 137 781 160; x_wconf 80' lang='eng' dir='ltr'>15077T</span> <span class='ocrx_word' id='word_1_30' title='bbox 791 140 931 165; x_wconf 91' lang='eng' dir='ltr'>(ABOO4722)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 462 172 954 199; baseline 0 -5"><span class='ocrx_word' id='word_1_31' title='bbox 462 174 488 194; x_wconf 90' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_32' title='bbox 500 174 628 199; x_wconf 83' lang='eng' dir='ltr'>ha/ophi/um</span> <span class='ocrx_word' id='word_1_33' title='bbox 638 174 710 194; x_wconf 92' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_34' title='bbox 722 172 805 194; x_wconf 74' lang='eng' dir='ltr'>16062T</span> <span class='ocrx_word' id='word_1_35' title='bbox 815 174 954 199; x_wconf 92' lang='eng' dir='ltr'>(ABOO4714)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 325 206 734 233; baseline 0 -5"><span class='ocrx_word' id='word_1_36' title='bbox 325 209 351 228; x_wconf 65' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_37' title='bbox 361 209 513 233; x_wconf 82' lang='eng' dir='ltr'>xylanilyticum</span> <span class='ocrx_word' id='word_1_38' title='bbox 523 206 592 228; x_wconf 75' lang='eng' dir='ltr'>SB-ET</span> <span class='ocrx_word' id='word_1_39' title='bbox 599 209 734 233; x_wconf 81' lang='eng' dir='ltr'>(AJ853908)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 327 241 774 268; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 327 243 448 263; x_wconf 86' lang='eng' dir='ltr'><em>M.hominis</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 458 243 530 263; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_42' title='bbox 542 241 625 263; x_wconf 74' lang='eng' dir='ltr'>15708T</span> <span class='ocrx_word' id='word_1_43' title='bbox 634 243 774 268; x_wconf 91' lang='eng' dir='ltr'>(ABOO4727)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 297 275 787 303; baseline 0 -6"><span class='ocrx_word' id='word_1_44' title='bbox 297 277 322 297; x_wconf 91' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 334 277 461 297; x_wconf 79' lang='eng' dir='ltr'>tha/assium</span> <span class='ocrx_word' id='word_1_46' title='bbox 471 277 544 297; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_47' title='bbox 556 275 638 297; x_wconf 79' lang='eng' dir='ltr'>16060T</span> <span class='ocrx_word' id='word_1_48' title='bbox 647 277 787 303; x_wconf 85' lang='eng' dir='ltr'>(ABOO4713)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 224 309 743 337; baseline 0.002 -6"><span class='ocrx_word' id='word_1_49' title='bbox 224 327 241 335; x_wconf 43' lang='eng'><em>.‘</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 311 312 336 331; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_51' title='bbox 348 312 417 332; x_wconf 75' lang='eng' dir='ltr'>terrae</span> <span class='ocrx_word' id='word_1_52' title='bbox 427 312 499 332; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_53' title='bbox 512 309 594 332; x_wconf 89' lang='eng' dir='ltr'>15300T</span> <span class='ocrx_word' id='word_1_54' title='bbox 604 312 743 337; x_wconf 87' lang='eng' dir='ltr'>(AB004720)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 234 344 849 371; baseline 0 -5"><span class='ocrx_word' id='word_1_55' title='bbox 234 352 271 370; x_wconf 78' lang='eng'>100</span> <span class='ocrx_word' id='word_1_56' title='bbox 306 346 332 366; x_wconf 90' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_57' title='bbox 343 346 523 366; x_wconf 84' lang='eng' dir='ltr'>ketosireducens</span> <span class='ocrx_word' id='word_1_58' title='bbox 533 346 605 366; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_59' title='bbox 617 344 700 366; x_wconf 82' lang='eng' dir='ltr'>14548T</span> <span class='ocrx_word' id='word_1_60' title='bbox 709 346 849 371; x_wconf 91' lang='eng' dir='ltr'>(ABOO4724)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 234 378 822 405; baseline 0 -5"><span class='ocrx_word' id='word_1_61' title='bbox 234 386 256 403; x_wconf 82' lang='eng'>51</span> <span class='ocrx_word' id='word_1_62' title='bbox 333 381 359 400; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_63' title='bbox 370 380 496 400; x_wconf 84' lang='eng' dir='ltr'>ﬂavescens</span> <span class='ocrx_word' id='word_1_64' title='bbox 506 380 578 400; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_65' title='bbox 590 378 672 400; x_wconf 82' lang='eng' dir='ltr'>15039T</span> <span class='ocrx_word' id='word_1_66' title='bbox 682 381 822 405; x_wconf 89' lang='eng' dir='ltr'>(ABOO4716)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 327 413 872 440; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 327 415 353 434; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_68' title='bbox 364 415 545 435; x_wconf 83' lang='eng' dir='ltr'>Iaevaniformans</span> <span class='ocrx_word' id='word_1_69' title='bbox 555 415 628 435; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_70' title='bbox 639 413 722 434; x_wconf 91' lang='eng' dir='ltr'>14471T</span> <span class='ocrx_word' id='word_1_71' title='bbox 731 415 872 440; x_wconf 88' lang='eng' dir='ltr'>(AB007416)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 325 447 844 475; baseline -0.002 -5"><span class='ocrx_word' id='word_1_72' title='bbox 325 450 351 469; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_73' title='bbox 363 450 549 475; x_wconf 79' lang='eng' dir='ltr'>dextranolyticum</span> <span class='ocrx_word' id='word_1_74' title='bbox 559 449 614 470; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_75' title='bbox 625 447 695 470; x_wconf 81' lang='eng' dir='ltr'>8607T</span> <span class='ocrx_word' id='word_1_76' title='bbox 704 450 844 475; x_wconf 92' lang='eng' dir='ltr'>(ABOO7417)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 358 482 843 509; baseline 0 -5"><span class='ocrx_word' id='word_1_77' title='bbox 358 484 384 504; x_wconf 67' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_78' title='bbox 396 484 532 504; x_wconf 76' lang='eng' dir='ltr'>chocolatum</span> <span class='ocrx_word' id='word_1_79' title='bbox 542 484 614 504; x_wconf 92' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_80' title='bbox 624 482 694 504; x_wconf 80' lang='eng' dir='ltr'>3758T</span> <span class='ocrx_word' id='word_1_81' title='bbox 703 484 843 509; x_wconf 89' lang='eng' dir='ltr'>(ABOO4725)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 234 516 831 550; baseline 0 -12"><span class='ocrx_word' id='word_1_82' title='bbox 234 533 259 550; x_wconf 72' lang='eng'>96</span> <span class='ocrx_word' id='word_1_83' title='bbox 331 519 357 538; x_wconf 65' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_84' title='bbox 369 519 515 538; x_wconf 77' lang='eng' dir='ltr'><em>aurantiacum</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 524 518 566 538; x_wconf 88' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_86' title='bbox 578 516 689 543; x_wconf 79' lang='eng' dir='ltr'>105730T(</span> <span class='ocrx_word' id='word_1_87' title='bbox 699 519 831 543; x_wconf 86' lang='eng' dir='ltr'>EU863415)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 284 550 801 578; baseline 0.002 -6"><span class='ocrx_word' id='word_1_88' title='bbox 284 558 320 576; x_wconf 87' lang='eng'>100</span> <span class='ocrx_word' id='word_1_89' title='bbox 355 570 357 572; x_wconf 99' lang='eng'>.</span> <span class='ocrx_word' id='word_1_90' title='bbox 369 553 495 573; x_wconf 82' lang='eng' dir='ltr'>kitamiense</span> <span class='ocrx_word' id='word_1_91' title='bbox 505 553 557 573; x_wconf 91' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_92' title='bbox 570 550 652 573; x_wconf 92' lang='eng' dir='ltr'>10270T</span> <span class='ocrx_word' id='word_1_93' title='bbox 662 553 801 578; x_wconf 81' lang='eng' dir='ltr'>(AB013907)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 207 583 754 613; baseline 0 -5"><span class='ocrx_word' id='word_1_94' title='bbox 207 583 232 601; x_wconf 73' lang='eng'>55</span> <span class='ocrx_word' id='word_1_95' title='bbox 339 588 365 608; x_wconf 91' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_96' title='bbox 377 588 492 608; x_wconf 78' lang='eng' dir='ltr'>hatanonis</span> <span class='ocrx_word' id='word_1_97' title='bbox 502 585 604 608; x_wconf 89' lang='eng' dir='ltr'>FCC-01T</span> <span class='ocrx_word' id='word_1_98' title='bbox 614 588 754 613; x_wconf 83' lang='eng' dir='ltr'>(AB274908)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 463 620 899 648; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 463 623 489 642; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_100' title='bbox 501 628 575 643; x_wconf 84' lang='eng' dir='ltr'><em>aurum</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 585 623 658 643; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_102' title='bbox 670 620 899 648; x_wconf 63' lang='eng' dir='ltr'>15204T(ABOO7418)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 325 654 794 682; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 325 657 351 676; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_104' title='bbox 362 657 469 677; x_wconf 81' lang='eng' dir='ltr'>sch/eiferi</span> <span class='ocrx_word' id='word_1_105' title='bbox 477 657 550 677; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_106' title='bbox 562 654 644 677; x_wconf 89' lang='eng' dir='ltr'>15075T</span> <span class='ocrx_word' id='word_1_107' title='bbox 654 657 794 682; x_wconf 89' lang='eng' dir='ltr'>(ABOO4723)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 325 689 722 716; baseline 0 -5"><span class='ocrx_word' id='word_1_108' title='bbox 325 692 351 711; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_109' title='bbox 362 692 471 711; x_wconf 85' lang='eng' dir='ltr'>koreense</span> <span class='ocrx_word' id='word_1_110' title='bbox 480 689 575 711; x_wconf 65' lang='eng' dir='ltr'>J853»2T</span> <span class='ocrx_word' id='word_1_111' title='bbox 582 692 722 716; x_wconf 83' lang='eng' dir='ltr'>(AY962574)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 309 724 770 751; baseline 0 -5"><span class='ocrx_word' id='word_1_112' title='bbox 309 726 334 746; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_113' title='bbox 346 726 443 746; x_wconf 78' lang='eng' dir='ltr'>lacticum</span> <span class='ocrx_word' id='word_1_114' title='bbox 453 726 526 746; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_115' title='bbox 538 724 620 746; x_wconf 87' lang='eng' dir='ltr'>14135T</span> <span class='ocrx_word' id='word_1_116' title='bbox 630 726 770 751; x_wconf 91' lang='eng' dir='ltr'>(ABOO7415)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 289 758 696 785; baseline 0 -5"><span class='ocrx_word' id='word_1_117' title='bbox 289 760 314 780; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_118' title='bbox 326 760 404 780; x_wconf 87' lang='eng' dir='ltr'><em>ﬂavum</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 412 758 546 780; x_wconf 73' lang='eng' dir='ltr'>YM18-098T</span> <span class='ocrx_word' id='word_1_120' title='bbox 556 760 696 785; x_wconf 82' lang='eng' dir='ltr'>(AB286029)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 315 793 704 820; baseline 0 -5"><span class='ocrx_word' id='word_1_121' title='bbox 315 796 341 815; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_122' title='bbox 353 796 446 815; x_wconf 82' lang='eng' dir='ltr'>terrico/a</span> <span class='ocrx_word' id='word_1_123' title='bbox 457 793 555 815; x_wconf 64' lang='eng' dir='ltr'>KV»448T</span> <span class='ocrx_word' id='word_1_124' title='bbox 565 796 704 820; x_wconf 82' lang='eng' dir='ltr'>(ABZ34025)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 273 826 779 855; baseline 0 -5"><span class='ocrx_word' id='word_1_125' title='bbox 273 826 310 844; x_wconf 69' lang='eng'>100</span> <span class='ocrx_word' id='word_1_126' title='bbox 352 830 378 850; x_wconf 72' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_127' title='bbox 390 830 521 850; x_wconf 88' lang='eng' dir='ltr'>deminutum</span> <span class='ocrx_word' id='word_1_128' title='bbox 531 828 629 850; x_wconf 80' lang='eng' dir='ltr'>KV-483T</span> <span class='ocrx_word' id='word_1_129' title='bbox 639 830 779 855; x_wconf 79' lang='eng' dir='ltr'>(A8234026)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 356 862 728 889; baseline 0 -5"><span class='ocrx_word' id='word_1_130' title='bbox 356 881 359 884; x_wconf 68' lang='eng'>.</span> <span class='ocrx_word' id='word_1_131' title='bbox 369 864 470 889; x_wconf 87' lang='eng' dir='ltr'><em>pumilum</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 480 862 579 884; x_wconf 82' lang='eng' dir='ltr'>KV-488T</span> <span class='ocrx_word' id='word_1_133' title='bbox 588 864 728 889; x_wconf 89' lang='eng' dir='ltr'>(AB234027)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 328 897 804 924; baseline 0 -5"><span class='ocrx_word' id='word_1_134' title='bbox 328 899 354 919; x_wconf 92' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_135' title='bbox 366 900 478 924; x_wconf 81' lang='eng' dir='ltr'>terregens</span> <span class='ocrx_word' id='word_1_136' title='bbox 487 899 560 919; x_wconf 85' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_137' title='bbox 572 897 655 919; x_wconf 81' lang='eng' dir='ltr'>12961T</span> <span class='ocrx_word' id='word_1_138' title='bbox 664 899 804 924; x_wconf 90' lang='eng' dir='ltr'>(ABOO4721)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 341 931 697 958; baseline 0 -5"><span class='ocrx_word' id='word_1_139' title='bbox 341 934 367 953; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_140' title='bbox 379 934 440 953; x_wconf 85' lang='eng' dir='ltr'><strong><em>Iacus</em></strong></span> <span class='ocrx_word' id='word_1_141' title='bbox 448 931 549 953; x_wconf 66' lang='eng' dir='ltr'>A5552T</span> <span class='ocrx_word' id='word_1_142' title='bbox 558 934 697 958; x_wconf 82' lang='eng' dir='ltr'>(AB286030)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 271 965 772 992; baseline -0.004 -3"><span class='ocrx_word' id='word_1_143' title='bbox 271 971 296 989; x_wconf 85' lang='eng'>68</span> <span class='ocrx_word' id='word_1_144' title='bbox 339 968 365 987; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_145' title='bbox 377 973 514 992; x_wconf 82' lang='eng' dir='ltr'>aoyamense</span> <span class='ocrx_word' id='word_1_146' title='bbox 524 965 622 987; x_wconf 82' lang='eng' dir='ltr'>KV-492T</span> <span class='ocrx_word' id='word_1_147' title='bbox 632 968 772 992; x_wconf 81' lang='eng' dir='ltr'>(A8234028)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 415 1000 810 1027; baseline 0 -5"><span class='ocrx_word' id='word_1_148' title='bbox 415 1002 440 1022; x_wconf 69' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_149' title='bbox 452 1002 534 1022; x_wconf 82' lang='eng' dir='ltr'>barkeri</span> <span class='ocrx_word' id='word_1_150' title='bbox 543 1002 598 1022; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_151' title='bbox 609 1000 693 1022; x_wconf 86' lang='eng' dir='ltr'>20145T</span> <span class='ocrx_word' id='word_1_152' title='bbox 702 1002 810 1027; x_wconf 85' lang='eng' dir='ltr'>(X77446)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 614 1037 973 1064">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 614 1037 973 1064">
+     <span class='ocr_line' id='line_1_33' title="bbox 614 1037 973 1064; baseline 0 -5"><span class='ocrx_word' id='word_1_153' title='bbox 614 1039 640 1059; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_154' title='bbox 651 1039 813 1064; x_wconf 84' lang='eng' dir='ltr'>gubbeenense</span> <span class='ocrx_word' id='word_1_155' title='bbox 822 1039 864 1059; x_wconf 94' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_156' title='bbox 876 1037 973 1059; x_wconf 85' lang='eng' dir='ltr'>107184T</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 271 1071 994 1167">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 271 1071 994 1167">
+     <span class='ocr_line' id='line_1_34' title="bbox 285 1071 994 1098; baseline -0.003 -5"><span class='ocrx_word' id='word_1_157' title='bbox 285 1075 310 1093; x_wconf 84' lang='eng'>89</span> <span class='ocrx_word' id='word_1_158' title='bbox 419 1073 445 1093; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_159' title='bbox 456 1073 547 1093; x_wconf 84' lang='eng' dir='ltr'><em>indicum</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 557 1071 636 1093; x_wconf 90' lang='eng' dir='ltr'>BBH6T</span> <span class='ocrx_word' id='word_1_161' title='bbox 646 1073 790 1098; x_wconf 85' lang='eng' dir='ltr'>(AM158907)</span> <span class='ocrx_word' id='word_1_162' title='bbox 853 1071 994 1096; x_wconf 84' lang='eng' dir='ltr'>(EU863414)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 393 1105 781 1132; baseline 0 -5"><span class='ocrx_word' id='word_1_163' title='bbox 393 1108 419 1127; x_wconf 91' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_164' title='bbox 429 1108 550 1132; x_wconf 85' lang='eng' dir='ltr'><em>paludicola</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 561 1105 636 1127; x_wconf 79' lang='eng' dir='ltr'>US15T</span> <span class='ocrx_word' id='word_1_166' title='bbox 646 1108 781 1132; x_wconf 85' lang='eng' dir='ltr'>(AJ853909)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 271 1140 838 1167; baseline 0 -5"><span class='ocrx_word' id='word_1_167' title='bbox 271 1146 296 1164; x_wconf 85' lang='eng'>97</span> <span class='ocrx_word' id='word_1_168' title='bbox 374 1142 400 1161; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_169' title='bbox 412 1142 547 1162; x_wconf 76' lang='eng' dir='ltr'><em>marinilaous</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 555 1140 689 1162; x_wconf 86' lang='eng' dir='ltr'>YM11-607T</span> <span class='ocrx_word' id='word_1_171' title='bbox 698 1142 838 1167; x_wconf 78' lang='eng' dir='ltr'>(A3286020)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 186 1174 931 1926">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 186 1174 931 1926">
+     <span class='ocr_line' id='line_1_37' title="bbox 352 1174 745 1202; baseline 0 -6"><span class='ocrx_word' id='word_1_172' title='bbox 352 1177 378 1196; x_wconf 97' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_173' title='bbox 390 1177 438 1197; x_wconf 91' lang='eng' dir='ltr'><em>ulmi</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 447 1176 502 1197; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_175' title='bbox 512 1174 596 1197; x_wconf 79' lang='eng' dir='ltr'>20991T</span> <span class='ocrx_word' id='word_1_176' title='bbox 606 1177 745 1202; x_wconf 86' lang='eng' dir='ltr'>(AY062021)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 347 1209 830 1236; baseline 0 -5"><span class='ocrx_word' id='word_1_177' title='bbox 347 1212 372 1231; x_wconf 93' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_178' title='bbox 391 1212 538 1231; x_wconf 83' lang='eng' dir='ltr'>sediminicola</span> <span class='ocrx_word' id='word_1_179' title='bbox 547 1209 681 1231; x_wconf 87' lang='eng' dir='ltr'>YM1O-847T</span> <span class='ocrx_word' id='word_1_180' title='bbox 690 1212 830 1236; x_wconf 80' lang='eng' dir='ltr'>(A8286021)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 417 1243 875 1270; baseline 0 -5"><span class='ocrx_word' id='word_1_181' title='bbox 417 1246 442 1265; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_182' title='bbox 454 1246 595 1270; x_wconf 84' lang='eng' dir='ltr'>ginsengisoli</span> <span class='ocrx_word' id='word_1_183' title='bbox 603 1245 661 1265; x_wconf 86' lang='eng' dir='ltr'>Gsoil</span> <span class='ocrx_word' id='word_1_184' title='bbox 671 1243 725 1265; x_wconf 82' lang='eng' dir='ltr'>259T</span> <span class='ocrx_word' id='word_1_185' title='bbox 735 1246 875 1270; x_wconf 80' lang='eng' dir='ltr'>(ABZ71048)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 362 1278 833 1305; baseline 0 -5"><span class='ocrx_word' id='word_1_186' title='bbox 362 1280 387 1300; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_187' title='bbox 399 1280 507 1305; x_wconf 80' lang='eng' dir='ltr'>imperiale</span> <span class='ocrx_word' id='word_1_188' title='bbox 517 1280 589 1300; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_189' title='bbox 601 1278 684 1300; x_wconf 90' lang='eng' dir='ltr'>12610T</span> <span class='ocrx_word' id='word_1_190' title='bbox 693 1280 833 1305; x_wconf 90' lang='eng' dir='ltr'>(ABOO7414)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 279 1312 834 1340; baseline -0.002 -5"><span class='ocrx_word' id='word_1_191' title='bbox 279 1315 303 1333; x_wconf 88' lang='eng'>87</span> <span class='ocrx_word' id='word_1_192' title='bbox 339 1315 365 1334; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_193' title='bbox 376 1315 523 1335; x_wconf 85' lang='eng' dir='ltr'>arborescens</span> <span class='ocrx_word' id='word_1_194' title='bbox 533 1314 605 1335; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_195' title='bbox 615 1312 685 1335; x_wconf 80' lang='eng' dir='ltr'>3750T</span> <span class='ocrx_word' id='word_1_196' title='bbox 694 1315 834 1340; x_wconf 88' lang='eng' dir='ltr'>(ABOO7421)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 242 1347 793 1374; baseline 0 -5"><span class='ocrx_word' id='word_1_197' title='bbox 242 1349 268 1369; x_wconf 97' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_198' title='bbox 279 1349 466 1374; x_wconf 81' lang='eng' dir='ltr'>keratano/yticum</span> <span class='ocrx_word' id='word_1_199' title='bbox 476 1349 549 1369; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_200' title='bbox 561 1347 643 1369; x_wconf 78' lang='eng' dir='ltr'>13309T</span> <span class='ocrx_word' id='word_1_201' title='bbox 653 1349 793 1374; x_wconf 92' lang='eng' dir='ltr'>(ABOO4717)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 230 1381 656 1409; baseline 0 -6"><span class='ocrx_word' id='word_1_202' title='bbox 230 1384 255 1403; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_203' title='bbox 267 1384 374 1404; x_wconf 81' lang='eng' dir='ltr'>resistens</span> <span class='ocrx_word' id='word_1_204' title='bbox 383 1384 461 1403; x_wconf 92' lang='eng' dir='ltr'><em>DMMZ</em></span> <span class='ocrx_word' id='word_1_205' title='bbox 472 1381 539 1404; x_wconf 83' lang='eng' dir='ltr'>1710T</span> <span class='ocrx_word' id='word_1_206' title='bbox 549 1384 574 1409; x_wconf 91' lang='eng' dir='ltr'>(Y</span> <span class='ocrx_word' id='word_1_207' title='bbox 577 1384 656 1409; x_wconf 85' lang='eng'>14699)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 251 1416 687 1443; baseline 0 -5"><span class='ocrx_word' id='word_1_208' title='bbox 251 1418 277 1438; x_wconf 68' lang='eng' dir='ltr'><em>M,</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 289 1419 410 1438; x_wconf 82' lang='eng' dir='ltr'>testaceum</span> <span class='ocrx_word' id='word_1_210' title='bbox 420 1418 476 1438; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_211' title='bbox 487 1416 571 1438; x_wconf 81' lang='eng' dir='ltr'>20166T</span> <span class='ocrx_word' id='word_1_212' title='bbox 581 1418 687 1443; x_wconf 89' lang='eng' dir='ltr'>(X77445)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 252 1450 715 1477; baseline 0 -5"><span class='ocrx_word' id='word_1_213' title='bbox 252 1453 278 1472; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_214' title='bbox 289 1453 411 1472; x_wconf 82' lang='eng' dir='ltr'><em>oleivorans</em></span> <span class='ocrx_word' id='word_1_215' title='bbox 420 1452 475 1472; x_wconf 92' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_216' title='bbox 488 1450 571 1472; x_wconf 73' lang='eng' dir='ltr'>16091T</span> <span class='ocrx_word' id='word_1_217' title='bbox 580 1453 715 1477; x_wconf 87' lang='eng' dir='ltr'>(AJ698725)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 255 1485 716 1513; baseline 0.002 -6"><span class='ocrx_word' id='word_1_218' title='bbox 255 1487 281 1507; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_219' title='bbox 293 1487 410 1508; x_wconf 75' lang='eng' dir='ltr'>aero/atum</span> <span class='ocrx_word' id='word_1_220' title='bbox 420 1487 476 1508; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_221' title='bbox 488 1485 571 1507; x_wconf 90' lang='eng' dir='ltr'>14217T</span> <span class='ocrx_word' id='word_1_222' title='bbox 581 1487 716 1513; x_wconf 84' lang='eng' dir='ltr'>(AJ309929)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 244 1520 777 1547; baseline 0 -5"><span class='ocrx_word' id='word_1_223' title='bbox 244 1522 270 1542; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_224' title='bbox 281 1522 405 1542; x_wconf 82' lang='eng' dir='ltr'>naton&#39;ense</span> <span class='ocrx_word' id='word_1_225' title='bbox 414 1522 485 1542; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_226' title='bbox 496 1520 627 1542; x_wconf 85' lang='eng' dir='ltr'>BAA-1032T</span> <span class='ocrx_word' id='word_1_227' title='bbox 637 1522 777 1547; x_wconf 85' lang='eng' dir='ltr'>(AY566291)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 247 1556 690 1581; baseline 0 -5"><span class='ocrx_word' id='word_1_228' title='bbox 247 1556 273 1576; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_229' title='bbox 285 1556 379 1576; x_wconf 87' lang='eng' dir='ltr'><em>foliorum</em></span> <span class='ocrx_word' id='word_1_230' title='bbox 389 1556 444 1576; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_231' title='bbox 457 1556 545 1576; x_wconf 75' lang='eng' dir='ltr'>1296GT</span> <span class='ocrx_word' id='word_1_232' title='bbox 555 1556 690 1581; x_wconf 84' lang='eng' dir='ltr'>(AJ249780)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 228 1589 752 1616; baseline 0.002 -6"><span class='ocrx_word' id='word_1_233' title='bbox 228 1591 254 1610; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_234' title='bbox 264 1591 446 1616; x_wconf 85' lang='eng' dir='ltr'>phy/Iosphaerae</span> <span class='ocrx_word' id='word_1_235' title='bbox 456 1591 512 1611; x_wconf 84' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_236' title='bbox 524 1589 607 1611; x_wconf 82' lang='eng' dir='ltr'>13468T</span> <span class='ocrx_word' id='word_1_237' title='bbox 616 1591 752 1616; x_wconf 89' lang='eng' dir='ltr'>(AJ277840)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 260 1623 851 1650; baseline 0 -5"><span class='ocrx_word' id='word_1_238' title='bbox 260 1625 286 1645; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_239' title='bbox 297 1625 546 1650; x_wconf 77' lang='eng' dir='ltr'>hydrocarbonoxydans</span> <span class='ocrx_word' id='word_1_240' title='bbox 556 1625 611 1645; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_241' title='bbox 624 1623 706 1645; x_wconf 74' lang='eng' dir='ltr'>16089T</span> <span class='ocrx_word' id='word_1_242' title='bbox 715 1625 851 1650; x_wconf 79' lang='eng' dir='ltr'>(AJ698726)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 201 1654 798 1684; baseline 0 -5"><span class='ocrx_word' id='word_1_243' title='bbox 201 1654 226 1672; x_wconf 79' lang='eng'>95</span> <span class='ocrx_word' id='word_1_244' title='bbox 285 1659 311 1679; x_wconf 97' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_245' title='bbox 323 1659 521 1679; x_wconf 77' lang='eng' dir='ltr'>esteraromaticum</span> <span class='ocrx_word' id='word_1_246' title='bbox 531 1659 586 1679; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_247' title='bbox 597 1657 682 1679; x_wconf 74' lang='eng' dir='ltr'>86099T</span> <span class='ocrx_word' id='word_1_248' title='bbox 691 1659 798 1684; x_wconf 85' lang='eng' dir='ltr'>(Y17231)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 279 1691 931 1718; baseline 0 -5"><span class='ocrx_word' id='word_1_249' title='bbox 279 1694 305 1713; x_wconf 94' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_250' title='bbox 317 1694 605 1718; x_wconf 76' lang='eng' dir='ltr'>arabinogalactanolyticum</span> <span class='ocrx_word' id='word_1_251' title='bbox 615 1693 687 1713; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_252' title='bbox 699 1691 782 1713; x_wconf 78' lang='eng' dir='ltr'>14344T</span> <span class='ocrx_word' id='word_1_253' title='bbox 792 1694 931 1718; x_wconf 90' lang='eng' dir='ltr'>(ABOO4715)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 233 1725 725 1752; baseline 0 -5"><span class='ocrx_word' id='word_1_254' title='bbox 233 1728 259 1747; x_wconf 72' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_255' title='bbox 269 1728 423 1752; x_wconf 86' lang='eng' dir='ltr'>paraoxydans</span> <span class='ocrx_word' id='word_1_256' title='bbox 433 1727 488 1747; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_257' title='bbox 501 1725 583 1747; x_wconf 90' lang='eng' dir='ltr'>15019T</span> <span class='ocrx_word' id='word_1_258' title='bbox 590 1728 725 1752; x_wconf 88' lang='eng' dir='ltr'>(AJ491806)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 210 1756 728 1787; baseline 0 -5"><span class='ocrx_word' id='word_1_259' title='bbox 210 1756 234 1774; x_wconf 77' lang='eng'>82</span> <span class='ocrx_word' id='word_1_260' title='bbox 254 1762 279 1782; x_wconf 91' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_261' title='bbox 291 1762 401 1787; x_wconf 86' lang='eng' dir='ltr'>saperdae</span> <span class='ocrx_word' id='word_1_262' title='bbox 411 1762 484 1782; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_263' title='bbox 496 1760 579 1782; x_wconf 77' lang='eng' dir='ltr'>15038T</span> <span class='ocrx_word' id='word_1_264' title='bbox 588 1762 728 1787; x_wconf 87' lang='eng' dir='ltr'>(ABOO4719)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 276 1794 730 1822; baseline 0 -5"><span class='ocrx_word' id='word_1_265' title='bbox 276 1797 302 1817; x_wconf 91' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_266' title='bbox 313 1796 454 1822; x_wconf 82' lang='eng' dir='ltr'>quuefaciens</span> <span class='ocrx_word' id='word_1_267' title='bbox 463 1796 519 1817; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_268' title='bbox 529 1794 614 1817; x_wconf 79' lang='eng' dir='ltr'>20638T</span> <span class='ocrx_word' id='word_1_269' title='bbox 624 1797 730 1822; x_wconf 93' lang='eng' dir='ltr'>(X77444)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 223 1829 745 1862; baseline 0 -11"><span class='ocrx_word' id='word_1_270' title='bbox 223 1842 246 1862; x_wconf 73' lang='eng'>8</span> <span class='ocrx_word' id='word_1_271' title='bbox 266 1848 268 1851; x_wconf 99' lang='eng'>.</span> <span class='ocrx_word' id='word_1_272' title='bbox 280 1832 423 1856; x_wconf 79' lang='eng' dir='ltr'>maritypicum</span> <span class='ocrx_word' id='word_1_273' title='bbox 433 1831 506 1851; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_274' title='bbox 518 1829 600 1851; x_wconf 80' lang='eng' dir='ltr'>15779T</span> <span class='ocrx_word' id='word_1_275' title='bbox 610 1832 745 1856; x_wconf 81' lang='eng' dir='ltr'>(AJ853910)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 186 1864 655 1891; baseline 0 -5"><span class='ocrx_word' id='word_1_276' title='bbox 186 1869 208 1887; x_wconf 88' lang='eng'>61</span> <span class='ocrx_word' id='word_1_277' title='bbox 242 1866 268 1886; x_wconf 95' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_278' title='bbox 280 1866 379 1891; x_wconf 80' lang='eng' dir='ltr'>oxydans</span> <span class='ocrx_word' id='word_1_279' title='bbox 388 1866 444 1886; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_280' title='bbox 454 1864 539 1886; x_wconf 89' lang='eng' dir='ltr'>20578T</span> <span class='ocrx_word' id='word_1_281' title='bbox 549 1866 655 1891; x_wconf 92' lang='eng' dir='ltr'>(Y17227)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 259 1899 722 1926; baseline 0 -6"><span class='ocrx_word' id='word_1_282' title='bbox 259 1901 284 1920; x_wconf 96' lang='eng' dir='ltr'>M.</span> <span class='ocrx_word' id='word_1_283' title='bbox 295 1901 396 1921; x_wconf 77' lang='eng' dir='ltr'>Iuteolum</span> <span class='ocrx_word' id='word_1_284' title='bbox 406 1901 479 1921; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_285' title='bbox 490 1899 573 1921; x_wconf 91' lang='eng' dir='ltr'>15074T</span> <span class='ocrx_word' id='word_1_286' title='bbox 583 1901 722 1926; x_wconf 85' lang='eng' dir='ltr'>(ABOO4718)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003210-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003210-0-000.pbm.png
new file mode 100644
index 00000000..b5746bea
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003210-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003210-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003210-0-000.pbm.png.hocr
new file mode 100644
index 00000000..40c6a799
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003210-0-000.pbm.png.hocr
@@ -0,0 +1,256 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003210-0-000.pbm.png"; bbox 0 0 947 1263; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 5 86 7 456">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 5 86 7 456">
+     <span class='ocr_line' id='line_1_1' title="bbox 5 86 7 456; baseline 0 807"><span class='ocrx_word' id='word_1_1' title='bbox 5 86 7 456; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 5 455 29 456">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 5 455 29 456">
+     <span class='ocr_line' id='line_1_2' title="bbox 5 455 29 456; baseline 0 807"><span class='ocrx_word' id='word_1_2' title='bbox 5 455 29 456; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 27 124 30 788">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 27 124 30 788">
+     <span class='ocr_line' id='line_1_3' title="bbox 27 124 30 788; baseline 0 475"><span class='ocrx_word' id='word_1_3' title='bbox 27 124 30 788; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 140 3 171 23">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 140 3 171 23">
+     <span class='ocr_line' id='line_1_4' title="bbox 140 3 171 23; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 140 3 171 23; x_wconf 91' lang='eng'><em>0.1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 160 76 894 178">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 160 76 894 178">
+     <span class='ocr_line' id='line_1_5' title="bbox 345 76 894 103; baseline 0 -5"><span class='ocrx_word' id='word_1_5' title='bbox 345 79 467 103; x_wconf 82' lang='eng' dir='ltr'><em>Bergeyella</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 477 79 603 98; x_wconf 84' lang='eng' dir='ltr'><em>zoohelcum</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 611 78 682 98; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 690 76 774 98; x_wconf 84' lang='eng' dir='ltr'><em>43767T</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 784 78 894 103; x_wconf 83' lang='eng' dir='ltr'><em>(M93153)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 219 112 816 139; baseline 0 -5"><span class='ocrx_word' id='word_1_10' title='bbox 219 114 416 139; x_wconf 85' lang='eng' dir='ltr'><em>Capnocytophaga</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 425 115 533 139; x_wconf 85' lang='eng' dir='ltr'><em>gingivalis</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 540 114 611 134; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 621 112 703 134; x_wconf 82' lang='eng' dir='ltr'><em>33624T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 713 114 816 139; x_wconf 86' lang='eng' dir='ltr'><em>(L14639)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 160 151 433 178; baseline 0 -5"><span class='ocrx_word' id='word_1_15' title='bbox 160 162 201 164; x_wconf 89' lang='eng'>—</span> <span class='ocrx_word' id='word_1_16' title='bbox 207 151 285 173; x_wconf 90' lang='eng' dir='ltr'><em>EM41T</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 294 154 433 178; x_wconf 86' lang='eng' dir='ltr'><em>(EU443205)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 159 162 160 230">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 159 162 160 230">
+     <span class='ocr_line' id='line_1_8' title="bbox 159 162 160 230; baseline 0 1033"><span class='ocrx_word' id='word_1_18' title='bbox 159 162 160 230; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 101 265 125 266">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 101 265 125 266">
+     <span class='ocr_line' id='line_1_9' title="bbox 101 265 125 266; baseline 0 997"><span class='ocrx_word' id='word_1_19' title='bbox 101 265 125 266; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 124 196 125 337">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 124 196 125 337">
+     <span class='ocr_line' id='line_1_10' title="bbox 124 196 125 337; baseline 0 926"><span class='ocrx_word' id='word_1_20' title='bbox 124 196 125 337; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 120 413 144 414">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 120 413 144 414">
+     <span class='ocr_line' id='line_1_11' title="bbox 120 413 144 414; baseline 0 849"><span class='ocrx_word' id='word_1_21' title='bbox 120 413 144 414; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 143 393 144 434">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 143 393 144 434">
+     <span class='ocr_line' id='line_1_12' title="bbox 143 393 144 434; baseline 0 829"><span class='ocrx_word' id='word_1_22' title='bbox 143 393 144 434; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 72 450 102 451">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 72 450 102 451">
+     <span class='ocr_line' id='line_1_13' title="bbox 72 450 102 451; baseline 0 812"><span class='ocrx_word' id='word_1_23' title='bbox 72 450 102 451; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 27 786 74 788">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 27 786 74 788">
+     <span class='ocr_line' id='line_1_14' title="bbox 27 786 74 788; baseline 0 475"><span class='ocrx_word' id='word_1_24' title='bbox 27 786 74 788; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 72 449 74 1124">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 72 449 74 1124">
+     <span class='ocr_line' id='line_1_15' title="bbox 72 449 74 1124; baseline 0 139"><span class='ocrx_word' id='word_1_25' title='bbox 72 449 74 1124; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 128 508 324 509">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 128 508 324 509">
+     <span class='ocr_line' id='line_1_16' title="bbox 128 508 324 509; baseline 0 754"><span class='ocrx_word' id='word_1_26' title='bbox 128 508 324 509; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 173 510 174 583">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 173 510 174 583">
+     <span class='ocr_line' id='line_1_17' title="bbox 173 510 174 583; baseline 0 680"><span class='ocrx_word' id='word_1_27' title='bbox 173 510 174 583; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 279 586 340 588">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 279 586 340 588">
+     <span class='ocr_line' id='line_1_18' title="bbox 279 586 340 588; baseline 0 675"><span class='ocrx_word' id='word_1_28' title='bbox 279 586 340 588; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 100 265 102 634">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 100 265 102 634">
+     <span class='ocr_line' id='line_1_19' title="bbox 100 265 102 634; baseline 0 629"><span class='ocrx_word' id='word_1_29' title='bbox 100 265 102 634; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 198 548 200 617">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 198 548 200 617">
+     <span class='ocr_line' id='line_1_20' title="bbox 198 548 200 617; baseline 0 646"><span class='ocrx_word' id='word_1_30' title='bbox 198 548 200 617; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 198 616 279 617">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 198 616 279 617">
+     <span class='ocr_line' id='line_1_21' title="bbox 198 616 279 617; baseline 0 646"><span class='ocrx_word' id='word_1_31' title='bbox 198 616 279 617; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 101 632 122 634">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 101 632 122 634">
+     <span class='ocr_line' id='line_1_22' title="bbox 101 632 122 634; baseline 0 629"><span class='ocrx_word' id='word_1_32' title='bbox 101 632 122 634; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 278 586 279 646">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 278 586 279 646">
+     <span class='ocr_line' id='line_1_23' title="bbox 278 586 279 646; baseline 0 617"><span class='ocrx_word' id='word_1_33' title='bbox 278 586 279 646; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 289 625 291 665">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 289 625 291 665">
+     <span class='ocr_line' id='line_1_24' title="bbox 289 625 291 665; baseline 0 598"><span class='ocrx_word' id='word_1_34' title='bbox 289 625 291 665; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 120 413 122 854">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 120 413 122 854">
+     <span class='ocr_line' id='line_1_25' title="bbox 120 413 122 854; baseline 0 409"><span class='ocrx_word' id='word_1_35' title='bbox 120 413 122 854; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 128 508 131 845">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 128 508 131 845">
+     <span class='ocr_line' id='line_1_26' title="bbox 128 508 131 845; baseline 0 418"><span class='ocrx_word' id='word_1_36' title='bbox 128 508 131 845; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 160 764 162 925">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 160 764 162 925">
+     <span class='ocr_line' id='line_1_27' title="bbox 160 764 162 925; baseline 0 338"><span class='ocrx_word' id='word_1_37' title='bbox 160 764 162 925; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 125 508 130 1030">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 125 508 130 1030">
+     <span class='ocr_line' id='line_1_28' title="bbox 125 508 130 1030; baseline 0 233"><span class='ocrx_word' id='word_1_38' title='bbox 125 508 130 1030; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 94 1125 96 1195">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 94 1125 96 1195">
+     <span class='ocr_line' id='line_1_29' title="bbox 94 1125 96 1195; baseline 0 68"><span class='ocrx_word' id='word_1_39' title='bbox 94 1125 96 1195; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 119 1165 120 1224">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 119 1165 120 1224">
+     <span class='ocr_line' id='line_1_30' title="bbox 119 1165 120 1224; baseline 0 39"><span class='ocrx_word' id='word_1_40' title='bbox 119 1165 120 1224; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 45 173 945 1246">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 45 173 945 1246">
+     <span class='ocr_line' id='line_1_31' title="bbox 120 173 436 196; baseline 0.003 -6"><span class='ocrx_word' id='word_1_41' title='bbox 120 173 156 191; x_wconf 91' lang='eng'>100</span> <span class='ocrx_word' id='word_1_42' title='bbox 420 193 422 196; x_wconf 29' lang='eng' dir='ltr'><strong>I</strong></span> <span class='ocrx_word' id='word_1_43' title='bbox 433 193 436 196; x_wconf 10' lang='eng' dir='ltr'><em>g</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 125 190 756 218; baseline 0 -5"><span class='ocrx_word' id='word_1_44' title='bbox 125 190 167 204; x_wconf 41' lang='eng' dir='ltr'><em>a</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 213 193 365 218; x_wconf 83' lang='eng' dir='ltr'><em>Cellulophaga</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 373 193 461 218; x_wconf 74' lang='eng' dir='ltr'><em>paelﬂca</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 471 193 530 212; x_wconf 94' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 540 191 608 213; x_wconf 82' lang='eng' dir='ltr'><em>3664T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 617 193 756 218; x_wconf 85' lang='eng' dir='ltr'><em>(AB100840)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 94 200 730 278; baseline 0 -28"><span class='ocrx_word' id='word_1_50' title='bbox 94 243 118 260; x_wconf 80' lang='eng'><em>74</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 143 200 241 278; x_wconf 43' lang='eng'><em>106%</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 247 230 398 255; x_wconf 86' lang='eng' dir='ltr'><em>Cellulophaga</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 407 231 495 255; x_wconf 83' lang='eng' dir='ltr'><em>a/gico/a</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 506 228 584 250; x_wconf 80' lang='eng' dir='ltr'><em>IC166T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 593 230 730 255; x_wconf 86' lang='eng' dir='ltr'><em>(AF001366)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 167 265 757 293; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 167 265 191 283; x_wconf 82' lang='eng'><em>93</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 234 268 385 293; x_wconf 83' lang='eng' dir='ltr'><em>Cel/u/ophaga</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 394 268 469 288; x_wconf 82' lang='eng' dir='ltr'><em>baltica</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 479 266 614 288; x_wconf 89' lang='eng' dir='ltr'><em>NN01584OT</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 623 268 757 293; x_wconf 86' lang='eng' dir='ltr'><em>(AJ005972)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 210 306 768 356; baseline 0 -29"><span class='ocrx_word' id='word_1_61' title='bbox 210 308 383 356; x_wconf 69' lang='eng' dir='ltr'><em>ECeIIu/ophaga</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 393 308 480 328; x_wconf 83' lang='eng' dir='ltr'><em>fucico/a</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 490 306 625 327; x_wconf 83' lang='eng' dir='ltr'><em>NNO15860T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 634 308 768 333; x_wconf 83' lang='eng' dir='ltr'><em>(AJ005973)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 169 343 758 370; baseline 0 -5"><span class='ocrx_word' id='word_1_65' title='bbox 169 344 205 361; x_wconf 89' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 249 346 399 370; x_wconf 82' lang='eng' dir='ltr'><em>Cellulophaga</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 408 346 467 370; x_wconf 82' lang='eng' dir='ltr'><em>Iytica</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 476 345 546 365; x_wconf 88' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 555 343 638 365; x_wconf 83' lang='eng' dir='ltr'><em>23178T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 648 346 758 370; x_wconf 84' lang='eng' dir='ltr'><em>(M62796)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 115 383 853 410; baseline 0 -6"><span class='ocrx_word' id='word_1_71' title='bbox 115 390 139 407; x_wconf 85' lang='eng'><em>90</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 287 385 438 410; x_wconf 85' lang='eng' dir='ltr'><em>Robiginitalea</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 447 385 555 404; x_wconf 82' lang='eng' dir='ltr'><em>biformata</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 565 383 706 404; x_wconf 79' lang='eng' dir='ltr'><em>HTCC2501T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 716 385 853 410; x_wconf 87' lang='eng' dir='ltr'><em>(AY424899)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 73 421 924 448; baseline -0.002 -3"><span class='ocrx_word' id='word_1_76' title='bbox 73 428 97 446; x_wconf 85' lang='eng'><em>62</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 291 424 502 443; x_wconf 77' lang='eng' dir='ltr'><em>Zeaxanthinibacter</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 509 424 669 443; x_wconf 87' lang='eng' dir='ltr'><em>enoshimensis</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 677 421 779 443; x_wconf 78' lang='eng' dir='ltr'><em>TD-ZE3T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 786 424 924 448; x_wconf 78' lang='eng' dir='ltr'><em>(A3264057)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 320 459 945 486; baseline 0 -5"><span class='ocrx_word' id='word_1_81' title='bbox 320 462 455 481; x_wconf 83' lang='eng' dir='ltr'><em>Vite/Iibacter</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 462 462 652 481; x_wconf 81' lang='eng' dir='ltr'><em>v/adivostokensis</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 662 462 720 481; x_wconf 93' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 730 459 798 481; x_wconf 79' lang='eng' dir='ltr'><em>3516T</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 807 461 945 486; x_wconf 85' lang='eng' dir='ltr'><em>(ABO71382)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 128 486 919 525; baseline 0 -5"><span class='ocrx_word' id='word_1_86' title='bbox 128 486 149 503; x_wconf 64' lang='eng'>51</span> <span class='ocrx_word' id='word_1_87' title='bbox 330 500 461 520; x_wconf 77' lang='eng' dir='ltr'><em>Costenonia</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 471 502 588 525; x_wconf 77' lang='eng' dir='ltr'><em>aggregate</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 598 500 676 520; x_wconf 88' lang='eng' dir='ltr'><em>KOPRI</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 688 498 770 520; x_wconf 78' lang='eng' dir='ltr'><em>13342T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 777 500 919 525; x_wconf 85' lang='eng' dir='ltr'><em>(DQ167246)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 148 536 905 569; baseline 0 -11"><span class='ocrx_word' id='word_1_92' title='bbox 148 552 159 569; x_wconf 74' lang='eng'>9</span> <span class='ocrx_word' id='word_1_93' title='bbox 199 539 470 563; x_wconf 84' lang='eng' dir='ltr'><em>-FIage/limonas</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 479 539 589 558; x_wconf 83' lang='eng' dir='ltr'><em>eckloniae</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 599 538 692 558; x_wconf 91' lang='eng' dir='ltr'>DOKDO</span> <span class='ocrx_word' id='word_1_96' title='bbox 702 536 905 563; x_wconf 77' lang='eng' dir='ltr'><em>007T(DQ191180)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 172 575 845 606; baseline 0 -9"><span class='ocrx_word' id='word_1_97' title='bbox 172 575 207 606; x_wconf 45' lang='eng'><em>9’8.</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 345 578 466 597; x_wconf 83' lang='eng' dir='ltr'><em>Muricauda</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 476 578 599 597; x_wconf 84' lang='eng' dir='ltr'><em>flavescens</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 608 576 698 597; x_wconf 79' lang='eng' dir='ltr'><em>SW-62T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 707 578 845 603; x_wconf 87' lang='eng' dir='ltr'><em>(AY445073)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 92 614 815 656; baseline -0.001 -20"><span class='ocrx_word' id='word_1_102' title='bbox 92 639 117 656; x_wconf 72' lang='eng'><em>57</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 236 622 272 639; x_wconf 80' lang='eng'>100</span> <span class='ocrx_word' id='word_1_104' title='bbox 279 625 322 646; x_wconf 35' lang='eng'><em>»*</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 327 616 448 636; x_wconf 86' lang='eng' dir='ltr'><em>Muricauda</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 457 616 621 641; x_wconf 83' lang='eng' dir='ltr'><em>ruestringensis</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 630 614 671 635; x_wconf 92' lang='eng' dir='ltr'><em>B1T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 678 616 815 641; x_wconf 86' lang='eng' dir='ltr'><em>(AF218782)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 261 651 816 680; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 261 651 285 668; x_wconf 78' lang='eng'>92</span> <span class='ocrx_word' id='word_1_110' title='bbox 291 664 307 665; x_wconf 36' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 313 655 434 675; x_wconf 85' lang='eng' dir='ltr'><em>Muricauda</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 443 655 572 680; x_wconf 86' lang='eng' dir='ltr'><em>aquimarina</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 581 653 671 675; x_wconf 81' lang='eng' dir='ltr'><em>SW-63T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 678 655 816 680; x_wconf 89' lang='eng' dir='ltr'><em>(AY445075)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 215 691 853 718; baseline 0 -6"><span class='ocrx_word' id='word_1_115' title='bbox 215 700 252 718; x_wconf 76' lang='eng'>100</span> <span class='ocrx_word' id='word_1_116' title='bbox 266 693 357 713; x_wconf 86' lang='eng' dir='ltr'><em>Zobellia</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 366 693 550 718; x_wconf 84' lang='eng' dir='ltr'><em>galactanivorans</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 559 693 614 713; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 626 691 707 713; x_wconf 85' lang='eng' dir='ltr'><em>12802T</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 717 693 853 718; x_wconf 81' lang='eng' dir='ltr'><em>(AF208293)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 202 730 753 758; baseline 0.002 -7"><span class='ocrx_word' id='word_1_121' title='bbox 202 741 238 758; x_wconf 73' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 262 732 353 752; x_wconf 84' lang='eng' dir='ltr'><em>Zobellia</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 363 732 464 757; x_wconf 87' lang='eng' dir='ltr'><em>uliginosa</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 473 732 544 752; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 555 730 636 752; x_wconf 87' lang='eng' dir='ltr'><em>14397T</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 643 732 753 757; x_wconf 85' lang='eng' dir='ltr'><em>(M62799)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 45 701 772 857; baseline 0 -68"><span class='ocrx_word' id='word_1_127' title='bbox 45 792 69 810; x_wconf 72' lang='eng'><em>97</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 162 701 373 857; x_wconf 32' lang='eng' dir='ltr'><em>‘QZobeI/ia</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 382 770 470 789; x_wconf 87' lang='eng' dir='ltr'><em>russeI/ii</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 478 770 532 789; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 542 768 625 789; x_wconf 91' lang='eng' dir='ltr'><em>22071T</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 634 770 772 795; x_wconf 84' lang='eng' dir='ltr'><em>(AB121976)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 215 807 835 834; baseline -0.002 -5"><span class='ocrx_word' id='word_1_133' title='bbox 215 812 240 829; x_wconf 84' lang='eng'>66</span> <span class='ocrx_word' id='word_1_134' title='bbox 271 809 362 829; x_wconf 70' lang='eng' dir='ltr'><em>Zobellia</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 371 809 532 834; x_wconf 83' lang='eng' dir='ltr'><em>amurskyensis</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 541 809 595 829; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 604 807 687 829; x_wconf 84' lang='eng' dir='ltr'><em>22069T</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 697 809 835 834; x_wconf 84' lang='eng' dir='ltr'><em>(AB121974)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 130 839 786 872; baseline -0.003 -4"><span class='ocrx_word' id='word_1_139' title='bbox 130 839 168 868; x_wconf 70' lang='eng'><em>9—7&#39;</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 225 844 249 861; x_wconf 84' lang='eng'>97</span> <span class='ocrx_word' id='word_1_141' title='bbox 275 847 366 866; x_wconf 87' lang='eng' dir='ltr'><em>Zobe/Iia</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 375 847 495 866; x_wconf 87' lang='eng' dir='ltr'><em>laminariae</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 505 847 563 866; x_wconf 94' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 573 845 641 866; x_wconf 77' lang='eng' dir='ltr'><em>3676T</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 648 847 786 872; x_wconf 85' lang='eng' dir='ltr'><em>(AB121975)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 247 885 847 912; baseline 0 -5"><span class='ocrx_word' id='word_1_146' title='bbox 247 887 372 907; x_wconf 80' lang='eng' dir='ltr'><em>Maribacter</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 377 887 539 912; x_wconf 81' lang='eng' dir='ltr'><em>polysiphoniae</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 548 887 602 907; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 612 887 680 907; x_wconf 85' lang='eng'><em>23671</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 685 885 695 898; x_wconf 70' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_151' title='bbox 704 887 847 912; x_wconf 85' lang='eng' dir='ltr'><em>(AM497875)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 155 894 787 973; baseline -0.002 -27"><span class='ocrx_word' id='word_1_152' title='bbox 155 894 379 973; x_wconf 56' lang='eng' dir='ltr'><em>QEEMaribacter</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 385 926 494 951; x_wconf 84' lang='eng' dir='ltr'><em>aquivivus</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 503 926 561 945; x_wconf 93' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 571 924 639 946; x_wconf 76' lang='eng' dir='ltr'><em>3949T</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 649 926 787 951; x_wconf 89' lang='eng' dir='ltr'><em>(AY271625)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 175 959 858 988; baseline 0.001 -6"><span class='ocrx_word' id='word_1_157' title='bbox 175 959 199 976; x_wconf 67' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 261 963 386 983; x_wconf 83' lang='eng' dir='ltr'><em>Maribacter</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 392 963 540 983; x_wconf 84' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 549 963 618 983; x_wconf 93' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 629 961 711 983; x_wconf 78' lang='eng' dir='ltr'><em>12393T</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 720 963 858 988; x_wconf 84' lang='eng' dir='ltr'><em>(AY960749)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 126 999 827 1050; baseline 0 -30"><span class='ocrx_word' id='word_1_163' title='bbox 126 1001 390 1050; x_wconf 51' lang='eng' dir='ltr'><em>ﬂan/beater</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 395 1001 528 1025; x_wconf 84' lang='eng' dir='ltr'><em>palladensis</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 537 1001 591 1020; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 600 999 683 1020; x_wconf 72' lang='eng' dir='ltr'><em>21972T</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 693 1001 827 1026; x_wconf 84' lang='eng' dir='ltr'><em>(AJ575643)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 144 1035 804 1065; baseline 0 -6"><span class='ocrx_word' id='word_1_168' title='bbox 144 1035 180 1052; x_wconf 83' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 280 1040 527 1060; x_wconf 83' lang='eng' dir='ltr'><em>Arenibacter/atericius</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 537 1040 594 1059; x_wconf 94' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 604 1038 658 1060; x_wconf 77' lang='eng' dir='ltr'><em>426T</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 668 1040 804 1065; x_wconf 89' lang='eng' dir='ltr'><em>(AF052742)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 265 1077 834 1104; baseline -0.002 -5"><span class='ocrx_word' id='word_1_173' title='bbox 265 1079 443 1099; x_wconf 84' lang='eng' dir='ltr'><em>Flavobacterium</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 452 1079 543 1104; x_wconf 80' lang='eng' dir='ltr'><em>aquatile</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 552 1079 622 1099; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 633 1077 714 1099; x_wconf 80' lang='eng' dir='ltr'><em>11947T</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 724 1079 834 1104; x_wconf 82' lang='eng' dir='ltr'><em>(M62797)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 235 1115 725 1142; baseline 0 -6"><span class='ocrx_word' id='word_1_178' title='bbox 235 1117 419 1142; x_wconf 76' lang='eng' dir='ltr'><em>Salegentibacter</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 426 1118 503 1136; x_wconf 81' lang='eng' dir='ltr'><em>catena</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 513 1115 573 1136; x_wconf 88' lang='eng' dir='ltr'><em>HY1T</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 582 1117 725 1142; x_wconf 87' lang='eng' dir='ltr'><em>(DQ640642)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 66 1154 944 1183; baseline -0.001 -7"><span class='ocrx_word' id='word_1_182' title='bbox 66 1166 90 1183; x_wconf 71' lang='eng'><em>68</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 120 1164 238 1166; x_wconf 34' lang='eng'><strong>#</strong></span> <span class='ocrx_word' id='word_1_184' title='bbox 245 1156 416 1176; x_wconf 73' lang='eng' dir='ltr'><em>Gaetbulibacter</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 422 1156 627 1176; x_wconf 86' lang='eng' dir='ltr'><em>saemankumensis</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 636 1156 705 1176; x_wconf 91' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_187' title='bbox 717 1154 797 1176; x_wconf 81' lang='eng' dir='ltr'><em>12379T</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 807 1156 944 1181; x_wconf 87' lang='eng' dir='ltr'><em>(AY883937)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 89 1189 756 1216; baseline -0.003 0"><span class='ocrx_word' id='word_1_189' title='bbox 89 1189 126 1216; x_wconf 51' lang='eng'><em>9—8.</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 224 1194 341 1214; x_wconf 86' lang='eng' dir='ltr'><em>U/vibacter</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 348 1194 474 1214; x_wconf 82' lang='eng' dir='ltr'><em>antarcticus</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 484 1192 618 1214; x_wconf 89' lang='eng' dir='ltr'><em>|MCC3101T</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 637 1194 756 1214; x_wconf 85' lang='eng' dir='ltr'><em>EF554364</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 120 1194 764 1246; baseline -0.006 0"><span class='ocrx_word' id='word_1_194' title='bbox 120 1203 226 1246; x_wconf 47' lang='eng' dir='ltr'><em>WC</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 628 1194 634 1219; x_wconf 67' lang='eng'><strong>‘</strong></span> <span class='ocrx_word' id='word_1_196' title='bbox 758 1194 764 1219; x_wconf 57' lang='eng'><em>)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 156 1229 755 1260">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 156 1229 755 1260">
+     <span class='ocr_line' id='line_1_60' title="bbox 156 1229 755 1260; baseline 0 -6"><span class='ocrx_word' id='word_1_197' title='bbox 156 1229 167 1246; x_wconf 82' lang='eng'>0</span> <span class='ocrx_word' id='word_1_198' title='bbox 232 1235 350 1255; x_wconf 81' lang='eng' dir='ltr'><em>U/vibacter</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 355 1235 437 1255; x_wconf 85' lang='eng' dir='ltr'><em>Iitoralis</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 446 1235 515 1255; x_wconf 85' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 527 1233 607 1254; x_wconf 72' lang='eng' dir='ltr'><em>12104T</em></span> <span class='ocrx_word' id='word_1_202' title='bbox 617 1235 755 1260; x_wconf 84' lang='eng' dir='ltr'><em>(AY243096)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003228-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003228-0-001.pbm.png
new file mode 100644
index 00000000..6f467cdf
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003228-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003228-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003228-0-001.pbm.png.hocr
new file mode 100644
index 00000000..b0a142f7
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003228-0-001.pbm.png.hocr
@@ -0,0 +1,492 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003228-0-001.pbm.png"; bbox 0 0 1302 790; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 34 62 79 75">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 34 62 79 75">
+     <span class='ocr_line' id='line_1_1' title="bbox 34 62 79 75; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 34 62 43 75; x_wconf 90' lang='eng' dir='ltr'>O</span> <span class='ocrx_word' id='word_1_2' title='bbox 49 62 79 75; x_wconf 83' lang='eng'><em>005</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 132 245 151 259">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 132 245 151 259">
+     <span class='ocr_line' id='line_1_2' title="bbox 132 245 151 259; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 132 245 151 259; x_wconf 82' lang='eng'><em>85</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 200 83 219 97">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 200 83 219 97">
+     <span class='ocr_line' id='line_1_3' title="bbox 200 83 219 97; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 200 83 219 97; x_wconf 85' lang='eng'><em>50</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 253 42 272 56">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 253 42 272 56">
+     <span class='ocr_line' id='line_1_4' title="bbox 253 42 272 56; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 253 42 272 56; x_wconf 86' lang='eng'><em>72</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 313 4 873 31">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 313 6 873 29">
+     <span class='ocr_line' id='line_1_5' title="bbox 313 6 873 29; baseline 0.002 -6"><span class='ocrx_word' id='word_1_6' title='bbox 313 16 332 29; x_wconf 71' lang='eng'>99</span> <span class='ocrx_word' id='word_1_7' title='bbox 341 15 387 17; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_8' title='bbox 393 7 559 28; x_wconf 77' lang='eng' dir='ltr'><em>Planotelraspora</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 567 7 611 24; x_wconf 86' lang='eng' dir='ltr'><em>mira</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 621 6 685 24; x_wconf 90' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 696 6 767 24; x_wconf 77' lang='eng' dir='ltr'><em>15435T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 776 7 873 28; x_wconf 82' lang='eng' dir='ltr'><em>(D85496)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 279 33 341 35">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 279 33 341 35">
+     <span class='ocr_line' id='line_1_6' title="bbox 279 33 341 35; baseline 0 755"><span class='ocrx_word' id='word_1_13' title='bbox 279 33 341 35; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 226 59 281 63">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 226 59 281 63">
+     <span class='ocr_line' id='line_1_7' title="bbox 226 59 281 63; baseline 0 727"><span class='ocrx_word' id='word_1_14' title='bbox 226 59 281 63; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 192 101 228 103">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 192 101 228 103">
+     <span class='ocr_line' id='line_1_8' title="bbox 192 101 228 103; baseline 0 687"><span class='ocrx_word' id='word_1_15' title='bbox 192 101 228 103; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 165 145 184 158">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 165 145 184 158">
+     <span class='ocr_line' id='line_1_9' title="bbox 165 145 184 158; baseline 0 0"><span class='ocrx_word' id='word_1_16' title='bbox 165 145 184 158; x_wconf 82' lang='eng'><em>65</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 226 60 228 143">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 226 60 228 143">
+     <span class='ocr_line' id='line_1_10' title="bbox 226 60 228 143; baseline 0 647"><span class='ocrx_word' id='word_1_17' title='bbox 226 60 228 143; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 226 141 279 144">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 226 141 279 144">
+     <span class='ocr_line' id='line_1_11' title="bbox 226 141 279 144; baseline 0 646"><span class='ocrx_word' id='word_1_18' title='bbox 226 141 279 144; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 276 33 282 161">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 276 33 282 161">
+     <span class='ocr_line' id='line_1_12' title="bbox 276 33 282 161; baseline 0 629"><span class='ocrx_word' id='word_1_19' title='bbox 276 33 282 161; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 338 15 342 53">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 338 15 342 53">
+     <span class='ocr_line' id='line_1_13' title="bbox 338 15 342 53; baseline 0 737"><span class='ocrx_word' id='word_1_20' title='bbox 338 15 342 53; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 341 40 859 67">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 341 42 859 64">
+     <span class='ocr_line' id='line_1_14' title="bbox 341 42 859 64; baseline -0.002 -4"><span class='ocrx_word' id='word_1_21' title='bbox 341 43 523 64; x_wconf 32' lang='eng' dir='ltr'><em>iPlanotelraspora</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 531 43 614 60; x_wconf 78' lang='eng' dir='ltr'><em>silvatica</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 622 43 649 59; x_wconf 96' lang='eng' dir='ltr'>TT</span> <span class='ocrx_word' id='word_1_24' title='bbox 658 42 726 60; x_wconf 86' lang='eng' dir='ltr'><em>00-51T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 735 43 859 64; x_wconf 81' lang='eng' dir='ltr'><em>(AB112082)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 281 75 968 104">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 281 78 968 100">
+     <span class='ocr_line' id='line_1_15' title="bbox 281 78 968 100; baseline 0 -4"><span class='ocrx_word' id='word_1_26' title='bbox 281 79 563 100; x_wconf 42' lang='eng' dir='ltr'><em>iPlanotetraspora</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 572 79 694 96; x_wconf 84' lang='eng' dir='ltr'><em>thailandica</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 703 78 751 96; x_wconf 88' lang='eng' dir='ltr'><em>BCC</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 760 78 833 96; x_wconf 85' lang='eng' dir='ltr'><em>21825T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 841 79 968 100; x_wconf 71' lang='eng' dir='ltr'><em>(ABS70244)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 421 113 882 138">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 421 114 882 136">
+     <span class='ocr_line' id='line_1_16' title="bbox 421 114 882 136; baseline 0 -4"><span class='ocrx_word' id='word_1_31' title='bbox 421 115 554 136; x_wconf 84' lang='eng' dir='ltr'><em>Microbispora</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 563 119 620 132; x_wconf 79' lang='eng' dir='ltr'><em>rosea</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 629 114 693 132; x_wconf 86' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 704 114 776 132; x_wconf 74' lang='eng' dir='ltr'><em>14044T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 785 115 882 136; x_wconf 79' lang='eng'><em>(086936)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 159 157 451 163">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 159 157 451 163">
+     <span class='ocr_line' id='line_1_17' title="bbox 159 157 451 163; baseline 0 627"><span class='ocrx_word' id='word_1_36' title='bbox 159 157 451 163; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 191 101 194 225">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 191 101 194 225">
+     <span class='ocr_line' id='line_1_18' title="bbox 191 101 194 225; baseline 0 565"><span class='ocrx_word' id='word_1_37' title='bbox 191 101 194 225; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 251 154 271 167">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 251 154 271 167">
+     <span class='ocr_line' id='line_1_19' title="bbox 251 154 271 167; baseline 0 0"><span class='ocrx_word' id='word_1_38' title='bbox 251 154 271 167; x_wconf 83' lang='eng'><em>76</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 421 148 1003 211">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 422 150 1002 208">
+     <span class='ocr_line' id='line_1_20' title="bbox 457 150 1002 172; baseline 0 -4"><span class='ocrx_word' id='word_1_39' title='bbox 457 151 590 172; x_wconf 74' lang='eng' dir='ltr'><em>Microbispora</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 599 151 741 172; x_wconf 82' lang='eng' dir='ltr'><em>chromogenes</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 750 150 814 168; x_wconf 91' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 825 150 897 168; x_wconf 72' lang='eng' dir='ltr'><em>14876T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 905 151 1002 172; x_wconf 84' lang='eng' dir='ltr'><em>(U48989)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 422 186 941 208; baseline 0 -4"><span class='ocrx_word' id='word_1_44' title='bbox 422 187 585 208; x_wconf 76' lang='eng' dir='ltr'><em>Microtetraspora</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 593 187 728 208; x_wconf 70' lang='eng' dir='ltr'><em>malaysiensis</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 737 186 808 204; x_wconf 78' lang='eng' dir='ltr'><em>H47-7T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 816 187 941 208; x_wconf 76' lang='eng' dir='ltr'><em>(A8062383)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 332 196 416 197">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 332 196 416 197">
+     <span class='ocr_line' id='line_1_22' title="bbox 332 196 416 197; baseline 0 593"><span class='ocrx_word' id='word_1_48' title='bbox 332 196 416 197; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 192 222 332 226">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 192 222 332 226">
+     <span class='ocr_line' id='line_1_23' title="bbox 192 222 332 226; baseline 0 564"><span class='ocrx_word' id='word_1_49' title='bbox 192 222 332 226; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 109 263 160 265">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 109 263 160 265">
+     <span class='ocr_line' id='line_1_24' title="bbox 109 263 160 265; baseline 0 525"><span class='ocrx_word' id='word_1_50' title='bbox 109 263 160 265; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 7 413 111 417">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 7 413 111 417">
+     <span class='ocr_line' id='line_1_25' title="bbox 7 413 111 417; baseline 0 373"><span class='ocrx_word' id='word_1_51' title='bbox 7 413 111 417; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 5 414 10 775">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 5 414 10 775">
+     <span class='ocr_line' id='line_1_26' title="bbox 5 414 10 775; baseline 0 15"><span class='ocrx_word' id='word_1_52' title='bbox 5 414 10 775; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 107 263 113 567">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 107 263 113 567">
+     <span class='ocr_line' id='line_1_27' title="bbox 107 263 113 567; baseline 0 223"><span class='ocrx_word' id='word_1_53' title='bbox 107 263 113 567; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 157 162 161 365">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 157 162 161 365">
+     <span class='ocr_line' id='line_1_28' title="bbox 157 162 161 365; baseline 0 425"><span class='ocrx_word' id='word_1_54' title='bbox 157 162 161 365; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 253 304 272 318">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 253 304 272 318">
+     <span class='ocr_line' id='line_1_29' title="bbox 253 304 272 318; baseline -0.053 0"><span class='ocrx_word' id='word_1_55' title='bbox 253 304 272 318; x_wconf 76' lang='eng'><em>94</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 304 235 323 248">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 304 235 323 248">
+     <span class='ocr_line' id='line_1_30' title="bbox 304 235 323 248; baseline 0 0"><span class='ocrx_word' id='word_1_56' title='bbox 304 235 323 248; x_wconf 83' lang='eng'><em>99</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 203 321 281 325">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 203 321 281 325">
+     <span class='ocr_line' id='line_1_31' title="bbox 203 321 281 325; baseline 0 465"><span class='ocrx_word' id='word_1_57' title='bbox 203 321 281 325; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 158 363 205 365">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 158 363 205 365">
+     <span class='ocr_line' id='line_1_32' title="bbox 158 363 205 365; baseline 0 425"><span class='ocrx_word' id='word_1_58' title='bbox 158 363 205 365; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 177 375 197 388">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 177 375 197 388">
+     <span class='ocr_line' id='line_1_33' title="bbox 177 375 197 388; baseline 0 0"><span class='ocrx_word' id='word_1_59' title='bbox 177 375 197 388; x_wconf 73' lang='eng'><em>78</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 202 322 206 405">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 202 322 206 405">
+     <span class='ocr_line' id='line_1_34' title="bbox 202 322 206 405; baseline 0 385"><span class='ocrx_word' id='word_1_60' title='bbox 202 322 206 405; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 204 403 255 406">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 204 403 255 406">
+     <span class='ocr_line' id='line_1_35' title="bbox 204 403 255 406; baseline 0 384"><span class='ocrx_word' id='word_1_61' title='bbox 204 403 255 406; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 253 377 255 432">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 253 377 255 432">
+     <span class='ocr_line' id='line_1_36' title="bbox 253 377 255 432; baseline 0 358"><span class='ocrx_word' id='word_1_62' title='bbox 253 377 255 432; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 228 416 247 429">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 228 416 247 429">
+     <span class='ocr_line' id='line_1_37' title="bbox 228 416 247 429; baseline 0 0"><span class='ocrx_word' id='word_1_63' title='bbox 228 416 247 429; x_wconf 82' lang='eng'>74</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 279 304 281 342">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 279 304 281 342">
+     <span class='ocr_line' id='line_1_38' title="bbox 279 304 281 342; baseline 0 448"><span class='ocrx_word' id='word_1_64' title='bbox 279 304 281 342; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 255 377 339 378">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 255 377 339 378">
+     <span class='ocr_line' id='line_1_39' title="bbox 255 377 339 378; baseline 0 412"><span class='ocrx_word' id='word_1_65' title='bbox 255 377 339 378; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 281 304 353 306">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 281 304 353 306">
+     <span class='ocr_line' id='line_1_40' title="bbox 281 304 353 306; baseline 0 484"><span class='ocrx_word' id='word_1_66' title='bbox 281 304 353 306; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 281 340 366 342">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 281 340 366 342">
+     <span class='ocr_line' id='line_1_41' title="bbox 281 340 366 342; baseline 0 448"><span class='ocrx_word' id='word_1_67' title='bbox 281 340 366 342; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 317 219 1094 428">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 413 222 934 244">
+     <span class='ocr_line' id='line_1_42' title="bbox 413 222 934 244; baseline 0 -4"><span class='ocrx_word' id='word_1_68' title='bbox 413 223 609 244; x_wconf 37' lang='eng' dir='ltr'><em>iMicrotetraspora</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 617 223 673 240; x_wconf 82' lang='eng' dir='ltr'><em>fusoa</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 682 223 745 240; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_71' title='bbox 756 222 828 240; x_wconf 74' lang='eng' dir='ltr'><em>13915T</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 837 223 934 244; x_wconf 82' lang='eng' dir='ltr'><em>(U48973)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 359 258 965 317">
+     <span class='ocr_line' id='line_1_43' title="bbox 413 258 965 281; baseline 0 -5"><span class='ocrx_word' id='word_1_73' title='bbox 413 268 458 270; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_74' title='bbox 465 259 627 280; x_wconf 79' lang='eng' dir='ltr'><em>Microtetraspora</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 634 259 703 281; x_wconf 87' lang='eng' dir='ltr'><em>glauca</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 713 259 777 276; x_wconf 87' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_77' title='bbox 787 258 859 276; x_wconf 83' lang='eng' dir='ltr'><em>14761T</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 868 259 965 280; x_wconf 85' lang='eng' dir='ltr'><em>(U48974)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 359 294 858 317; baseline 0 -4"><span class='ocrx_word' id='word_1_79' title='bbox 359 295 499 317; x_wconf 85' lang='eng' dir='ltr'><em>Herbidospora</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 508 296 597 313; x_wconf 82' lang='eng' dir='ltr'><em>cretacea</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 606 295 670 313; x_wconf 84' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_82' title='bbox 681 294 753 313; x_wconf 74' lang='eng' dir='ltr'><em>15474T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 762 295 858 317; x_wconf 79' lang='eng'><em>(085485)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 317 331 1093 425">
+     <span class='ocr_line' id='line_1_45' title="bbox 371 331 1093 353; baseline -0.001 -4"><span class='ocrx_word' id='word_1_84' title='bbox 371 331 569 353; x_wconf 68' lang='eng' dir='ltr'><em>Streptosporangium</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 578 332 732 353; x_wconf 83' lang='eng' dir='ltr'><em>[Herbidospora]</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 741 331 847 349; x_wconf 82' lang='eng' dir='ltr'><em>claviforme</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 856 331 905 349; x_wconf 82' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 914 331 988 348; x_wconf 75' lang='eng' dir='ltr'><em>44127T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 997 332 1093 353; x_wconf 83' lang='eng' dir='ltr'><em>(X89940)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 343 367 905 389; baseline -0.002 -4"><span class='ocrx_word' id='word_1_90' title='bbox 343 368 509 389; x_wconf 83' lang='eng' dir='ltr'><em>Acrocarpospora</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 518 368 616 389; x_wconf 83' lang='eng' dir='ltr'><em>corrugata</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 625 367 689 385; x_wconf 85' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 700 367 772 385; x_wconf 73' lang='eng' dir='ltr'><em>13972T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 780 368 905 389; x_wconf 80' lang='eng' dir='ltr'><em>(AB188150)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 317 403 919 425; baseline 0 -4"><span class='ocrx_word' id='word_1_95' title='bbox 317 404 581 425; x_wconf 41' lang='eng' dir='ltr'><em>iAcrocarpospora</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 588 404 718 425; x_wconf 82' lang='eng' dir='ltr'><em>p/eiomorpha</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 728 403 786 421; x_wconf 78' lang='eng' dir='ltr'><em>R-31T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 794 404 919 425; x_wconf 84' lang='eng' dir='ltr'><em>(ABOO6174)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 329 196 333 251">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 329 196 333 251">
+     <span class='ocr_line' id='line_1_48' title="bbox 329 196 333 251; baseline 0 539"><span class='ocrx_word' id='word_1_99' title='bbox 329 196 333 251; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 330 250 413 251">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 330 250 413 251">
+     <span class='ocr_line' id='line_1_49' title="bbox 330 250 413 251; baseline 0 539"><span class='ocrx_word' id='word_1_100' title='bbox 330 250 413 251; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 411 232 413 270">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 411 232 413 270">
+     <span class='ocr_line' id='line_1_50' title="bbox 411 232 413 270; baseline 0 520"><span class='ocrx_word' id='word_1_101' title='bbox 411 232 413 270; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 385 262 404 275">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 385 262 404 275">
+     <span class='ocr_line' id='line_1_51' title="bbox 385 262 404 275; baseline 0 0"><span class='ocrx_word' id='word_1_102' title='bbox 385 262 404 275; x_wconf 77' lang='eng'><em>99</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 253 431 317 432">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 253 431 317 432">
+     <span class='ocr_line' id='line_1_52' title="bbox 253 431 317 432; baseline 0 358"><span class='ocrx_word' id='word_1_103' title='bbox 253 431 317 432; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 238 484 257 498">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 238 485 257 498">
+     <span class='ocr_line' id='line_1_53' title="bbox 238 485 257 498; baseline 0 0"><span class='ocrx_word' id='word_1_104' title='bbox 238 485 257 498; x_wconf 84' lang='eng'><em>96</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 181 502 266 506">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 181 502 266 506">
+     <span class='ocr_line' id='line_1_54' title="bbox 181 502 266 506; baseline 0 284"><span class='ocrx_word' id='word_1_105' title='bbox 181 502 266 506; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 109 566 183 567">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 109 566 183 567">
+     <span class='ocr_line' id='line_1_55' title="bbox 109 566 183 567; baseline 0 223"><span class='ocrx_word' id='word_1_106' title='bbox 109 566 183 567; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 155 578 174 591">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 155 578 174 591">
+     <span class='ocr_line' id='line_1_56' title="bbox 155 578 174 591; baseline 0 0"><span class='ocrx_word' id='word_1_107' title='bbox 155 578 174 591; x_wconf 80' lang='eng'>83</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 180 503 184 631">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 180 503 184 631">
+     <span class='ocr_line' id='line_1_57' title="bbox 180 503 184 631; baseline 0 159"><span class='ocrx_word' id='word_1_108' title='bbox 180 503 184 631; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 264 485 266 522">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 264 485 266 522">
+     <span class='ocr_line' id='line_1_58' title="bbox 264 485 266 522; baseline 0 268"><span class='ocrx_word' id='word_1_109' title='bbox 264 485 266 522; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 289 443 308 456">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 289 443 308 456">
+     <span class='ocr_line' id='line_1_59' title="bbox 289 443 308 456; baseline 0 0"><span class='ocrx_word' id='word_1_110' title='bbox 289 443 308 456; x_wconf 82' lang='eng'><em>89</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 315 413 317 450">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 315 413 317 450">
+     <span class='ocr_line' id='line_1_60' title="bbox 315 413 317 450; baseline 0 340"><span class='ocrx_word' id='word_1_111' title='bbox 315 413 317 450; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 266 436 984 486">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 317 439 984 461">
+     <span class='ocr_line' id='line_1_61' title="bbox 317 439 984 461; baseline 0 -4"><span class='ocrx_word' id='word_1_112' title='bbox 317 440 539 461; x_wconf 39' lang='eng' dir='ltr'><em>iAcrocarpospora</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 548 440 695 461; x_wconf 81' lang='eng' dir='ltr'><em>macrocephala</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 704 440 768 457; x_wconf 87' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 779 439 851 457; x_wconf 79' lang='eng' dir='ltr'><em>16266T</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 859 440 984 461; x_wconf 77' lang='eng' dir='ltr'><em>(A8025318)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 466 473 936 500">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 466 475 936 497">
+     <span class='ocr_line' id='line_1_62' title="bbox 466 475 936 497; baseline 0 -4"><span class='ocrx_word' id='word_1_117' title='bbox 466 476 601 493; x_wconf 84' lang='eng' dir='ltr'><em>Nonomuraea</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 608 476 675 497; x_wconf 80' lang='eng' dir='ltr'><em>pusi/la</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 684 476 748 493; x_wconf 91' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 759 475 831 493; x_wconf 79' lang='eng' dir='ltr'><em>14684T</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 839 476 936 497; x_wconf 85' lang='eng' dir='ltr'><em>(D85491)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 266 509 1004 537">
+    <p class='ocr_par' dir='ltr' id='par_1_59' title="bbox 266 511 1004 534">
+     <span class='ocr_line' id='line_1_63' title="bbox 266 511 1004 534; baseline 0 -5"><span class='ocrx_word' id='word_1_122' title='bbox 266 521 478 522; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_123' title='bbox 484 512 619 529; x_wconf 86' lang='eng' dir='ltr'><em>Nonomuraea</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 627 512 743 534; x_wconf 74' lang='eng' dir='ltr'><em>angiospora</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 752 512 816 529; x_wconf 87' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_126' title='bbox 827 511 899 529; x_wconf 82' lang='eng' dir='ltr'><em>13155T</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 908 512 1004 533; x_wconf 79' lang='eng' dir='ltr'><em>(U48843)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_58' title="bbox 394 545 1068 574">
+    <p class='ocr_par' dir='ltr' id='par_1_60' title="bbox 394 547 1068 570">
+     <span class='ocr_line' id='line_1_64' title="bbox 394 547 1068 570; baseline 0 -5"><span class='ocrx_word' id='word_1_128' title='bbox 394 557 423 570; x_wconf 43' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 555 548 691 570; x_wconf 83' lang='eng' dir='ltr'><em>Planobispora</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 699 548 807 570; x_wconf 80' lang='eng' dir='ltr'><em>Iongispora</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 816 548 880 565; x_wconf 86' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 891 547 963 565; x_wconf 74' lang='eng' dir='ltr'><em>13918T</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 972 548 1068 570; x_wconf 84' lang='eng' dir='ltr'><em>(D85494)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_59' title="bbox 253 574 429 578">
+    <p class='ocr_par' dir='ltr' id='par_1_61' title="bbox 253 574 429 578">
+     <span class='ocr_line' id='line_1_65' title="bbox 253 574 429 578; baseline 0 212"><span class='ocrx_word' id='word_1_134' title='bbox 253 574 429 578; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_60' title="bbox 428 557 429 595">
+    <p class='ocr_par' dir='ltr' id='par_1_62' title="bbox 428 557 429 595">
+     <span class='ocr_line' id='line_1_66' title="bbox 428 557 429 595; baseline 0 195"><span class='ocrx_word' id='word_1_135' title='bbox 428 557 429 595; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_61' title="bbox 429 593 493 595">
+    <p class='ocr_par' dir='ltr' id='par_1_63' title="bbox 429 593 493 595">
+     <span class='ocr_line' id='line_1_67' title="bbox 429 593 493 595; baseline 0 195"><span class='ocrx_word' id='word_1_136' title='bbox 429 593 493 595; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_62' title="bbox 497 581 957 609">
+    <p class='ocr_par' dir='ltr' id='par_1_64' title="bbox 497 583 957 606">
+     <span class='ocr_line' id='line_1_68' title="bbox 497 583 957 606; baseline 0 -4"><span class='ocrx_word' id='word_1_137' title='bbox 497 584 633 606; x_wconf 80' lang='eng' dir='ltr'><em>Planobispora</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 642 588 700 602; x_wconf 79' lang='eng' dir='ltr'><em>rosea</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 708 584 754 602; x_wconf 87' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 764 583 823 602; x_wconf 72' lang='eng' dir='ltr'><em>3166T</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 832 584 957 606; x_wconf 78' lang='eng' dir='ltr'><em>(A3028654)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_63' title="bbox 181 627 463 633">
+    <p class='ocr_par' dir='ltr' id='par_1_65' title="bbox 181 627 463 633">
+     <span class='ocr_line' id='line_1_69' title="bbox 181 627 463 633; baseline 0 157"><span class='ocrx_word' id='word_1_142' title='bbox 181 627 463 633; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_64' title="bbox 228 641 247 655">
+    <p class='ocr_par' dir='ltr' id='par_1_66' title="bbox 228 641 247 655">
+     <span class='ocr_line' id='line_1_70' title="bbox 228 641 247 655; baseline 0 0"><span class='ocrx_word' id='word_1_143' title='bbox 228 641 247 655; x_wconf 80' lang='eng' dir='ltr'><em>B7</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_65' title="bbox 253 575 255 685">
+    <p class='ocr_par' dir='ltr' id='par_1_67' title="bbox 253 575 255 685">
+     <span class='ocr_line' id='line_1_71' title="bbox 253 575 255 685; baseline 0 105"><span class='ocrx_word' id='word_1_144' title='bbox 253 575 255 685; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_66' title="bbox 320 617 955 646">
+    <p class='ocr_par' dir='ltr' id='par_1_68' title="bbox 320 620 955 643">
+     <span class='ocr_line' id='line_1_72' title="bbox 320 620 955 643; baseline 0 -5"><span class='ocrx_word' id='word_1_145' title='bbox 320 629 340 643; x_wconf 73' lang='eng'><em>64</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 469 620 646 642; x_wconf 83' lang='eng' dir='ltr'><em>Planomonospora</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 655 620 697 638; x_wconf 84' lang='eng' dir='ltr'><em>alba</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 706 620 751 638; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 761 620 821 638; x_wconf 82' lang='eng' dir='ltr'><em>9373T</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 830 620 955 642; x_wconf 76' lang='eng' dir='ltr'><em>(A3062381)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_67' title="bbox 307 647 348 649">
+    <p class='ocr_par' dir='ltr' id='par_1_69' title="bbox 307 647 348 649">
+     <span class='ocr_line' id='line_1_73' title="bbox 307 647 348 649; baseline 0 141"><span class='ocrx_word' id='word_1_151' title='bbox 307 647 348 649; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_68' title="bbox 253 684 309 685">
+    <p class='ocr_par' dir='ltr' id='par_1_70' title="bbox 253 684 309 685">
+     <span class='ocr_line' id='line_1_74' title="bbox 253 684 309 685; baseline 0 105"><span class='ocrx_word' id='word_1_152' title='bbox 253 684 309 685; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_69' title="bbox 282 696 300 709">
+    <p class='ocr_par' dir='ltr' id='par_1_71' title="bbox 283 696 299 709">
+     <span class='ocr_line' id='line_1_75' title="bbox 283 696 299 709; baseline 0 0"><span class='ocrx_word' id='word_1_153' title='bbox 283 696 299 709; x_wconf 64' lang='eng'>71</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_70' title="bbox 306 647 310 721">
+    <p class='ocr_par' dir='ltr' id='par_1_72' title="bbox 306 647 310 721">
+     <span class='ocr_line' id='line_1_76' title="bbox 306 647 310 721; baseline 0 69"><span class='ocrx_word' id='word_1_154' title='bbox 306 647 310 721; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_71' title="bbox 348 653 1093 718">
+    <p class='ocr_par' dir='ltr' id='par_1_73' title="bbox 348 656 1092 715">
+     <span class='ocr_line' id='line_1_77' title="bbox 460 656 1004 678; baseline 0 -4"><span class='ocrx_word' id='word_1_155' title='bbox 460 657 637 678; x_wconf 84' lang='eng' dir='ltr'><em>Planomonospora</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 645 657 746 678; x_wconf 79' lang='eng' dir='ltr'><em>sphaerica</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 755 656 800 674; x_wconf 88' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 810 656 871 674; x_wconf 77' lang='eng' dir='ltr'><em>9374T</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 879 657 1004 678; x_wconf 71' lang='eng' dir='ltr'><em>(ABDGZSBZ)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_78' title="bbox 348 692 1092 715; baseline 0 -5"><span class='ocrx_word' id='word_1_160' title='bbox 348 693 761 715; x_wconf 75' lang='eng' dir='ltr'><em>—Streptosporangium</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 769 697 846 710; x_wconf 82' lang='eng' dir='ltr'><em>roseum</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 855 693 904 710; x_wconf 85' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 913 692 988 710; x_wconf 73' lang='eng' dir='ltr'><em>4302‘]T</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 996 693 1092 714; x_wconf 84' lang='eng' dir='ltr'><em>(X89947)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_72' title="bbox 307 720 348 721">
+    <p class='ocr_par' dir='ltr' id='par_1_74' title="bbox 307 720 348 721">
+     <span class='ocr_line' id='line_1_79' title="bbox 307 720 348 721; baseline 0 69"><span class='ocrx_word' id='word_1_165' title='bbox 307 720 348 721; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_73' title="bbox 346 629 349 739">
+    <p class='ocr_par' dir='ltr' id='par_1_75' title="bbox 346 629 349 739">
+     <span class='ocr_line' id='line_1_80' title="bbox 346 629 349 739; baseline 0 51"><span class='ocrx_word' id='word_1_166' title='bbox 346 629 349 739; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_74' title="bbox 321 725 1297 754">
+    <p class='ocr_par' dir='ltr' id='par_1_76' title="bbox 321 728 1297 751">
+     <span class='ocr_line' id='line_1_81' title="bbox 321 728 1297 751; baseline 0 -5"><span class='ocrx_word' id='word_1_167' title='bbox 321 732 340 745; x_wconf 86' lang='eng'><em>55</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 617 729 815 751; x_wconf 79' lang='eng' dir='ltr'><em>Streptosporangium</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 824 729 1052 751; x_wconf 82' lang='eng' dir='ltr'><em>violaceochromogenes</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 1061 729 1110 746; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 1119 728 1193 746; x_wconf 71' lang='eng' dir='ltr'><em>43849T</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 1202 729 1297 750; x_wconf 83' lang='eng' dir='ltr'><em>(X89951)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_75' title="bbox 7 770 610 779">
+    <p class='ocr_par' dir='ltr' id='par_1_77' title="bbox 7 770 610 779">
+     <span class='ocr_line' id='line_1_82' title="bbox 7 770 610 779; baseline 0 11"><span class='ocrx_word' id='word_1_173' title='bbox 7 770 610 779; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_76' title="bbox 615 762 1106 790">
+    <p class='ocr_par' dir='ltr' id='par_1_78' title="bbox 615 764 1106 787">
+     <span class='ocr_line' id='line_1_83' title="bbox 615 764 1106 787; baseline 0 -5"><span class='ocrx_word' id='word_1_174' title='bbox 615 765 761 782; x_wconf 78' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 769 765 861 782; x_wconf 84' lang='eng' dir='ltr'><em>madurae</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 870 765 919 782; x_wconf 84' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 928 764 1002 782; x_wconf 78' lang='eng' dir='ltr'><em>43067T</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 1011 765 1106 787; x_wconf 84' lang='eng' dir='ltr'><em>(X97889)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003244-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003244-0-000.pbm.png
new file mode 100644
index 00000000..bd759fae
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003244-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003244-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003244-0-000.pbm.png.hocr
new file mode 100644
index 00000000..23554463
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003244-0-000.pbm.png.hocr
@@ -0,0 +1,265 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003244-0-000.pbm.png"; bbox 0 0 1302 1212; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 481 4 1266 47">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 481 4 1266 47">
+     <span class='ocr_line' id='line_1_1' title="bbox 481 4 1266 47; baseline 0 -20"><span class='ocrx_word' id='word_1_1' title='bbox 481 26 526 47; x_wconf 75' lang='eng'><em>574</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 541 6 757 33; x_wconf 43' lang='eng' dir='ltr'><em>~Psychromonas</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 767 6 936 33; x_wconf 88' lang='eng' dir='ltr'><em>macrocephali</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 944 6 1022 27; x_wconf 92' lang='eng' dir='ltr'><em>JAMM</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 1033 4 1108 27; x_wconf 85' lang='eng' dir='ltr'><em>0415T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1117 6 1266 33; x_wconf 75' lang='eng' dir='ltr'><em>(ABBO4806)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 539 16 541 95">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 539 16 541 95">
+     <span class='ocr_line' id='line_1_2' title="bbox 539 16 541 95; baseline 0 1117"><span class='ocrx_word' id='word_1_7' title='bbox 539 16 541 95; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 465 81 1236 110">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 465 81 1236 110">
+     <span class='ocr_line' id='line_1_3' title="bbox 465 81 1236 110; baseline 0.001 -6"><span class='ocrx_word' id='word_1_8' title='bbox 465 86 510 107; x_wconf 87' lang='eng'>810</span> <span class='ocrx_word' id='word_1_9' title='bbox 540 84 756 110; x_wconf 86' lang='eng' dir='ltr'><em>—Psychromonas</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 765 84 905 110; x_wconf 84' lang='eng' dir='ltr'><em>aquimarina</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 914 84 992 105; x_wconf 92' lang='eng' dir='ltr'><em>JAMM</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1003 81 1078 105; x_wconf 91' lang='eng' dir='ltr'><em>0404T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1088 84 1236 110; x_wconf 75' lang='eng' dir='ltr'><em>(ABSO4805)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 498 113 527 115">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 498 113 527 115">
+     <span class='ocr_line' id='line_1_4' title="bbox 498 113 527 115; baseline 0 1097"><span class='ocrx_word' id='word_1_14' title='bbox 498 113 527 115; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 525 56 528 172">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 525 56 528 172">
+     <span class='ocr_line' id='line_1_5' title="bbox 525 56 528 172; baseline 0 1040"><span class='ocrx_word' id='word_1_15' title='bbox 525 56 528 172; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 449 154 1257 188">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 449 154 1257 188">
+     <span class='ocr_line' id='line_1_6' title="bbox 449 154 1257 188; baseline 0 -6"><span class='ocrx_word' id='word_1_16' title='bbox 449 154 498 183; x_wconf 73' lang='eng'><em>552.</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 527 161 750 188; x_wconf 37' lang='eng' dir='ltr'><em>*Psychromonas</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 759 161 926 182; x_wconf 86' lang='eng' dir='ltr'><em>ossibalaenae</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 935 161 1013 182; x_wconf 90' lang='eng' dir='ltr'><em>JAMM</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1024 159 1099 182; x_wconf 81' lang='eng' dir='ltr'><em>0738T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1109 161 1257 188; x_wconf 90' lang='eng' dir='ltr'><em>(AB304808)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 497 113 500 252">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 497 113 500 252">
+     <span class='ocr_line' id='line_1_7' title="bbox 497 113 500 252; baseline 0 960"><span class='ocrx_word' id='word_1_22' title='bbox 497 113 500 252; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 432 226 477 247">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 432 226 477 247">
+     <span class='ocr_line' id='line_1_8' title="bbox 432 226 477 247; baseline 0 0"><span class='ocrx_word' id='word_1_23' title='bbox 432 226 477 247; x_wconf 91' lang='eng'><em>572</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 499 251 574 253">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 499 251 574 253">
+     <span class='ocr_line' id='line_1_9' title="bbox 499 251 574 253; baseline 0 959"><span class='ocrx_word' id='word_1_24' title='bbox 499 251 574 253; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 467 256 489 257">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 467 256 489 257">
+     <span class='ocr_line' id='line_1_10' title="bbox 467 256 489 257; baseline 0 955"><span class='ocrx_word' id='word_1_25' title='bbox 467 256 489 257; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 578 239 1083 268">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 578 239 1083 268">
+     <span class='ocr_line' id='line_1_11' title="bbox 578 239 1083 268; baseline 0 -6"><span class='ocrx_word' id='word_1_26' title='bbox 578 241 766 268; x_wconf 85' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 775 241 907 268; x_wconf 87' lang='eng' dir='ltr'><em>ingrahamii</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 915 239 958 262; x_wconf 79' lang='eng' dir='ltr'><em>37T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 967 241 1083 268; x_wconf 82' lang='eng' dir='ltr'><em>(U73721)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 487 180 490 330">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 487 180 490 330">
+     <span class='ocr_line' id='line_1_12' title="bbox 487 180 490 330; baseline 0 882"><span class='ocrx_word' id='word_1_30' title='bbox 487 180 490 330; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 399 302 444 323">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 399 302 444 323">
+     <span class='ocr_line' id='line_1_13' title="bbox 399 302 444 323; baseline -0.022 0"><span class='ocrx_word' id='word_1_31' title='bbox 399 302 444 323; x_wconf 81' lang='eng'><em>992</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 397 327 584 331">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 397 327 584 331">
+     <span class='ocr_line' id='line_1_14' title="bbox 397 327 584 331; baseline 0 881"><span class='ocrx_word' id='word_1_32' title='bbox 397 327 584 331; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 589 317 1202 346">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 589 317 1202 346">
+     <span class='ocr_line' id='line_1_15' title="bbox 589 317 1202 346; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 589 319 776 346; x_wconf 87' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 785 319 907 340; x_wconf 81' lang='eng' dir='ltr'><em>antarctica</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 919 319 977 340; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 990 317 1078 340; x_wconf 93' lang='eng' dir='ltr'><em>10704T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1089 319 1202 346; x_wconf 82' lang='eng' dir='ltr'><em>(Y14697)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 467 256 469 408">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 467 256 469 408">
+     <span class='ocr_line' id='line_1_16' title="bbox 467 256 469 408; baseline 0 804"><span class='ocrx_word' id='word_1_38' title='bbox 467 256 469 408; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 335 394 1299 579">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 335 394 1200 501">
+     <span class='ocr_line' id='line_1_17' title="bbox 335 394 1168 423; baseline 0 -5"><span class='ocrx_word' id='word_1_39' title='bbox 335 399 380 421; x_wconf 87' lang='eng'><em>598</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 468 397 835 423; x_wconf 25' lang='eng' dir='ltr'><em>*Psychromonasjaponica</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 846 397 924 418; x_wconf 92' lang='eng' dir='ltr'><em>JAMM</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 935 394 1009 418; x_wconf 78' lang='eng' dir='ltr'><em>0394T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1019 397 1168 423; x_wconf 83' lang='eng' dir='ltr'><em>(AB304804)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 550 472 1200 501; baseline -0.002 -5"><span class='ocrx_word' id='word_1_44' title='bbox 550 474 754 501; x_wconf 87' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 763 474 924 501; x_wconf 86' lang='eng' dir='ltr'><em>agarivorans</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 932 472 1037 496; x_wconf 87' lang='eng' dir='ltr'><em>J42-3AT</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1046 474 1200 501; x_wconf 75' lang='eng' dir='ltr'><em>(ABs74544)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 400 532 1299 579">
+     <span class='ocr_line' id='line_1_19' title="bbox 400 532 838 556; baseline 0.007 -3"><span class='ocrx_word' id='word_1_48' title='bbox 400 532 460 553; x_wconf 82' lang='eng'>1000</span> <span class='ocrx_word' id='word_1_49' title='bbox 834 552 838 556; x_wconf 98' lang='eng'>.</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 557 552 1299 579; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 557 552 761 579; x_wconf 87' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 769 557 930 579; x_wconf 86' lang='eng' dir='ltr'><em>agarlvorans</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 939 552 1136 573; x_wconf 90' lang='eng' dir='ltr'><em>04OZ-AS15-7A</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1146 552 1299 579; x_wconf 87' lang='eng' dir='ltr'><em>(AB374545)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 319 625 991 659">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 319 625 991 659">
+     <span class='ocr_line' id='line_1_21' title="bbox 319 625 991 659; baseline 0 -6"><span class='ocrx_word' id='word_1_54' title='bbox 319 625 366 656; x_wconf 54' lang='eng'><em>58%</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 472 632 660 659; x_wconf 86' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 669 632 754 654; x_wconf 83' lang='eng' dir='ltr'><em>marina</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 763 630 832 653; x_wconf 86' lang='eng' dir='ltr'><em>4—22T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 842 632 991 659; x_wconf 85' lang='eng' dir='ltr'><em>(AB023378)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 366 427 398 428">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 366 427 398 428">
+     <span class='ocr_line' id='line_1_22' title="bbox 366 427 398 428; baseline 0 784"><span class='ocrx_word' id='word_1_59' title='bbox 366 427 398 428; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 397 331 399 526">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 397 331 399 526">
+     <span class='ocr_line' id='line_1_23' title="bbox 397 331 399 526; baseline 0 686"><span class='ocrx_word' id='word_1_60' title='bbox 397 331 399 526; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 408 708 1026 737">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 408 708 1026 737">
+     <span class='ocr_line' id='line_1_24' title="bbox 408 708 1026 737; baseline 0 -6"><span class='ocrx_word' id='word_1_61' title='bbox 408 710 453 731; x_wconf 86' lang='eng'><em>998</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 481 710 669 737; x_wconf 86' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 676 710 788 737; x_wconf 88' lang='eng' dir='ltr'><em>profunda</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 797 708 872 731; x_wconf 81' lang='eng' dir='ltr'><em>2825T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 882 710 1026 737; x_wconf 87' lang='eng' dir='ltr'><em>(AJ416756)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 471 785 1038 814">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 471 785 1038 814">
+     <span class='ocr_line' id='line_1_25' title="bbox 471 785 1038 814; baseline 0 -5"><span class='ocrx_word' id='word_1_66' title='bbox 471 788 659 814; x_wconf 87' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 668 788 764 809; x_wconf 82' lang='eng' dir='ltr'><em>Kaikoae</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 773 785 880 809; x_wconf 82' lang='eng' dir='ltr'><em>JT7304T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 890 788 1038 814; x_wconf 84' lang='eng' dir='ltr'><em>(AB052160)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 387 808 407 809">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 387 808 407 809">
+     <span class='ocr_line' id='line_1_26' title="bbox 387 808 407 809; baseline 0 403"><span class='ocrx_word' id='word_1_70' title='bbox 387 808 407 809; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 133 815 192 836">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 133 815 192 836">
+     <span class='ocr_line' id='line_1_27' title="bbox 133 815 192 836; baseline 0 0"><span class='ocrx_word' id='word_1_71' title='bbox 133 815 192 836; x_wconf 81' lang='eng'>1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 129 842 355 844">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 129 842 355 844">
+     <span class='ocr_line' id='line_1_28' title="bbox 129 842 355 844; baseline 0 368"><span class='ocrx_word' id='word_1_72' title='bbox 129 842 355 844; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 5 975 131 978">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 5 975 131 978">
+     <span class='ocr_line' id='line_1_29' title="bbox 5 975 131 978; baseline 0 234"><span class='ocrx_word' id='word_1_73' title='bbox 5 975 131 978; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 5 975 7 1190">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 5 975 7 1190">
+     <span class='ocr_line' id='line_1_30' title="bbox 5 975 7 1190; baseline 0 22"><span class='ocrx_word' id='word_1_74' title='bbox 5 975 7 1190; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 366 427 368 881">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 366 427 368 881">
+     <span class='ocr_line' id='line_1_31' title="bbox 366 427 368 881; baseline 0 331"><span class='ocrx_word' id='word_1_75' title='bbox 366 427 368 881; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 406 740 408 877">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 406 740 408 877">
+     <span class='ocr_line' id='line_1_32' title="bbox 406 740 408 877; baseline 0 335"><span class='ocrx_word' id='word_1_76' title='bbox 406 740 408 877; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 407 875 508 877">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 407 875 508 877">
+     <span class='ocr_line' id='line_1_33' title="bbox 407 875 508 877; baseline 0 335"><span class='ocrx_word' id='word_1_77' title='bbox 407 875 508 877; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 366 880 389 882">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 366 880 389 882">
+     <span class='ocr_line' id='line_1_34' title="bbox 366 880 389 882; baseline 0 330"><span class='ocrx_word' id='word_1_78' title='bbox 366 880 389 882; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 511 863 1124 892">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 511 863 1124 892">
+     <span class='ocr_line' id='line_1_35' title="bbox 511 863 1124 892; baseline 0.002 -6"><span class='ocrx_word' id='word_1_79' title='bbox 511 865 699 892; x_wconf 82' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 707 865 819 887; x_wconf 85' lang='eng' dir='ltr'><em>heitensis</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 827 863 966 887; x_wconf 76' lang='eng' dir='ltr'><em>AK‘15-027T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 976 865 1124 892; x_wconf 81' lang='eng' dir='ltr'><em>(AB365352)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 387 807 390 955">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 387 807 390 955">
+     <span class='ocr_line' id='line_1_36' title="bbox 387 807 390 955; baseline 0 257"><span class='ocrx_word' id='word_1_83' title='bbox 387 807 390 955; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 524 941 1061 970">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 524 941 1061 970">
+     <span class='ocr_line' id='line_1_37' title="bbox 524 941 1061 970; baseline -0.002 -5"><span class='ocrx_word' id='word_1_84' title='bbox 524 944 712 970; x_wconf 87' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 721 944 810 965; x_wconf 85' lang='eng' dir='ltr'><em>hadalis</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 820 944 863 964; x_wconf 88' lang='eng' dir='ltr'>K41</span> <span class='ocrx_word' id='word_1_87' title='bbox 870 941 903 965; x_wconf 92' lang='eng' dir='ltr'><em>GT</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 913 944 1061 970; x_wconf 79' lang='eng' dir='ltr'><em>(ABOQ4413)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 354 654 356 1034">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 354 654 356 1034">
+     <span class='ocr_line' id='line_1_38' title="bbox 354 654 356 1034; baseline 0 178"><span class='ocrx_word' id='word_1_89' title='bbox 354 654 356 1034; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 485 1021 1037 1050">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 485 1021 1037 1050">
+     <span class='ocr_line' id='line_1_39' title="bbox 485 1021 1037 1050; baseline 0 -6"><span class='ocrx_word' id='word_1_90' title='bbox 485 1023 673 1050; x_wconf 86' lang='eng' dir='ltr'><em>Psychromonas</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 682 1023 764 1044; x_wconf 81' lang='eng' dir='ltr'><em>arctica</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 775 1023 819 1044; x_wconf 94' lang='eng' dir='ltr'>Pull</span> <span class='ocrx_word' id='word_1_93' title='bbox 830 1021 881 1044; x_wconf 92' lang='eng' dir='ltr'><em>5.3T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 890 1023 1037 1050; x_wconf 83' lang='eng' dir='ltr'><em>(AF374385)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 129 842 132 1112">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 129 842 132 1112">
+     <span class='ocr_line' id='line_1_40' title="bbox 129 842 132 1112; baseline 0 100"><span class='ocrx_word' id='word_1_95' title='bbox 129 842 132 1112; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 513 1098 1142 1128">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 513 1098 1142 1128">
+     <span class='ocr_line' id='line_1_41' title="bbox 513 1098 1142 1128; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 513 1101 711 1122; x_wconf 88' lang='eng' dir='ltr'><em>Thalassomonas</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 721 1101 818 1122; x_wconf 88' lang='eng' dir='ltr'><em>viridans</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 828 1101 887 1122; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 900 1098 988 1122; x_wconf 87' lang='eng' dir='ltr'><em>13754T</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 998 1101 1142 1128; x_wconf 87' lang='eng' dir='ltr'><em>(AJ294748)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 5 1188 527 1190">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 5 1188 527 1190">
+     <span class='ocr_line' id='line_1_42' title="bbox 5 1188 527 1190; baseline 0 22"><span class='ocrx_word' id='word_1_101' title='bbox 5 1188 527 1190; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 531 1176 1037 1206">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 531 1176 1037 1206">
+     <span class='ocr_line' id='line_1_43' title="bbox 531 1176 1037 1206; baseline 0 -7"><span class='ocrx_word' id='word_1_102' title='bbox 531 1178 676 1200; x_wconf 85' lang='eng' dir='ltr'><em>Escherichia</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 687 1178 730 1200; x_wconf 83' lang='eng' dir='ltr'><em>coli</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 736 1178 813 1200; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 825 1176 914 1200; x_wconf 88' lang='eng' dir='ltr'><em>11775T</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 923 1178 1037 1206; x_wconf 86' lang='eng' dir='ltr'><em>(X80725)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003251-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003251-0-000.pbm.png
new file mode 100644
index 00000000..6da90d08
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003251-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003251-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003251-0-000.pbm.png.hocr
new file mode 100644
index 00000000..5875ec7f
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003251-0-000.pbm.png.hocr
@@ -0,0 +1,147 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003251-0-000.pbm.png"; bbox 0 0 1124 1013; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 197 5 1119 1008">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 287 5 1119 540">
+     <span class='ocr_line' id='line_1_1' title="bbox 287 5 964 33; baseline 0.001 -7"><span class='ocrx_word' id='word_1_1' title='bbox 287 7 324 26; x_wconf 78' lang='eng'><em>97*</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 415 5 579 27; x_wconf 77' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 589 6 706 27; x_wconf 84' lang='eng' dir='ltr'><em>iranensis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 716 5 794 28; x_wconf 89' lang='eng' dir='ltr'><em>QW6T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 804 5 964 33; x_wconf 87' lang='eng' dir='ltr'>(DQ767692)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 412 44 998 71; baseline 0 -5"><span class='ocrx_word' id='word_1_6' title='bbox 412 44 575 66; x_wconf 84' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 585 44 663 66; x_wconf 82' lang='eng' dir='ltr'><em>Iuteus</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 672 44 722 66; x_wconf 92' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 734 44 827 66; x_wconf 90' lang='eng' dir='ltr'><em>70202T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 838 44 998 71; x_wconf 89' lang='eng' dir='ltr'><em>(DQ352839)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 339 83 891 111; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 339 83 502 105; x_wconf 85' lang='eng' dir='ltr'><em>Sa/inicoccus</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 512 89 600 105; x_wconf 87' lang='eng' dir='ltr'><em>rcseus</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 611 83 672 105; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 685 83 761 105; x_wconf 91' lang='eng' dir='ltr'><em>5351T</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 771 83 891 111; x_wconf 85' lang='eng' dir='ltr'>(X94559)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 357 122 996 149; baseline 0 -5"><span class='ocrx_word' id='word_1_16' title='bbox 357 122 520 144; x_wconf 85' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 529 122 669 149; x_wconf 86' lang='eng' dir='ltr'><em>hispanicus</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 680 122 741 144; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 753 122 830 144; x_wconf 90' lang='eng' dir='ltr'><em>5352T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 840 122 996 149; x_wconf 85' lang='eng' dir='ltr'><em>(AY028927)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 365 161 939 188; baseline 0 -5"><span class='ocrx_word' id='word_1_21' title='bbox 365 161 528 183; x_wconf 84' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 537 161 669 183; x_wconf 86' lang='eng' dir='ltr'><em>siamensis</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 679 161 772 183; x_wconf 93' lang='eng' dir='ltr'><em>PN1—2T</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 783 161 939 188; x_wconf 80' lang='eng' dir='ltr'><em>(A8258358)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 359 200 907 227; baseline 0 -5"><span class='ocrx_word' id='word_1_25' title='bbox 359 200 523 222; x_wconf 83' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 532 200 656 222; x_wconf 86' lang='eng' dir='ltr'><em>sa/siraiae</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 668 200 736 221; x_wconf 65' lang='eng' dir='ltr'><em>F€H1T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 746 200 907 227; x_wconf 78' lang='eng'>(00333949)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 355 239 930 266; baseline 0 -5"><span class='ocrx_word' id='word_1_29' title='bbox 355 239 519 261; x_wconf 86' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 524 239 623 266; x_wconf 86' lang='eng' dir='ltr'><em>jeotgali</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 632 239 759 261; x_wconf 78' lang='eng' dir='ltr'><em>82R53—5T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 769 239 930 266; x_wconf 85' lang='eng' dir='ltr'>(DQ471329)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 346 277 883 306; baseline -0.002 -6"><span class='ocrx_word' id='word_1_33' title='bbox 346 277 510 300; x_wconf 85' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 519 278 664 306; x_wconf 82' lang='eng' dir='ltr'><em>alkaliphilus</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 673 278 718 300; x_wconf 93' lang='eng' dir='ltr'><em>T8T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 729 278 883 306; x_wconf 91' lang='eng' dir='ltr'>(AF275710)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 334 317 993 345; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 334 317 497 339; x_wconf 83' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 507 318 688 345; x_wconf 77' lang='eng' dir='ltr'><em>kunmingensis</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 697 318 746 339; x_wconf 92' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 758 318 821 339; x_wconf 91' lang='eng' dir='ltr'><em>Y15T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 832 317 993 345; x_wconf 81' lang='eng' dir='ltr'>(DQB37380)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 395 356 960 383; baseline 0 -5"><span class='ocrx_word' id='word_1_42' title='bbox 395 356 576 378; x_wconf 86' lang='eng' dir='ltr'><em>Salinicoccus</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 586 356 662 378; x_wconf 87' lang='eng' dir='ltr'><em>albus</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 671 356 798 378; x_wconf 92' lang='eng' dir='ltr'><em>YIM-Y21T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 805 356 960 383; x_wconf 85' lang='eng' dir='ltr'>(EF177692)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 346 395 1012 423; baseline 0 -6"><span class='ocrx_word' id='word_1_46' title='bbox 346 395 540 423; x_wconf 84' lang='eng' dir='ltr'><em>Jeotgalicoccus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 550 395 711 417; x_wconf 87' lang='eng' dir='ltr'><em>ha/oto/erans</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 720 395 846 417; x_wconf 86' lang='eng' dir='ltr'><em>YKJ-1O1T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 856 395 1012 423; x_wconf 86' lang='eng' dir='ltr'><em>(AY028925)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 358 434 1044 461; baseline -0.001 -5"><span class='ocrx_word' id='word_1_50' title='bbox 358 434 552 461; x_wconf 84' lang='eng' dir='ltr'><em>Jeotga/icoccus</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 561 434 744 461; x_wconf 87' lang='eng' dir='ltr'><em>psychrophi/us</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 753 434 877 456; x_wconf 81' lang='eng' dir='ltr'><em>YKJ—115T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 888 434 1044 461; x_wconf 85' lang='eng' dir='ltr'>(AY028926)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 392 473 1119 500; baseline 0 -5"><span class='ocrx_word' id='word_1_54' title='bbox 392 473 587 500; x_wconf 85' lang='eng' dir='ltr'><em>Jeotga/icoccus</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 596 473 760 500; x_wconf 84' lang='eng' dir='ltr'><em>pinnipedia/is</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 770 473 854 495; x_wconf 91' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_57' title='bbox 865 473 959 495; x_wconf 91' lang='eng' dir='ltr'><em>42722T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 969 473 1119 500; x_wconf 83' lang='eng' dir='ltr'>(AJ251530)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 292 512 877 540; baseline 0 -6"><span class='ocrx_word' id='word_1_59' title='bbox 292 512 465 534; x_wconf 89' lang='eng' dir='ltr'><em>Macrococcus</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 475 512 640 534; x_wconf 86' lang='eng' dir='ltr'><em>carouselicus</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 650 512 747 534; x_wconf 87' lang='eng' dir='ltr'>H8b16T</span> <span class='ocrx_word' id='word_1_62' title='bbox 758 512 877 540; x_wconf 91' lang='eng' dir='ltr'>(Y15713)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 197 546 1050 1008">
+     <span class='ocr_line' id='line_1_15' title="bbox 226 546 893 584; baseline 0 -11"><span class='ocrx_word' id='word_1_63' title='bbox 226 546 253 584; x_wconf 68' lang='eng' dir='ltr'><em>9f</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 288 552 462 573; x_wconf 84' lang='eng' dir='ltr'><em>Macrococcus</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 472 552 571 573; x_wconf 88' lang='eng' dir='ltr'><em>bovicus</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 580 551 659 573; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 670 552 763 573; x_wconf 84' lang='eng' dir='ltr'><em>51825T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 774 552 893 579; x_wconf 94' lang='eng' dir='ltr'>(Y15714)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 197 577 901 618; baseline -0.001 -5"><span class='ocrx_word' id='word_1_69' title='bbox 197 577 237 595; x_wconf 60' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 296 590 469 613; x_wconf 82' lang='eng' dir='ltr'><em>Macrococcus</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 479 590 558 613; x_wconf 87' lang='eng' dir='ltr'><em>lamae</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 570 590 630 613; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 641 590 735 613; x_wconf 77' lang='eng' dir='ltr'><em>21713T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 745 590 901 618; x_wconf 87' lang='eng' dir='ltr'>(AY119687)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 316 630 983 657; baseline -0.001 -5"><span class='ocrx_word' id='word_1_75' title='bbox 316 630 489 652; x_wconf 87' lang='eng' dir='ltr'><em>Macrococcus</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 499 630 661 657; x_wconf 86' lang='eng' dir='ltr'><em>caseolyticus</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 669 630 748 652; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 762 630 853 652; x_wconf 87' lang='eng' dir='ltr'><em>13548T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 863 630 983 657; x_wconf 92' lang='eng' dir='ltr'>(Y15711)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 336 668 1050 696; baseline 0 -6"><span class='ocrx_word' id='word_1_80' title='bbox 336 668 543 696; x_wconf 85' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 552 668 760 696; x_wconf 83' lang='eng' dir='ltr'><em>piscifermentans</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 771 668 832 690; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 845 669 921 690; x_wconf 76' lang='eng' dir='ltr'><em>7373T</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 932 669 1050 696; x_wconf 91' lang='eng' dir='ltr'>(Y15754)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 335 707 1032 735; baseline -0.001 -5"><span class='ocrx_word' id='word_1_85' title='bbox 335 707 542 735; x_wconf 83' lang='eng' dir='ltr'><em>Staphylococcus</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 552 708 693 735; x_wconf 86' lang='eng' dir='ltr'><em>nepalensis</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 704 707 766 730; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 779 708 871 730; x_wconf 90' lang='eng' dir='ltr'><em>15150T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 882 708 1032 735; x_wconf 91' lang='eng' dir='ltr'>(AJ517414)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 340 746 998 774; baseline 0 -6"><span class='ocrx_word' id='word_1_90' title='bbox 340 746 548 768; x_wconf 85' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 557 747 739 774; x_wconf 82' lang='eng' dir='ltr'><em>pleistocenium</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 750 747 834 768; x_wconf 91' lang='eng' dir='ltr'><em>FTR1T</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 844 747 998 774; x_wconf 89' lang='eng' dir='ltr'>(AF450136)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 344 785 1000 813; baseline 0 -5"><span class='ocrx_word' id='word_1_94' title='bbox 344 786 524 808; x_wconf 82' lang='eng' dir='ltr'><em>Enterococcus</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 534 785 636 808; x_wconf 86' lang='eng' dir='ltr'><em>faecium</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 645 785 724 808; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 737 786 828 808; x_wconf 86' lang='eng' dir='ltr'><em>19434T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 839 785 1000 813; x_wconf 92' lang='eng' dir='ltr'>(DQ411813)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 347 824 987 852; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 347 824 526 846; x_wconf 82' lang='eng' dir='ltr'><em>Enterococcus</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 536 824 633 846; x_wconf 81' lang='eng' dir='ltr'><em>mundtii</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 640 824 719 846; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 729 824 823 846; x_wconf 80' lang='eng' dir='ltr'><em>43186T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 833 824 987 852; x_wconf 88' lang='eng' dir='ltr'>(AF061013)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 312 863 934 891; baseline 0 -6"><span class='ocrx_word' id='word_1_104' title='bbox 312 864 471 885; x_wconf 82' lang='eng' dir='ltr'><em>Halobaci/Ius</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 480 864 614 891; x_wconf 86' lang='eng' dir='ltr'><em>ha/ophilus</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 625 863 716 885; x_wconf 90' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 727 864 804 885; x_wconf 78' lang='eng' dir='ltr'><em>2269T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 814 864 934 891; x_wconf 87' lang='eng' dir='ltr'>(X62174)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 346 902 916 930; baseline 0 -5"><span class='ocrx_word' id='word_1_109' title='bbox 346 903 528 925; x_wconf 86' lang='eng' dir='ltr'><em>Marinococcus</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 538 903 608 925; x_wconf 86' lang='eng' dir='ltr'><em>albus</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 619 902 680 925; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 692 903 786 925; x_wconf 80' lang='eng' dir='ltr'><em>20748T</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 796 903 916 930; x_wconf 87' lang='eng' dir='ltr'>(X90834)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 411 942 1044 969; baseline 0.002 -6"><span class='ocrx_word' id='word_1_114' title='bbox 411 942 593 964; x_wconf 84' lang='eng' dir='ltr'><em>Marinococcus</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 603 942 737 969; x_wconf 84' lang='eng' dir='ltr'><em>halophilus</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 747 942 808 964; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_117' title='bbox 820 942 914 964; x_wconf 85' lang='eng' dir='ltr'>20408T</span> <span class='ocrx_word' id='word_1_118' title='bbox 924 942 1044 969; x_wconf 87' lang='eng' dir='ltr'>(X90835)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 422 981 1017 1008; baseline 0 -5"><span class='ocrx_word' id='word_1_119' title='bbox 422 981 612 1003; x_wconf 84' lang='eng' dir='ltr'><em>Nesterenkonia</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 622 981 685 1003; x_wconf 88' lang='eng' dir='ltr'><em>Iutea</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 695 981 745 1002; x_wconf 93' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 757 981 850 1003; x_wconf 85' lang='eng' dir='ltr'><em>70081T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 861 981 1017 1008; x_wconf 90' lang='eng' dir='ltr'><em>(AY588278)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 11 416 994">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 0 11 416 994">
+     <span class='ocr_line' id='line_1_27' title="bbox 271 11 411 84; baseline 0 -15"><span class='ocrx_word' id='word_1_124' title='bbox 271 11 411 84; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 263 84 339 125; baseline 0 888"><span class='ocrx_word' id='word_1_125' title='bbox 263 84 339 125; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 263 125 364 201; baseline 0 -14"><span class='ocrx_word' id='word_1_126' title='bbox 263 125 364 201; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 240 201 353 279; baseline 0 -16"><span class='ocrx_word' id='word_1_127' title='bbox 240 201 353 279; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 207 279 341 320; baseline 0 0"><span class='ocrx_word' id='word_1_128' title='bbox 207 279 341 320; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 158 320 388 396; baseline 0 0"><span class='ocrx_word' id='word_1_129' title='bbox 158 320 388 396; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 158 396 344 437; baseline 0 576"><span class='ocrx_word' id='word_1_130' title='bbox 158 396 344 437; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 158 437 383 513; baseline 0 -39"><span class='ocrx_word' id='word_1_131' title='bbox 158 437 383 513; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 93 513 296 632; baseline 0 0"><span class='ocrx_word' id='word_1_132' title='bbox 93 513 296 632; x_wconf 95' lang='eng' dir='ltr'><em>     </em></span> <span class='ocrx_word' id='word_1_133' title='bbox 247 595 291 604; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 93 632 316 670; baseline 0 343"><span class='ocrx_word' id='word_1_134' title='bbox 93 632 316 670; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 93 670 331 710; baseline 0 303"><span class='ocrx_word' id='word_1_135' title='bbox 93 670 331 710; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 0 710 335 749; baseline 0 264"><span class='ocrx_word' id='word_1_136' title='bbox 0 710 335 749; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 0 749 340 788; baseline 0 225"><span class='ocrx_word' id='word_1_137' title='bbox 0 749 340 788; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 0 788 340 827; baseline 0 186"><span class='ocrx_word' id='word_1_138' title='bbox 0 788 340 827; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 0 827 343 866; baseline 0 0"><span class='ocrx_word' id='word_1_139' title='bbox 0 827 343 866; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 0 866 312 905; baseline 0 108"><span class='ocrx_word' id='word_1_140' title='bbox 0 866 312 905; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 0 905 346 944; baseline 0 69"><span class='ocrx_word' id='word_1_141' title='bbox 0 905 346 944; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 0 944 416 994; baseline 0 0"><span class='ocrx_word' id='word_1_142' title='bbox 0 944 416 994; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 262 67 288 85">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 262 67 288 85">
+     <span class='ocr_line' id='line_1_45' title="bbox 262 67 288 85; baseline 0 0"><span class='ocrx_word' id='word_1_143' title='bbox 262 67 288 85; x_wconf 87' lang='eng'>56</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 86 134 261 210">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 86 134 261 210">
+     <span class='ocr_line' id='line_1_46' title="bbox 86 134 133 152; baseline 0 0"><span class='ocrx_word' id='word_1_144' title='bbox 86 134 133 152; x_wconf 75' lang='eng'><em>002</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 237 192 261 210; baseline 0 0"><span class='ocrx_word' id='word_1_145' title='bbox 237 192 261 210; x_wconf 89' lang='eng'>71</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 222 248 248 266">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 222 248 248 266">
+     <span class='ocr_line' id='line_1_48' title="bbox 222 248 248 266; baseline 0 0"><span class='ocrx_word' id='word_1_146' title='bbox 222 248 248 266; x_wconf 89' lang='eng'><em>50</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 157 361 207 380">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 157 361 207 380">
+     <span class='ocr_line' id='line_1_49' title="bbox 157 361 207 380; baseline 0 0"><span class='ocrx_word' id='word_1_147' title='bbox 157 361 207 380; x_wconf 85' lang='eng'><em>100*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 121 493 158 512">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 121 493 158 512">
+     <span class='ocr_line' id='line_1_50' title="bbox 121 493 158 512; baseline 0 0"><span class='ocrx_word' id='word_1_148' title='bbox 121 493 158 512; x_wconf 73' lang='eng'><em>98&quot;</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003269-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003269-0-000.pbm.png
new file mode 100644
index 00000000..57399da8
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003269-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003269-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003269-0-000.pbm.png.hocr
new file mode 100644
index 00000000..8242dd85
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003269-0-000.pbm.png.hocr
@@ -0,0 +1,136 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003269-0-000.pbm.png"; bbox 0 0 1302 1389; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 26 74 295 127">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 26 74 295 127">
+     <span class='ocr_line' id='line_1_1' title="bbox 244 74 295 93; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 244 74 295 93; x_wconf 82' lang='eng'>100*</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 26 108 71 127; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 26 108 71 127; x_wconf 91' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 185 158 211 178">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 185 158 211 178">
+     <span class='ocr_line' id='line_1_3' title="bbox 185 158 211 178; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 185 158 211 178; x_wconf 85' lang='eng'>59</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 308 238 360 258">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 308 238 360 258">
+     <span class='ocr_line' id='line_1_4' title="bbox 308 238 360 258; baseline 0.019 -1"><span class='ocrx_word' id='word_1_4' title='bbox 308 238 360 258; x_wconf 74' lang='eng'>100*</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 159 305 186 325">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 159 305 186 325">
+     <span class='ocr_line' id='line_1_5' title="bbox 159 305 186 325; baseline 0.037 -1"><span class='ocrx_word' id='word_1_5' title='bbox 159 305 186 325; x_wconf 85' lang='eng'>73</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 111 494 149 513">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 111 494 149 513">
+     <span class='ocr_line' id='line_1_6' title="bbox 111 494 149 513; baseline -0.026 0"><span class='ocrx_word' id='word_1_6' title='bbox 111 494 149 513; x_wconf 66' lang='eng'><em>62*</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 93 685 318 758">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 93 685 318 758">
+     <span class='ocr_line' id='line_1_7' title="bbox 172 685 210 705; baseline -0.026 0"><span class='ocrx_word' id='word_1_7' title='bbox 172 685 210 705; x_wconf 74' lang='eng'>94*</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 93 713 130 732; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 93 713 130 732; x_wconf 67' lang='eng'><em>98*</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 267 739 318 758; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 267 739 318 758; x_wconf 68' lang='eng'>100*</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 24 883 332 957">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 24 883 332 957">
+     <span class='ocr_line' id='line_1_10' title="bbox 295 883 332 902; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 295 883 332 902; x_wconf 75' lang='eng'>99*</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 24 937 249 957; baseline 0.004 -1"><span class='ocrx_word' id='word_1_11' title='bbox 24 937 36 956; x_wconf 89' lang='eng' dir='ltr'>P</span> <span class='ocrx_word' id='word_1_12' title='bbox 198 938 249 957; x_wconf 69' lang='eng'>100‘</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 78 1097 189 1191">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 78 1097 189 1191">
+     <span class='ocr_line' id='line_1_12' title="bbox 151 1097 189 1116; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 151 1097 189 1116; x_wconf 77' lang='eng'>99*</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 78 1167 120 1191; baseline 0 -4"><span class='ocrx_word' id='word_1_14' title='bbox 78 1167 120 1191; x_wconf 83' lang='eng' dir='ltr'>99p</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 156 1239 198 1263">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 156 1239 198 1263">
+     <span class='ocr_line' id='line_1_14' title="bbox 156 1239 198 1263; baseline 0 -5"><span class='ocrx_word' id='word_1_15' title='bbox 156 1239 198 1263; x_wconf 84' lang='eng' dir='ltr'><em>98p</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 358 0 1245 401">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 358 0 1245 401">
+     <span class='ocr_line' id='line_1_15' title="bbox 358 0 1231 41; baseline 0 -16"><span class='ocrx_word' id='word_1_16' title='bbox 358 22 409 41; x_wconf 54' lang='eng'><em>100,</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 534 3 740 30; x_wconf 84' lang='eng' dir='ltr'><em>Salegentibacter</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 746 3 903 25; x_wconf 83' lang='eng' dir='ltr'><em>mishustinae</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 914 3 979 24; x_wconf 92' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 990 0 1067 25; x_wconf 81' lang='eng' dir='ltr'><em>6049T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1077 3 1231 30; x_wconf 80' lang='eng' dir='ltr'><em>(AY576653)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 512 70 1123 100; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 512 72 719 100; x_wconf 79' lang='eng' dir='ltr'><em>Salegentibacter</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 725 72 842 100; x_wconf 85' lang='eng' dir='ltr'><em>salegens</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 851 72 934 94; x_wconf 90' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 945 70 990 94; x_wconf 90' lang='eng' dir='ltr'><em>48T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1000 72 1123 100; x_wconf 90' lang='eng' dir='ltr'>(M92279)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 510 141 1060 172; baseline 0 -6"><span class='ocrx_word' id='word_1_27' title='bbox 510 144 717 171; x_wconf 85' lang='eng' dir='ltr'><em>Salegentibacter</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 724 144 800 166; x_wconf 89' lang='eng' dir='ltr'><em>ﬂavus</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 810 144 841 172; x_wconf 89' lang='eng' dir='ltr'><em>Fg</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 851 141 896 166; x_wconf 89' lang='eng' dir='ltr'><em>69T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 906 144 1060 171; x_wconf 89' lang='eng' dir='ltr'>(AY682200)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 550 214 1068 244; baseline 0.002 -6"><span class='ocrx_word' id='word_1_32' title='bbox 550 217 660 239; x_wconf 83' lang='eng' dir='ltr'><em>Mesonia</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 671 217 741 244; x_wconf 85' lang='eng' dir='ltr'><em>algae</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 752 217 816 238; x_wconf 93' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 829 214 905 239; x_wconf 89' lang='eng' dir='ltr'><em>3909T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 916 217 1068 244; x_wconf 83' lang='eng' dir='ltr'><em>(AF536383)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 521 285 1065 316; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 521 288 631 310; x_wconf 87' lang='eng' dir='ltr'><em>Mesonia</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 641 288 733 310; x_wconf 80' lang='eng' dir='ltr'><em>mob/[is</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 743 288 807 310; x_wconf 91' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 819 285 896 310; x_wconf 87' lang='eng' dir='ltr'><em>6059T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 907 288 1065 316; x_wconf 87' lang='eng' dir='ltr'>(DQ367409)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 433 357 1245 401; baseline -0.001 -19"><span class='ocrx_word' id='word_1_42' title='bbox 433 382 471 401; x_wconf 38' lang='eng'><em>96*</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 580 360 781 388; x_wconf 87' lang='eng' dir='ltr'><em>Psychroflexus</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 790 360 926 382; x_wconf 87' lang='eng' dir='ltr'><em>sediminis</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 934 357 1079 382; x_wconf 78' lang='eng' dir='ltr'><em>YlM-C238T</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1089 360 1136 387; x_wconf 96' lang='eng' dir='ltr'><em>(EU</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1141 360 1150 381; x_wconf 98' lang='eng'>1</span> <span class='ocrx_word' id='word_1_48' title='bbox 1156 360 1216 382; x_wconf 87' lang='eng'><strong>3571</strong></span> <span class='ocrx_word' id='word_1_49' title='bbox 1222 360 1245 387; x_wconf 93' lang='eng'><strong>5)</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 374 428 1302 472">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 374 428 1302 472">
+     <span class='ocr_line' id='line_1_21' title="bbox 374 428 1302 472; baseline 0 -19"><span class='ocrx_word' id='word_1_50' title='bbox 374 453 381 472; x_wconf 64' lang='eng'>1</span> <span class='ocrx_word' id='word_1_51' title='bbox 387 453 425 472; x_wconf 54' lang='eng'><em>00*</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 616 431 799 458; x_wconf 85' lang='eng' dir='ltr'><em>Psychroﬂexus</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 809 431 911 458; x_wconf 84' lang='eng' dir='ltr'><em>tropicus</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 920 431 999 453; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 1011 428 1139 453; x_wconf 89' lang='eng' dir='ltr'><em>BAA-734T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 1150 431 1302 458; x_wconf 84' lang='eng' dir='ltr'>(AF513434)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 353 502 1263 1320">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 353 502 1263 1320">
+     <span class='ocr_line' id='line_1_22' title="bbox 471 502 1263 543; baseline 0 -17"><span class='ocrx_word' id='word_1_57' title='bbox 471 524 522 543; x_wconf 57' lang='eng'><em>100*</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 599 504 782 532; x_wconf 82' lang='eng' dir='ltr'><em>Psychroﬂexus</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 791 505 980 532; x_wconf 86' lang='eng' dir='ltr'><em>gondwanensis</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 989 504 1072 526; x_wconf 93' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 1084 502 1129 526; x_wconf 93' lang='eng' dir='ltr'><em>44T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1140 505 1263 532; x_wconf 89' lang='eng' dir='ltr'>(M92278)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 527 552 1211 604; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 527 552 821 604; x_wconf 77' lang='eng' dir='ltr'><em>|—Psychroﬂexus</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 830 576 918 604; x_wconf 81' lang='eng' dir='ltr'><em>torquis</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 926 576 1009 598; x_wconf 90' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 1021 574 1081 598; x_wconf 81' lang='eng' dir='ltr'><em>623T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 1092 576 1211 604; x_wconf 88' lang='eng' dir='ltr'><em>(U85881)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 439 646 990 676; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 439 648 645 670; x_wconf 86' lang='eng' dir='ltr'><em>Salinimicrobium</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 656 648 742 670; x_wconf 84' lang='eng' dir='ltr'><em>catena</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 754 646 820 670; x_wconf 78' lang='eng' dir='ltr'><em>HY’lT</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 831 648 990 676; x_wconf 87' lang='eng' dir='ltr'>(DQ640642)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 443 718 1186 748; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 443 720 649 742; x_wconf 85' lang='eng' dir='ltr'><em>Salinimicrobium</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 659 720 823 748; x_wconf 86' lang='eng' dir='ltr'><em>Xinjiangense</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 838 720 914 742; x_wconf 89' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 930 718 1021 742; x_wconf 90' lang='eng' dir='ltr'><em>12883T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1034 720 1186 748; x_wconf 90' lang='eng' dir='ltr'>(EF520007)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 443 789 1055 819; baseline 0.002 -6"><span class='ocrx_word' id='word_1_77' title='bbox 443 791 649 814; x_wconf 86' lang='eng' dir='ltr'><em>Salinimicrobium</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 660 793 734 814; x_wconf 81' lang='eng' dir='ltr'><em>terrae</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 744 789 888 814; x_wconf 79' lang='eng' dir='ltr'><em>YIM—C338T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 899 792 1055 819; x_wconf 88' lang='eng' dir='ltr'><em>(EU135614)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 443 859 1069 889; baseline 0.002 -6"><span class='ocrx_word' id='word_1_81' title='bbox 443 862 526 884; x_wconf 87' lang='eng' dir='ltr'><em>Gi/Iisia</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 536 862 713 884; x_wconf 77' lang='eng' dir='ltr'><em>mitskevichiae</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 724 862 801 884; x_wconf 86' lang='eng' dir='ltr'><em>KCTC</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 814 859 904 884; x_wconf 77' lang='eng' dir='ltr'>12261T</span> <span class='ocrx_word' id='word_1_85' title='bbox 915 862 1069 889; x_wconf 87' lang='eng' dir='ltr'><em>(AY576655)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 481 933 1088 963; baseline 0.002 -6"><span class='ocrx_word' id='word_1_86' title='bbox 481 936 564 958; x_wconf 88' lang='eng' dir='ltr'><em>Gillisia</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 575 936 680 963; x_wconf 89' lang='eng' dir='ltr'><em>myxi/Iae</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 692 933 918 958; x_wconf 86' lang='eng' dir='ltr'><em>UST050418—085T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 929 936 1088 963; x_wconf 79' lang='eng' dir='ltr'>(D0202393)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 525 1006 1103 1036; baseline 0.002 -6"><span class='ocrx_word' id='word_1_90' title='bbox 525 1009 609 1031; x_wconf 84' lang='eng' dir='ltr'><em>Gil/isia</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 619 1009 757 1031; x_wconf 80' lang='eng' dir='ltr'><em>illustrilutea</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 766 1009 850 1031; x_wconf 91' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 863 1006 938 1031; x_wconf 90' lang='eng' dir='ltr'><em>1062T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 949 1009 1103 1036; x_wconf 88' lang='eng' dir='ltr'>(AY694008)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 363 1076 1105 1106; baseline -0.001 -5"><span class='ocrx_word' id='word_1_95' title='bbox 363 1079 574 1106; x_wconf 85' lang='eng' dir='ltr'><em>Psychroserpens</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 583 1079 732 1106; x_wconf 84' lang='eng' dir='ltr'><em>mesophilus</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 743 1078 830 1101; x_wconf 87' lang='eng' dir='ltr'>KOPRI</span> <span class='ocrx_word' id='word_1_98' title='bbox 844 1076 935 1101; x_wconf 79' lang='eng' dir='ltr'><em>13649T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 945 1078 1105 1106; x_wconf 83' lang='eng' dir='ltr'><em>(DQOO1321)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 474 1146 1149 1176; baseline 0 -5"><span class='ocrx_word' id='word_1_100' title='bbox 474 1149 685 1176; x_wconf 82' lang='eng' dir='ltr'><em>Psychroserpens</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 697 1149 848 1171; x_wconf 78' lang='eng' dir='ltr'><em>burtonensis</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 859 1149 942 1171; x_wconf 90' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 959 1146 1016 1171; x_wconf 91' lang='eng' dir='ltr'><em>188T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 1029 1149 1149 1176; x_wconf 88' lang='eng' dir='ltr'>(U62913)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 353 1220 974 1250; baseline 0 -6"><span class='ocrx_word' id='word_1_105' title='bbox 353 1223 488 1250; x_wconf 82' lang='eng' dir='ltr'><em>Algibacter</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 495 1223 631 1244; x_wconf 86' lang='eng' dir='ltr'><em>mikhai/ovii</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 640 1222 700 1244; x_wconf 91' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 712 1220 805 1244; x_wconf 80' lang='eng' dir='ltr'><em>23988T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 816 1222 974 1250; x_wconf 86' lang='eng' dir='ltr'>(AM491809)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 358 1290 904 1320; baseline 0 -6"><span class='ocrx_word' id='word_1_110' title='bbox 358 1292 576 1320; x_wconf 81' lang='eng' dir='ltr'><em>Algibacter/ectus</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 586 1292 651 1314; x_wconf 92' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 663 1290 739 1314; x_wconf 91' lang='eng' dir='ltr'><em>3902T</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 750 1292 904 1320; x_wconf 85' lang='eng' dir='ltr'>(AY187689)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 635 1358 1186 1389">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 635 1358 1186 1389">
+     <span class='ocr_line' id='line_1_34' title="bbox 635 1358 1186 1389; baseline -0.002 -6"><span class='ocrx_word' id='word_1_114' title='bbox 635 1361 754 1389; x_wconf 89' lang='eng' dir='ltr'><em>Myroides</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 764 1361 878 1383; x_wconf 82' lang='eng' dir='ltr'><em>odoratus</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 887 1361 965 1383; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 976 1358 1053 1383; x_wconf 78' lang='eng' dir='ltr'><em>4651T</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 1063 1361 1186 1389; x_wconf 89' lang='eng' dir='ltr'>(M58777)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003285-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003285-0-000.pbm.png
new file mode 100644
index 00000000..ea3fe0d4
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003285-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003285-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003285-0-000.pbm.png.hocr
new file mode 100644
index 00000000..a5ae3dc0
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003285-0-000.pbm.png.hocr
@@ -0,0 +1,188 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003285-0-000.pbm.png"; bbox 0 0 876 1075; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 5 324 1046">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 0 5 324 1046">
+     <span class='ocr_line' id='line_1_1' title="bbox 235 5 324 103; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 235 42 324 103; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_2' title='bbox 306 5 317 18; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 235 103 324 220; baseline 0 -22"><span class='ocrx_word' id='word_1_3' title='bbox 235 103 324 220; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 205 220 281 276; baseline 0 799"><span class='ocrx_word' id='word_1_4' title='bbox 205 220 281 276; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 225 276 301 376; baseline 0 -22"><span class='ocrx_word' id='word_1_5' title='bbox 225 276 301 376; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 212 376 297 454; baseline 0 -22"><span class='ocrx_word' id='word_1_6' title='bbox 212 376 297 454; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 200 454 289 571; baseline 0 -22"><span class='ocrx_word' id='word_1_7' title='bbox 200 454 289 571; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 212 571 284 649; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 212 571 284 649; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 212 649 241 705; baseline 0 -39"><span class='ocrx_word' id='word_1_9' title='bbox 212 649 241 705; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 191 705 287 805; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 191 705 287 805; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 0 805 297 883; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 0 805 297 883; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 0 883 293 961; baseline 0 0"><span class='ocrx_word' id='word_1_12' title='bbox 0 883 293 961; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 0 961 293 1046; baseline 0 0"><span class='ocrx_word' id='word_1_13' title='bbox 0 961 293 1046; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 241 0 876 1003">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 323 0 695 28">
+     <span class='ocr_line' id='line_1_13' title="bbox 323 0 695 28; baseline 0.003 -6"><span class='ocrx_word' id='word_1_14' title='bbox 323 1 344 23; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 358 1 421 23; x_wconf 84' lang='eng' dir='ltr'><em>faeni</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 430 0 537 23; x_wconf 91' lang='eng' dir='ltr'><em>MA—olkiT</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 547 1 695 28; x_wconf 83' lang='eng' dir='ltr'><em>(AJ429239)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 249 34 788 67">
+     <span class='ocr_line' id='line_1_14' title="bbox 249 34 788 67; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 249 34 301 52; x_wconf 69' lang='eng'>1000</span> <span class='ocrx_word' id='word_1_19' title='bbox 331 40 353 61; x_wconf 91' lang='eng' dir='ltr'><em>s.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 366 40 500 61; x_wconf 82' lang='eng' dir='ltr'><em>aurantiaca</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 511 39 629 61; x_wconf 83' lang='eng' dir='ltr'><em>MA1O1bT</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 640 40 788 67; x_wconf 86' lang='eng' dir='ltr'><em>(AJ429238)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 329 78 728 106">
+     <span class='ocr_line' id='line_1_15' title="bbox 329 78 728 106; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 329 79 351 100; x_wconf 85' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 364 79 467 100; x_wconf 81' lang='eng' dir='ltr'><em>aero/ata</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 479 78 569 100; x_wconf 81' lang='eng' dir='ltr'><em>NW12T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 579 79 728 106; x_wconf 85' lang='eng' dir='ltr'><em>(AJ429240)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 293 117 686 145">
+     <span class='ocr_line' id='line_1_16' title="bbox 293 117 686 145; baseline 0 -6"><span class='ocrx_word' id='word_1_27' title='bbox 293 118 315 139; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 329 118 434 145; x_wconf 87' lang='eng' dir='ltr'><em>aquatilis</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 444 117 524 139; x_wconf 81' lang='eng' dir='ltr'>JSS7T</span> <span class='ocrx_word' id='word_1_30' title='bbox 534 118 686 145; x_wconf 87' lang='eng' dir='ltr'><em>(AF131295)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 317 156 651 184">
+     <span class='ocr_line' id='line_1_17' title="bbox 317 156 651 184; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 317 157 338 178; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 351 157 421 178; x_wconf 84' lang='eng' dir='ltr'><em>abaci</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 429 156 493 178; x_wconf 80' lang='eng' dir='ltr'><em>C42T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 503 157 651 184; x_wconf 81' lang='eng' dir='ltr'><em>(AJ575817)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 281 195 819 262">
+     <span class='ocr_line' id='line_1_18' title="bbox 329 195 819 223; baseline 0 -6"><span class='ocrx_word' id='word_1_35' title='bbox 329 196 351 217; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 364 196 502 217; x_wconf 86' lang='eng' dir='ltr'><em>echinoides</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 513 196 573 217; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 587 195 660 217; x_wconf 89' lang='eng' dir='ltr'><em>1805T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 671 196 819 223; x_wconf 87' lang='eng' dir='ltr'><em>(AJO12461)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 281 234 688 262; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 281 235 303 256; x_wconf 92' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 316 235 369 256; x_wconf 87' lang='eng' dir='ltr'><em>mali</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 379 235 458 256; x_wconf 86' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_43' title='bbox 471 234 560 256; x_wconf 74' lang='eng' dir='ltr'><em>15500T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 570 235 688 262; x_wconf 87' lang='eng' dir='ltr'><em>(Y09638)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 285 273 703 301">
+     <span class='ocr_line' id='line_1_20' title="bbox 285 273 703 301; baseline 0 -6"><span class='ocrx_word' id='word_1_45' title='bbox 285 274 307 295; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 318 274 385 301; x_wconf 89' lang='eng' dir='ltr'><em>pruni</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 394 274 474 295; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_48' title='bbox 487 273 575 295; x_wconf 85' lang='eng' dir='ltr'><em>15498T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 586 274 703 301; x_wconf 86' lang='eng' dir='ltr'><em>(Y09637)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 283 312 838 379">
+     <span class='ocr_line' id='line_1_21' title="bbox 283 312 838 340; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 283 313 305 334; x_wconf 91' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 318 313 517 340; x_wconf 82' lang='eng' dir='ltr'><em>asaccharo/ytica</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 529 313 608 334; x_wconf 86' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 621 312 710 334; x_wconf 83' lang='eng' dir='ltr'><em>15499T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 720 313 838 340; x_wconf 85' lang='eng' dir='ltr'><em>(Y09639)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 306 351 642 379; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 306 352 328 373; x_wconf 66' lang='eng' dir='ltr'><em>S,</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 341 352 385 373; x_wconf 91' lang='eng' dir='ltr'><em>soli</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 393 351 479 373; x_wconf 92' lang='eng' dir='ltr'><em>T5-04T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 490 352 642 379; x_wconf 84' lang='eng' dir='ltr'><em>(AB166883)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 285 390 711 418">
+     <span class='ocr_line' id='line_1_23' title="bbox 285 390 711 418; baseline 0 -6"><span class='ocrx_word' id='word_1_59' title='bbox 285 391 307 412; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 320 391 444 412; x_wconf 82' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 453 390 549 412; x_wconf 81' lang='eng' dir='ltr'><em>JSSZGT</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 560 391 711 418; x_wconf 80' lang='eng' dir='ltr'><em>(AF131296)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 302 429 776 457">
+     <span class='ocr_line' id='line_1_24' title="bbox 302 429 776 457; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 302 430 324 451; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 337 430 468 451; x_wconf 87' lang='eng' dir='ltr'><em>adhaesiva</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 478 430 544 451; x_wconf 91' lang='eng' dir='ltr'><em>GIFU</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 558 429 647 451; x_wconf 79' lang='eng' dir='ltr'><em>11458T</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 657 430 776 457; x_wconf 80' lang='eng' dir='ltr'><em>(D16146)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 281 468 733 496">
+     <span class='ocr_line' id='line_1_25' title="bbox 281 468 733 496; baseline 0 -6"><span class='ocrx_word' id='word_1_68' title='bbox 281 469 303 490; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 316 469 479 490; x_wconf 83' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 489 468 565 490; x_wconf 89' lang='eng' dir='ltr'><em>DS-4T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 575 469 733 496; x_wconf 87' lang='eng' dir='ltr'><em>(DQ178975)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 283 507 834 652">
+     <span class='ocr_line' id='line_1_26' title="bbox 289 507 834 535; baseline 0 -6"><span class='ocrx_word' id='word_1_72' title='bbox 289 508 311 529; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 324 508 491 529; x_wconf 84' lang='eng' dir='ltr'><em>mucosissima</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 503 508 563 529; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 576 507 666 529; x_wconf 78' lang='eng' dir='ltr'><em>17494T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 676 508 834 535; x_wconf 84' lang='eng' dir='ltr'><em>(AM229669)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 298 546 821 573; baseline 0 -5"><span class='ocrx_word' id='word_1_77' title='bbox 298 547 319 568; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 332 547 496 568; x_wconf 86' lang='eng' dir='ltr'><em>molluscorum</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 507 547 571 568; x_wconf 92' lang='eng' dir='ltr'><em>KMM</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 583 546 658 568; x_wconf 81' lang='eng' dir='ltr'><em>3882T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 668 547 821 573; x_wconf 78' lang='eng' dir='ltr'><em>(ABZ48285)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 283 585 799 613; baseline -0.002 -5"><span class='ocrx_word' id='word_1_82' title='bbox 283 586 305 608; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 318 586 466 608; x_wconf 86' lang='eng' dir='ltr'><em>desiccabi/is</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 477 586 537 608; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 551 585 640 608; x_wconf 74' lang='eng' dir='ltr'><em>18792T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 650 586 799 613; x_wconf 84' lang='eng' dir='ltr'><em>(AJ871435)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 289 624 626 652; baseline 0 -6"><span class='ocrx_word' id='word_1_87' title='bbox 289 625 311 646; x_wconf 91' lang='eng' dir='ltr'><em>s.</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 323 625 395 652; x_wconf 82' lang='eng' dir='ltr'><em>pann/</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 404 624 467 646; x_wconf 80' lang='eng' dir='ltr'><em>052T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 478 625 626 652; x_wconf 89' lang='eng' dir='ltr'><em>(AJ575818)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 241 663 831 730">
+     <span class='ocr_line' id='line_1_30' title="bbox 241 663 831 691; baseline -0.003 -4"><span class='ocrx_word' id='word_1_91' title='bbox 241 668 280 687; x_wconf 88' lang='eng'><em>982</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 302 664 324 685; x_wconf 89' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 337 664 475 691; x_wconf 81' lang='eng' dir='ltr'><em>azotiﬁgens</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 486 664 565 685; x_wconf 85' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 578 663 667 685; x_wconf 85' lang='eng' dir='ltr'><em>15497T</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 678 664 831 691; x_wconf 85' lang='eng' dir='ltr'>(ABZ17471)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 242 699 716 730; baseline 0 -6"><span class='ocrx_word' id='word_1_97' title='bbox 242 699 267 718; x_wconf 85' lang='eng'>00</span> <span class='ocrx_word' id='word_1_98' title='bbox 300 703 322 724; x_wconf 87' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 335 703 433 730; x_wconf 82' lang='eng' dir='ltr'><em>trueperi</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 443 703 502 724; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 513 702 588 724; x_wconf 85' lang='eng' dir='ltr'><em>2142T</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 598 703 716 730; x_wconf 83' lang='eng' dir='ltr'><em>(X97776)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 295 741 685 769">
+     <span class='ocr_line' id='line_1_32' title="bbox 295 741 685 769; baseline 0 -6"><span class='ocrx_word' id='word_1_103' title='bbox 295 742 317 763; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 329 742 437 769; x_wconf 82' lang='eng' dir='ltr'><em>pituitosa</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 449 741 526 763; x_wconf 67' lang='eng' dir='ltr'><em>EDIW</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 536 742 685 769; x_wconf 89' lang='eng' dir='ltr'><em>(AJ243751)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 298 780 692 808">
+     <span class='ocr_line' id='line_1_33' title="bbox 298 780 692 808; baseline 0 -6"><span class='ocrx_word' id='word_1_107' title='bbox 298 781 322 802; x_wconf 90' lang='eng' dir='ltr'><strong><em>S.</em></strong></span> <span class='ocrx_word' id='word_1_108' title='bbox 329 781 451 808; x_wconf 86' lang='eng' dir='ltr'><em>japonica</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 461 780 529 802; x_wconf 92' lang='eng' dir='ltr'><em>KC7T</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 536 781 692 808; x_wconf 85' lang='eng' dir='ltr'><em>(AB428568)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 273 819 751 847">
+     <span class='ocr_line' id='line_1_34' title="bbox 273 819 751 847; baseline 0 -6"><span class='ocrx_word' id='word_1_111' title='bbox 273 820 294 841; x_wconf 90' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 307 820 429 847; x_wconf 86' lang='eng' dir='ltr'><em>sanguinis</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 440 820 519 841; x_wconf 91' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 533 819 621 841; x_wconf 80' lang='eng' dir='ltr'><em>13937T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 632 820 751 847; x_wconf 82' lang='eng' dir='ltr'><em>(D13726)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 293 858 876 925">
+     <span class='ocr_line' id='line_1_35' title="bbox 302 858 876 885; baseline 0 -5"><span class='ocrx_word' id='word_1_116' title='bbox 302 859 324 880; x_wconf 71' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 335 859 555 885; x_wconf 81' lang='eng' dir='ltr'><em>parapaucimobilis</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 565 859 644 880; x_wconf 89' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 657 858 747 880; x_wconf 82' lang='eng' dir='ltr'><em>15100T</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 757 859 876 885; x_wconf 88' lang='eng' dir='ltr'><em>(D13724)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 293 897 780 925; baseline 0 -6"><span class='ocrx_word' id='word_1_121' title='bbox 293 897 315 919; x_wconf 87' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 327 898 488 925; x_wconf 85' lang='eng' dir='ltr'><em>paucimobilis</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 498 897 564 919; x_wconf 89' lang='eng' dir='ltr'><em>GIFU</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 575 897 650 919; x_wconf 87' lang='eng' dir='ltr'><em>2395T</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 661 898 780 925; x_wconf 84' lang='eng' dir='ltr'><em>(D16144)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 298 936 698 964">
+     <span class='ocr_line' id='line_1_37' title="bbox 298 936 698 964; baseline 0 -6"><span class='ocrx_word' id='word_1_126' title='bbox 298 937 319 958; x_wconf 88' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 332 937 456 958; x_wconf 84' lang='eng' dir='ltr'><em>roseif/ava</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 467 936 568 958; x_wconf 80' lang='eng' dir='ltr'><em>MK341T</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 579 937 698 964; x_wconf 88' lang='eng' dir='ltr'><em>(D84520)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 289 975 739 1003">
+     <span class='ocr_line' id='line_1_38' title="bbox 289 975 739 1003; baseline 0 -6"><span class='ocrx_word' id='word_1_130' title='bbox 289 976 311 997; x_wconf 90' lang='eng' dir='ltr'><em>S.</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 325 976 418 997; x_wconf 82' lang='eng' dir='ltr'><em>wittichii</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 427 976 488 997; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 499 975 575 997; x_wconf 80' lang='eng' dir='ltr'><em>6014T</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 585 976 739 1003; x_wconf 83' lang='eng' dir='ltr'><em>(ABOZ1492)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 297 1012 757 1075">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 297 1012 757 1075">
+     <span class='ocr_line' id='line_1_39' title="bbox 297 1012 757 1040; baseline 0 -6"><span class='ocrx_word' id='word_1_135' title='bbox 297 1013 459 1034; x_wconf 81' lang='eng' dir='ltr'><em>Burkho/deria</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 469 1013 568 1040; x_wconf 85' lang='eng' dir='ltr'><em>cepacia</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 577 1013 654 1034; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 666 1012 757 1034; x_wconf 82' lang='eng' dir='ltr'><em>25416T</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 297 1048 449 1075; baseline 0 -6"><span class='ocrx_word' id='word_1_139' title='bbox 297 1048 449 1075; x_wconf 83' lang='eng' dir='ltr'><em>(AF097530)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 13 187 59 206">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 13 187 59 206">
+     <span class='ocr_line' id='line_1_41' title="bbox 13 187 59 206; baseline -0.022 0"><span class='ocrx_word' id='word_1_140' title='bbox 13 187 59 206; x_wconf 57' lang='eng'>0,02</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 161 250 201 268">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 161 250 201 268">
+     <span class='ocr_line' id='line_1_42' title="bbox 161 250 201 268; baseline 0 0"><span class='ocrx_word' id='word_1_141' title='bbox 161 250 201 268; x_wconf 87' lang='eng'><em>959</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 158 508 210 561">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 158 508 210 561">
+     <span class='ocr_line' id='line_1_43' title="bbox 158 508 197 526; baseline 0 0"><span class='ocrx_word' id='word_1_142' title='bbox 158 508 197 526; x_wconf 84' lang='eng'><em>975</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 171 542 210 561; baseline 0 0"><span class='ocrx_word' id='word_1_143' title='bbox 171 542 210 561; x_wconf 81' lang='eng'><em>995</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 175 734 215 753">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 175 734 215 753">
+     <span class='ocr_line' id='line_1_45' title="bbox 175 734 215 753; baseline 0 0"><span class='ocrx_word' id='word_1_144' title='bbox 175 734 215 753; x_wconf 85' lang='eng'><em>903</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003293-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003293-0-000.pbm.png
new file mode 100644
index 00000000..7d2076dc
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003293-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003293-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003293-0-000.pbm.png.hocr
new file mode 100644
index 00000000..fd3c04a0
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003293-0-000.pbm.png.hocr
@@ -0,0 +1,259 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003293-0-000.pbm.png"; bbox 0 0 1302 1015; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 123 275 331 295">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 123 276 331 293">
+     <span class='ocr_line' id='line_1_1' title="bbox 123 276 331 293; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 123 277 147 293; x_wconf 85' lang='eng'>98</span> <span class='ocrx_word' id='word_1_2' title='bbox 308 276 331 293; x_wconf 82' lang='eng'><em>92</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 184 0 1300 278">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 217 3 1298 168">
+     <span class='ocr_line' id='line_1_2' title="bbox 353 3 1117 28; baseline -0.001 -4"><span class='ocrx_word' id='word_1_3' title='bbox 353 8 376 25; x_wconf 87' lang='eng'><em>77</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 408 13 657 16; x_wconf 74' lang='eng'><em>_</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 663 5 802 23; x_wconf 81' lang='eng' dir='ltr'><em>AI/oiococcus</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 810 5 860 23; x_wconf 83' lang='eng' dir='ltr'><em>otitis</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 869 5 934 23; x_wconf 91' lang='eng' dir='ltr'><em>NCFB</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 943 3 1008 23; x_wconf 81' lang='eng' dir='ltr'><em>2890T</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 1016 5 1117 28; x_wconf 80' lang='eng' dir='ltr'>(X59765)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 264 38 1201 63; baseline 0 -5"><span class='ocrx_word' id='word_1_10' title='bbox 264 44 299 61; x_wconf 88' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 408 48 682 50; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_12' title='bbox 689 40 860 63; x_wconf 82' lang='eng' dir='ltr'><em>Do/osigranulum</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 868 40 944 63; x_wconf 73' lang='eng' dir='ltr'><em>pigrurn</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 953 40 1018 58; x_wconf 88' lang='eng' dir='ltr'><em>NCFB</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1027 38 1091 58; x_wconf 76' lang='eng' dir='ltr'><em>2975T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 1101 40 1201 63; x_wconf 84' lang='eng' dir='ltr'>(X70907)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 392 73 1124 98; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 392 82 618 97; x_wconf 65' lang='eng'><em>[—</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 625 75 755 98; x_wconf 79' lang='eng' dir='ltr'><em>Atopost/pes</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 763 75 890 93; x_wconf 85' lang='eng' dir='ltr'><em>suicloacalis</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 899 73 986 93; x_wconf 89' lang='eng' dir='ltr'><em>PPC79T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 995 75 1124 98; x_wconf 86' lang='eng' dir='ltr'>(AF445248)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 217 108 1298 137; baseline 0 -9"><span class='ocrx_word' id='word_1_22' title='bbox 217 121 241 137; x_wconf 67' lang='eng'><em>96</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 353 109 376 125; x_wconf 85' lang='eng'><em>78</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 394 119 798 121; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_25' title='bbox 805 110 905 128; x_wconf 75' lang='eng' dir='ltr'><em>Allofush&#39;s</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 913 110 996 128; x_wconf 86' lang='eng' dir='ltr'><em>seminis</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1004 110 1075 128; x_wconf 88' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_28' title='bbox 1084 108 1163 128; x_wconf 78' lang='eng' dir='ltr'><em>45438T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1172 110 1298 133; x_wconf 90' lang='eng' dir='ltr'>(AJ410303)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 307 143 1008 168; baseline 0 -5"><span class='ocrx_word' id='word_1_30' title='bbox 307 149 342 166; x_wconf 86' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 403 145 597 163; x_wconf 81' lang='eng' dir='ltr'><em>Marini/actibacillus</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 604 145 781 168; x_wconf 79' lang='eng' dir='ltr'><em>psychrotolerans</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 790 143 869 163; x_wconf 82' lang='eng' dir='ltr'><em>M13-2T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 878 145 1008 168; x_wconf 79' lang='eng' dir='ltr'>(A8083406)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 184 178 1065 273">
+     <span class='ocr_line' id='line_1_7' title="bbox 406 178 969 203; baseline 0 -5"><span class='ocrx_word' id='word_1_35' title='bbox 406 180 600 198; x_wconf 83' lang='eng' dir='ltr'><em>Marinilactibaci/lus</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 607 180 755 203; x_wconf 75' lang='eng' dir='ltr'><em>piezotolerans</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 764 178 829 198; x_wconf 90' lang='eng' dir='ltr'><em>LT20T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 838 180 969 203; x_wconf 83' lang='eng' dir='ltr'>(AY485792)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 184 213 1020 260; baseline -0.001 -26"><span class='ocrx_word' id='word_1_39' title='bbox 184 214 219 238; x_wconf 51' lang='eng' dir='ltr'><em>{l</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 265 228 288 245; x_wconf 74' lang='eng'>98</span> <span class='ocrx_word' id='word_1_41' title='bbox 352 215 601 260; x_wconf 51' lang='eng' dir='ltr'><em>r‘:AIkalibacterium</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 608 215 784 239; x_wconf 84' lang='eng' dir='ltr'><em>psychrotolerans</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 794 213 881 233; x_wconf 88' lang='eng' dir='ltr'><em>IDR2-2T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 890 215 1020 239; x_wconf 85' lang='eng' dir='ltr'>(AB125938)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 447 248 1065 273; baseline 0 -5"><span class='ocrx_word' id='word_1_45' title='bbox 447 250 616 268; x_wconf 74' lang='eng' dir='ltr'><em>Alka/ibaclerium</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 624 250 777 273; x_wconf 82' lang='eng' dir='ltr'><em>olivapovliticus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 785 248 927 268; x_wconf 85' lang='eng' dir='ltr'><em>WW2-SN4aT</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 935 250 1065 273; x_wconf 88' lang='eng' dir='ltr'>(AF143511)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 354 30 408 32">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 354 30 408 32">
+     <span class='ocr_line' id='line_1_10' title="bbox 354 30 408 32; baseline 0 983"><span class='ocrx_word' id='word_1_49' title='bbox 354 30 408 32; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 406 13 408 50">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 406 13 408 50">
+     <span class='ocr_line' id='line_1_11' title="bbox 406 13 408 50; baseline 0 965"><span class='ocrx_word' id='word_1_50' title='bbox 406 13 408 50; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 267 65 356 69">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 267 65 356 69">
+     <span class='ocr_line' id='line_1_12' title="bbox 267 65 356 69; baseline 0 946"><span class='ocrx_word' id='word_1_51' title='bbox 267 65 356 69; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 354 30 357 102">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 354 30 357 102">
+     <span class='ocr_line' id='line_1_13' title="bbox 354 30 357 102; baseline 0 913"><span class='ocrx_word' id='word_1_52' title='bbox 354 30 357 102; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 355 101 394 103">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 355 101 394 103">
+     <span class='ocr_line' id='line_1_14' title="bbox 355 101 394 103; baseline 0 912"><span class='ocrx_word' id='word_1_53' title='bbox 355 101 394 103; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 391 97 395 120">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 391 97 395 120">
+     <span class='ocr_line' id='line_1_15' title="bbox 391 97 395 120; baseline 0 895"><span class='ocrx_word' id='word_1_54' title='bbox 391 97 395 120; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 220 143 269 145">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 220 143 269 145">
+     <span class='ocr_line' id='line_1_16' title="bbox 220 143 269 145; baseline 0 870"><span class='ocrx_word' id='word_1_55' title='bbox 220 143 269 145; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 266 66 270 221">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 266 66 270 221">
+     <span class='ocr_line' id='line_1_17' title="bbox 266 66 270 221; baseline 0 794"><span class='ocrx_word' id='word_1_56' title='bbox 266 66 270 221; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 352 257 354 295">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 352 257 354 295">
+     <span class='ocr_line' id='line_1_18' title="bbox 352 257 354 295; baseline 0 720"><span class='ocrx_word' id='word_1_57' title='bbox 352 257 354 295; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 125 298 188 302">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 125 298 188 302">
+     <span class='ocr_line' id='line_1_19' title="bbox 125 298 188 302; baseline 0 713"><span class='ocrx_word' id='word_1_58' title='bbox 125 298 188 302; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 4 747 94 752">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 4 747 94 752">
+     <span class='ocr_line' id='line_1_20' title="bbox 4 747 94 752; baseline 0 263"><span class='ocrx_word' id='word_1_59' title='bbox 4 747 94 752; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 121 299 132 776">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 121 299 132 776">
+     <span class='ocr_line' id='line_1_21' title="bbox 121 299 132 776; baseline 0 239"><span class='ocrx_word' id='word_1_60' title='bbox 121 299 132 776; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 88 536 98 962">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 88 536 98 962">
+     <span class='ocr_line' id='line_1_22' title="bbox 88 536 98 962; baseline 0 53"><span class='ocrx_word' id='word_1_61' title='bbox 88 536 98 962; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 2 748 8 998">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 2 748 8 998">
+     <span class='ocr_line' id='line_1_23' title="bbox 2 748 8 998; baseline 0 17"><span class='ocrx_word' id='word_1_62' title='bbox 2 748 8 998; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 219 143 223 331">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 219 143 223 331">
+     <span class='ocr_line' id='line_1_24' title="bbox 219 143 223 331; baseline 0 684"><span class='ocrx_word' id='word_1_63' title='bbox 219 143 223 331; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 171 281 934 523">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 171 283 932 519">
+     <span class='ocr_line' id='line_1_25' title="bbox 354 283 932 309; baseline 0 -5"><span class='ocrx_word' id='word_1_64' title='bbox 354 293 457 295; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_65' title='bbox 463 285 632 304; x_wconf 54' lang='eng' dir='ltr'><em>Aka/(bacterium</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 640 285 740 304; x_wconf 81' lang='eng' dir='ltr'><em>iburiense</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 750 283 792 304; x_wconf 75' lang='eng' dir='ltr'><em>M3T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 801 285 932 309; x_wconf 88' lang='eng' dir='ltr'>(AB188091)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 398 318 917 344; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 398 321 541 344; x_wconf 81' lang='eng' dir='ltr'><em>Atopococcus</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 549 321 616 339; x_wconf 82' lang='eng' dir='ltr'><em>tabaci</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 623 320 694 339; x_wconf 89' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_72' title='bbox 703 318 781 339; x_wconf 83' lang='eng' dir='ltr'><em>48253T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 790 320 917 344; x_wconf 85' lang='eng' dir='ltr'>(AJ634917)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 352 354 877 379; baseline 0 -5"><span class='ocrx_word' id='word_1_74' title='bbox 352 356 519 379; x_wconf 82' lang='eng' dir='ltr'><em>Lacticigenium</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 528 356 623 379; x_wconf 85' lang='eng' dir='ltr'><em>naphtae</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 631 354 736 374; x_wconf 82' lang='eng' dir='ltr'><em>MIC1-18T</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 744 356 877 379; x_wconf 85' lang='eng' dir='ltr'>(AB430339)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 193 388 798 436; baseline 0 -27"><span class='ocrx_word' id='word_1_78' title='bbox 193 391 420 436; x_wconf 40' lang='eng' dir='ltr'><em>1001:36mobacterium</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 427 391 579 414; x_wconf 73' lang='eng' dir='ltr'><em>p/eistoceniurn</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 589 388 659 409; x_wconf 89' lang='eng' dir='ltr'><em>FTR1T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 668 391 798 414; x_wconf 86' lang='eng' dir='ltr'>(AF450136)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 266 424 836 449; baseline 0 -5"><span class='ocrx_word' id='word_1_82' title='bbox 266 426 441 444; x_wconf 79' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 449 426 592 444; x_wconf 71' lang='eng' dir='ltr'><em>alterfunditum</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 599 426 670 444; x_wconf 87' lang='eng' dir='ltr'><em>ACAM</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 680 424 730 444; x_wconf 78' lang='eng' dir='ltr'><em>313T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 739 426 836 449; x_wconf 86' lang='eng' dir='ltr'>(L08623)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 171 443 751 484; baseline 0 -5"><span class='ocrx_word' id='word_1_87' title='bbox 171 443 232 476; x_wconf 71' lang='eng' dir='ltr'>86—J—</span> <span class='ocrx_word' id='word_1_88' title='bbox 240 461 415 479; x_wconf 82' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 424 461 509 479; x_wconf 84' lang='eng' dir='ltr'><em>viridans</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 518 459 613 479; x_wconf 89' lang='eng' dir='ltr'><em>MPL-11T</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 622 461 751 484; x_wconf 87' lang='eng' dir='ltr'>(AF425608)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 206 494 669 519; baseline 0 -5"><span class='ocrx_word' id='word_1_92' title='bbox 206 503 230 506; x_wconf 81' lang='eng'>—</span> <span class='ocrx_word' id='word_1_93' title='bbox 239 496 413 514; x_wconf 81' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 421 496 514 514; x_wconf 85' lang='eng' dir='ltr'><em>inhibens</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 522 496 547 514; x_wconf 97' lang='eng' dir='ltr'>K1</span> <span class='ocrx_word' id='word_1_96' title='bbox 552 494 561 506; x_wconf 69' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_97' title='bbox 570 496 669 519; x_wconf 84' lang='eng'>(273313)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 187 526 878 613">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 193 529 877 613">
+     <span class='ocr_line' id='line_1_32' title="bbox 193 529 877 613; baseline -0.003 -62"><span class='ocrx_word' id='word_1_98' title='bbox 193 535 246 613; x_wconf 51' lang='eng' dir='ltr'><em>95S</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 254 531 429 550; x_wconf 82' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 438 531 614 550; x_wconf 84' lang='eng' dir='ltr'><em>maltaromaticum</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 623 531 675 550; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 685 529 763 550; x_wconf 75' lang='eng' dir='ltr'><em>20342T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 772 531 877 555; x_wconf 86' lang='eng' dir='ltr'><em>(M58825)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 184 236 190 366">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 184 236 190 366">
+     <span class='ocr_line' id='line_1_33' title="bbox 184 236 190 366; baseline 0 649"><span class='ocrx_word' id='word_1_104' title='bbox 184 236 190 366; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 203 416 209 505">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 203 416 209 505">
+     <span class='ocr_line' id='line_1_34' title="bbox 203 416 209 505; baseline 0 510"><span class='ocrx_word' id='word_1_105' title='bbox 203 416 209 505; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 168 528 188 532">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 168 528 188 532">
+     <span class='ocr_line' id='line_1_35' title="bbox 168 528 188 532; baseline 0 483"><span class='ocrx_word' id='word_1_106' title='bbox 168 528 188 532; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 129 562 885 945">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 129 564 885 941">
+     <span class='ocr_line' id='line_1_36' title="bbox 292 564 846 589; baseline 0 -5"><span class='ocrx_word' id='word_1_107' title='bbox 292 566 467 585; x_wconf 83' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 475 566 589 589; x_wconf 80' lang='eng' dir='ltr'><em>gal/inarum</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 598 566 664 585; x_wconf 89' lang='eng' dir='ltr'>NCFB</span> <span class='ocrx_word' id='word_1_110' title='bbox 673 564 737 585; x_wconf 74' lang='eng' dir='ltr'><em>2766T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 746 566 846 589; x_wconf 82' lang='eng' dir='ltr'><em>(X54269)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 288 599 841 625; baseline 0 -5"><span class='ocrx_word' id='word_1_112' title='bbox 288 602 463 620; x_wconf 76' lang='eng' dir='ltr'><em>Camobacterium</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 472 602 579 625; x_wconf 85' lang='eng' dir='ltr'><em>divergens</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 588 602 659 620; x_wconf 90' lang='eng' dir='ltr'><em>NCDO</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 667 599 732 620; x_wconf 83' lang='eng' dir='ltr'><em>2763T</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 741 602 841 625; x_wconf 89' lang='eng' dir='ltr'><em>(X54270)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 129 633 678 660; baseline 0 -5"><span class='ocrx_word' id='word_1_117' title='bbox 129 633 153 650; x_wconf 73' lang='eng'>66</span> <span class='ocrx_word' id='word_1_118' title='bbox 190 645 230 647; x_wconf 97' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_119' title='bbox 239 636 413 655; x_wconf 85' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 422 636 516 655; x_wconf 74' lang='eng' dir='ltr'><em>funditum</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 525 634 568 660; x_wconf 81' lang='eng' dir='ltr'><em>pf3T</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 577 636 678 660; x_wconf 81' lang='eng'>(886170)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 165 670 753 695; baseline 0.003 -7"><span class='ocrx_word' id='word_1_123' title='bbox 165 672 232 688; x_wconf 87' lang='eng'><em>71—</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 240 672 415 690; x_wconf 82' lang='eng' dir='ltr'><em>Carnobacterium</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 424 672 496 690; x_wconf 86' lang='eng' dir='ltr'><em>mobile</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 505 672 570 690; x_wconf 92' lang='eng' dir='ltr'><em>NCFB</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 579 670 643 690; x_wconf 79' lang='eng' dir='ltr'><em>2765T</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 653 672 753 695; x_wconf 90' lang='eng' dir='ltr'>(X54271)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 291 704 741 730; baseline 0 -5"><span class='ocrx_word' id='word_1_129' title='bbox 291 707 400 725; x_wconf 86' lang='eng' dir='ltr'><em>Desemzia</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 409 707 482 725; x_wconf 68' lang='eng' dir='ltr'><em>incena</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 492 707 544 725; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 553 704 632 725; x_wconf 90' lang='eng' dir='ltr'><em>20581T</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 640 707 741 730; x_wconf 86' lang='eng' dir='ltr'>(Y17300)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 311 740 781 765; baseline 0 -5"><span class='ocrx_word' id='word_1_134' title='bbox 311 742 455 760; x_wconf 86' lang='eng' dir='ltr'><em>Trichococcus</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 464 742 544 760; x_wconf 86' lang='eng' dir='ltr'><em>collinsii</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 551 740 645 760; x_wconf 71' lang='eng' dir='ltr'><em>37AN3’T</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 655 742 781 765; x_wconf 87' lang='eng' dir='ltr'>(AJ306612)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 311 775 870 800; baseline 0 -5"><span class='ocrx_word' id='word_1_138' title='bbox 311 777 455 795; x_wconf 85' lang='eng' dir='ltr'><em>Trichococcus</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 462 777 616 800; x_wconf 80' lang='eng' dir='ltr'><em>pategoniensis</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 625 775 732 800; x_wconf 79' lang='eng' dir='ltr'><em>PmagG1T</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 741 777 870 800; x_wconf 85' lang='eng' dir='ltr'>(AF394926)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 266 803 833 835; baseline 0 -5"><span class='ocrx_word' id='word_1_142' title='bbox 266 803 290 820; x_wconf 70' lang='eng'><em>76</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 320 812 464 830; x_wconf 88' lang='eng' dir='ltr'><em>Trichococcus</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 471 812 566 835; x_wconf 80' lang='eng' dir='ltr'><em>pasteurii</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 573 812 639 830; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 649 810 727 830; x_wconf 80' lang='eng' dir='ltr'>35945T</span> <span class='ocrx_word' id='word_1_147' title='bbox 736 812 833 835; x_wconf 81' lang='eng' dir='ltr'><em>(L76599)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 316 845 830 870; baseline 0 -5"><span class='ocrx_word' id='word_1_148' title='bbox 316 847 460 865; x_wconf 84' lang='eng' dir='ltr'><em>Trichococcus</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 467 847 560 870; x_wconf 77' lang='eng' dir='ltr'><em>pa/ustris</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 569 847 621 865; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 630 845 695 865; x_wconf 74' lang='eng' dir='ltr'><em>9172T</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 704 847 830 870; x_wconf 80' lang='eng' dir='ltr'>(AJ296179)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 345 880 885 906; baseline 0 -5"><span class='ocrx_word' id='word_1_153' title='bbox 345 882 489 901; x_wconf 83' lang='eng' dir='ltr'><em>Trichococcus</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 497 882 640 901; x_wconf 79' lang='eng' dir='ltr'><em>floccu/iformis</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 649 882 702 901; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 711 880 776 901; x_wconf 83' lang='eng' dir='ltr'><em>2094T</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 785 882 885 906; x_wconf 84' lang='eng' dir='ltr'>(Y17301)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 244 915 738 941; baseline 0 -5"><span class='ocrx_word' id='word_1_158' title='bbox 244 918 370 936; x_wconf 86' lang='eng' dir='ltr'><em>Isobaculum</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 378 918 436 936; x_wconf 86' lang='eng' dir='ltr'><em>melis</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 444 917 515 936; x_wconf 90' lang='eng' dir='ltr'><strong>CCUG</strong></span> <span class='ocrx_word' id='word_1_161' title='bbox 524 915 602 936; x_wconf 82' lang='eng' dir='ltr'><em>37660T</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 611 917 738 941; x_wconf 82' lang='eng' dir='ltr'>(AJ302648)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 167 529 171 665">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 167 529 171 665">
+     <span class='ocr_line' id='line_1_47' title="bbox 167 529 171 665; baseline 0 350"><span class='ocrx_word' id='word_1_163' title='bbox 167 529 171 665; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 168 662 190 666">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 168 662 190 666">
+     <span class='ocr_line' id='line_1_48' title="bbox 168 662 190 666; baseline 0 349"><span class='ocrx_word' id='word_1_164' title='bbox 168 662 190 666; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 184 236 194 681">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 184 236 194 681">
+     <span class='ocr_line' id='line_1_49' title="bbox 184 236 194 681; baseline 0 334"><span class='ocrx_word' id='word_1_165' title='bbox 184 236 194 681; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 153 747 339 896">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 154 747 339 896">
+     <span class='ocr_line' id='line_1_50' title="bbox 294 747 307 787; baseline 0 0"><span class='ocrx_word' id='word_1_166' title='bbox 294 747 307 787; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 154 851 339 896; baseline 0 0"><span class='ocrx_word' id='word_1_167' title='bbox 154 851 339 896; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 150 835 184 852">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 150 836 184 852">
+     <span class='ocr_line' id='line_1_52' title="bbox 150 836 184 852; baseline 0 0"><span class='ocrx_word' id='word_1_168' title='bbox 150 836 184 852; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 150 658 158 928">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 150 658 158 928">
+     <span class='ocr_line' id='line_1_53' title="bbox 150 658 158 928; baseline 0 87"><span class='ocrx_word' id='word_1_169' title='bbox 150 658 158 928; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 154 926 236 928">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 154 926 236 928">
+     <span class='ocr_line' id='line_1_54' title="bbox 154 926 236 928; baseline 0 87"><span class='ocrx_word' id='word_1_170' title='bbox 154 926 236 928; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 5 949 766 999">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 94 950 765 976">
+     <span class='ocr_line' id='line_1_55' title="bbox 94 950 765 976; baseline 0 -5"><span class='ocrx_word' id='word_1_171' title='bbox 94 960 246 963; x_wconf 70' lang='eng'><em>—</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 253 953 403 971; x_wconf 82' lang='eng' dir='ltr'><em>Enterococcus</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 411 952 495 971; x_wconf 85' lang='eng' dir='ltr'><em>faecalis</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 503 952 552 971; x_wconf 89' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 562 950 626 971; x_wconf 86' lang='eng' dir='ltr'><em>5803T</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 634 952 765 976; x_wconf 89' lang='eng' dir='ltr'>(ABO12212)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 371 983 913 1015">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 371 986 913 1011">
+     <span class='ocr_line' id='line_1_56' title="bbox 371 986 913 1011; baseline 0 -5"><span class='ocrx_word' id='word_1_177' title='bbox 371 988 527 1011; x_wconf 81' lang='eng' dir='ltr'><em>Streptococcus</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 534 993 642 1011; x_wconf 83' lang='eng' dir='ltr'><em>pyugenes</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 650 988 699 1006; x_wconf 86' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 709 986 773 1006; x_wconf 77' lang='eng' dir='ltr'><em>5674T</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 782 988 913 1011; x_wconf 85' lang='eng' dir='ltr'>(AB023575)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-000.pbm.png
new file mode 100644
index 00000000..d33e8ae8
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-000.pbm.png.hocr
new file mode 100644
index 00000000..9d48f20d
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-000.pbm.png.hocr
@@ -0,0 +1,305 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003327-0-000.pbm.png"; bbox 0 0 994 945; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 661 2 917">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 0 661 2 917">
+     <span class='ocr_line' id='line_1_1' title="bbox 0 661 2 917; baseline 0 28"><span class='ocrx_word' id='word_1_1' title='bbox 0 661 2 917; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 184 451 214 465">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 184 451 214 465">
+     <span class='ocr_line' id='line_1_2' title="bbox 184 451 214 465; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 184 451 214 465; x_wconf 84' lang='eng'>976</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 224 398 255 412">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 224 398 255 412">
+     <span class='ocr_line' id='line_1_3' title="bbox 224 398 255 412; baseline -0.032 0"><span class='ocrx_word' id='word_1_3' title='bbox 224 398 255 412; x_wconf 80' lang='eng'><em>994</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 219 414 261 435">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 219 414 261 435">
+     <span class='ocr_line' id='line_1_4' title="bbox 219 414 261 435; baseline 0 -19"><span class='ocrx_word' id='word_1_4' title='bbox 219 414 261 435; x_wconf 74' lang='eng' dir='ltr'><em>I,—</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 181 466 222 468">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 181 466 222 468">
+     <span class='ocr_line' id='line_1_5' title="bbox 181 466 222 468; baseline 0 477"><span class='ocrx_word' id='word_1_5' title='bbox 181 466 222 468; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 181 466 183 624">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 181 466 183 624">
+     <span class='ocr_line' id='line_1_6' title="bbox 181 466 183 624; baseline 0 321"><span class='ocrx_word' id='word_1_6' title='bbox 181 466 183 624; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 101 646 140 660">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 101 646 140 660">
+     <span class='ocr_line' id='line_1_7' title="bbox 101 646 140 660; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 101 646 140 660; x_wconf 85' lang='eng'>1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 151 762 181 776">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 151 762 181 776">
+     <span class='ocr_line' id='line_1_8' title="bbox 151 762 181 776; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 151 762 181 776; x_wconf 82' lang='eng'><em>933</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 0 942 64 945">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 0 942 64 945">
+     <span class='ocr_line' id='line_1_9' title="bbox 0 942 64 945; baseline 0 0"><span class='ocrx_word' id='word_1_9' title='bbox 0 942 64 945; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 220 435 222 519">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 220 435 222 519">
+     <span class='ocr_line' id='line_1_10' title="bbox 220 435 222 519; baseline 0 426"><span class='ocrx_word' id='word_1_10' title='bbox 220 435 222 519; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 239 578 269 592">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 239 578 269 592">
+     <span class='ocr_line' id='line_1_11' title="bbox 239 578 269 592; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 239 578 269 592; x_wconf 73' lang='eng'><em>854</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 183 607 261 624">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 218 607 258 621">
+     <span class='ocr_line' id='line_1_12' title="bbox 218 607 258 621; baseline 0.025 -1"><span class='ocrx_word' id='word_1_12' title='bbox 218 607 258 621; x_wconf 89' lang='eng'>1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 236 720 276 734">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 236 720 276 734">
+     <span class='ocr_line' id='line_1_13' title="bbox 236 720 276 734; baseline 0.025 -1"><span class='ocrx_word' id='word_1_13' title='bbox 236 720 276 734; x_wconf 88' lang='eng'>1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 222 499 393 552">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 247 502 393 552">
+     <span class='ocr_line' id='line_1_14' title="bbox 247 502 286 516; baseline 0 0"><span class='ocrx_word' id='word_1_14' title='bbox 247 502 286 516; x_wconf 81' lang='eng'>1000</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 327 529 393 552; baseline 0 -5"><span class='ocrx_word' id='word_1_15' title='bbox 327 529 393 552; x_wconf 91' lang='eng' dir='ltr'><em>PhyI/o</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 263 0 994 704">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 280 0 964 26">
+     <span class='ocr_line' id='line_1_16' title="bbox 280 0 964 26; baseline 0 -5"><span class='ocrx_word' id='word_1_16' title='bbox 280 12 310 26; x_wconf 77' lang='eng'><em>915</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 334 2 517 21; x_wconf 87' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 525 2 687 21; x_wconf 84' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 695 2 745 21; x_wconf 88' lang='eng' dir='ltr'><em>STM</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 755 0 819 21; x_wconf 70' lang='eng' dir='ltr'><em>2683T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 828 2 964 26; x_wconf 83' lang='eng' dir='ltr'>(AM930381)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 278 38 880 64">
+     <span class='ocr_line' id='line_1_17' title="bbox 278 38 880 64; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 278 50 307 64; x_wconf 74' lang='eng'><em>757</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 330 40 498 58; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 507 40 653 58; x_wconf 79' lang='eng' dir='ltr'><em>tianshanense</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 660 38 742 58; x_wconf 88' lang='eng' dir='ltr'><em>A-1BST</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 751 40 880 63; x_wconf 90' lang='eng' dir='ltr'>(AFO41447)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 327 69 914 101">
+     <span class='ocr_line' id='line_1_18' title="bbox 327 69 914 101; baseline 0 -5"><span class='ocrx_word' id='word_1_27' title='bbox 327 69 520 96; x_wconf 54' lang='eng' dir='ltr'><em>q‘4M1&#39;asorh/zobfum</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 528 78 660 101; x_wconf 81' lang='eng' dir='ltr'><em>temperatum</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 668 75 777 96; x_wconf 86' lang='eng' dir='ltr'><em>SDWO18T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 786 77 914 100; x_wconf 88' lang='eng' dir='ltr'>(AF508208)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 345 113 933 138">
+     <span class='ocr_line' id='line_1_19' title="bbox 345 113 933 138; baseline 0.002 -5"><span class='ocrx_word' id='word_1_31' title='bbox 345 115 513 134; x_wconf 82' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 521 115 687 134; x_wconf 82' lang='eng' dir='ltr'><em>mediterraneum</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 696 113 828 134; x_wconf 79' lang='eng' dir='ltr'><em>UPM-Ca36T</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 837 115 933 138; x_wconf 86' lang='eng' dir='ltr'><em>(L38825)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 318 150 933 198">
+     <span class='ocr_line' id='line_1_20' title="bbox 318 150 933 198; baseline 0 -27"><span class='ocrx_word' id='word_1_35' title='bbox 318 159 344 198; x_wconf 53' lang='eng'><em>31&#39;</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 348 153 515 171; x_wconf 86' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 523 153 679 176; x_wconf 79' lang='eng' dir='ltr'><em>septentrionale</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 687 150 796 171; x_wconf 81' lang='eng' dir='ltr'><em>SDW014T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 805 153 933 176; x_wconf 89' lang='eng' dir='ltr'>(AF508207)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 339 188 911 213">
+     <span class='ocr_line' id='line_1_21' title="bbox 339 188 911 213; baseline -0.002 -4"><span class='ocrx_word' id='word_1_40' title='bbox 339 190 506 209; x_wconf 82' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 515 190 626 213; x_wconf 83' lang='eng' dir='ltr'><em>amorphae</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 635 190 685 209; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 697 188 773 209; x_wconf 74' lang='eng' dir='ltr'><em>18977T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 782 190 911 213; x_wconf 88' lang='eng' dir='ltr'>(AF041442)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 311 222 911 256">
+     <span class='ocr_line' id='line_1_22' title="bbox 311 222 911 256; baseline 0 -10"><span class='ocrx_word' id='word_1_45' title='bbox 311 222 357 256; x_wconf 67' lang='eng'><em>62,—</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 363 228 531 246; x_wconf 78' lang='eng' dir='ltr'><em>Mesomizobium</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 538 228 654 251; x_wconf 84' lang='eng' dir='ltr'><em>plurifarium</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 663 228 714 246; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 725 226 802 246; x_wconf 74' lang='eng' dir='ltr'><em>11892T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 811 228 911 251; x_wconf 87' lang='eng' dir='ltr'>(Y14158)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 334 263 889 289">
+     <span class='ocr_line' id='line_1_23' title="bbox 334 263 889 289; baseline 0 -5"><span class='ocrx_word' id='word_1_51' title='bbox 334 265 526 284; x_wconf 78' lang='eng' dir='ltr'><em>—Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 534 265 613 284; x_wconf 76' lang='eng' dir='ltr'><em>huakuii</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 620 265 705 284; x_wconf 91' lang='eng' dir='ltr'>CCBAU</span> <span class='ocrx_word' id='word_1_54' title='bbox 714 263 779 284; x_wconf 86' lang='eng' dir='ltr'><em>2609T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 788 265 889 289; x_wconf 86' lang='eng' dir='ltr'>(D12797)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 311 301 810 328">
+     <span class='ocr_line' id='line_1_24' title="bbox 311 301 810 328; baseline 0 -6"><span class='ocrx_word' id='word_1_56' title='bbox 311 314 341 328; x_wconf 69' lang='eng'><em>999</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 361 303 529 322; x_wconf 74' lang='eng' dir='ltr'><em>Mesorh/zobium</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 537 303 569 322; x_wconf 78' lang='eng' dir='ltr'><em>Ioti</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 577 303 628 322; x_wconf 87' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 637 301 701 322; x_wconf 84' lang='eng' dir='ltr'><em>6125T</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 710 303 810 326; x_wconf 84' lang='eng' dir='ltr'>(X67229)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 364 339 833 364">
+     <span class='ocr_line' id='line_1_25' title="bbox 364 339 833 364; baseline 0.002 -5"><span class='ocrx_word' id='word_1_62' title='bbox 364 341 531 360; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 539 341 598 360; x_wconf 81' lang='eng' dir='ltr'><em>ciceri</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 605 339 723 360; x_wconf 85' lang='eng' dir='ltr'><em>UPM-Ca7T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 731 341 833 364; x_wconf 84' lang='eng' dir='ltr'>(U07934)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 366 376 852 402">
+     <span class='ocr_line' id='line_1_26' title="bbox 366 376 852 402; baseline 0 -5"><span class='ocrx_word' id='word_1_66' title='bbox 366 379 533 397; x_wconf 81' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 542 379 661 397; x_wconf 83' lang='eng' dir='ltr'><em>chacoense</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 670 376 717 397; x_wconf 90' lang='eng' dir='ltr'><em>Pr5T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 725 379 852 402; x_wconf 85' lang='eng' dir='ltr'>(AJ278249)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 284 414 973 439">
+     <span class='ocr_line' id='line_1_27' title="bbox 284 414 973 439; baseline 0.001 -5"><span class='ocrx_word' id='word_1_70' title='bbox 284 416 557 435; x_wconf 83' lang='eng' dir='ltr'><em>—Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 566 416 649 435; x_wconf 83' lang='eng' dir='ltr'><em>albiziae</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 657 416 742 435; x_wconf 86' lang='eng' dir='ltr'>CCBAU</span> <span class='ocrx_word' id='word_1_73' title='bbox 751 414 830 435; x_wconf 88' lang='eng' dir='ltr'><em>61158T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 838 416 973 439; x_wconf 90' lang='eng' dir='ltr'>(DQ100066)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 454 452 994 477">
+     <span class='ocr_line' id='line_1_28' title="bbox 454 452 994 477; baseline 0 -5"><span class='ocrx_word' id='word_1_75' title='bbox 454 454 621 472; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 630 454 797 477; x_wconf 80' lang='eng' dir='ltr'><em>thiogangeticum</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 806 452 859 472; x_wconf 77' lang='eng' dir='ltr'><em>SJTT</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 868 454 994 477; x_wconf 88' lang='eng' dir='ltr'>(AJ864462)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 380 489 870 515">
+     <span class='ocr_line' id='line_1_29' title="bbox 380 489 870 515; baseline 0 -5"><span class='ocrx_word' id='word_1_79' title='bbox 380 491 556 515; x_wconf 75' lang='eng' dir='ltr'><em>Phy/lobaclerium</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 564 491 622 510; x_wconf 82' lang='eng' dir='ltr'><em>trifo/ii</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 630 489 731 510; x_wconf 84' lang='eng' dir='ltr'><em>PETPOZT</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 740 491 870 514; x_wconf 86' lang='eng' dir='ltr'>(AY786080)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 320 527 938 590">
+     <span class='ocr_line' id='line_1_30' title="bbox 395 527 938 552; baseline 0 -5"><span class='ocrx_word' id='word_1_83' title='bbox 395 529 503 547; x_wconf 83' lang='eng' dir='ltr'><em>bacterium</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 511 529 681 552; x_wconf 85' lang='eng' dir='ltr'><em>myrsinacearum</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 689 529 739 547; x_wconf 87' lang='eng' dir='ltr'><em>STM</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 749 527 799 547; x_wconf 83' lang='eng' dir='ltr'><em>948T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 808 529 938 552; x_wconf 87' lang='eng' dir='ltr'>(AY785315)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 320 564 790 590; baseline 0 -5"><span class='ocrx_word' id='word_1_88' title='bbox 320 566 475 585; x_wconf 85' lang='eng' dir='ltr'><em>Sinorhizobium</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 483 567 549 585; x_wconf 80' lang='eng' dir='ltr'><em>saheli</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 557 566 608 585; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 617 564 681 585; x_wconf 72' lang='eng' dir='ltr'><em>7837T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 690 567 790 590; x_wconf 84' lang='eng' dir='ltr'>(X68390)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 309 602 752 628">
+     <span class='ocr_line' id='line_1_32' title="bbox 309 602 752 628; baseline 0 -5"><span class='ocrx_word' id='word_1_93' title='bbox 309 605 449 623; x_wconf 84' lang='eng' dir='ltr'><em>inorhizobium</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 457 604 511 623; x_wconf 82' lang='eng' dir='ltr'><em>fred/i</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 519 604 570 623; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 579 602 644 623; x_wconf 81' lang='eng' dir='ltr'><em>6217T</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 652 605 752 628; x_wconf 87' lang='eng' dir='ltr'><em>(X67231)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 263 640 797 665">
+     <span class='ocr_line' id='line_1_33' title="bbox 263 640 797 665; baseline 0 -5"><span class='ocrx_word' id='word_1_98' title='bbox 263 650 308 653; x_wconf 93' lang='eng'><em>——</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 314 642 470 661; x_wconf 83' lang='eng' dir='ltr'><em>Sinorhlzobium</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 478 642 556 661; x_wconf 78' lang='eng' dir='ltr'><em>me/I&#39;loti</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 564 642 615 661; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 624 640 688 661; x_wconf 78' lang='eng' dir='ltr'><em>6133T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 697 642 797 665; x_wconf 89' lang='eng' dir='ltr'>(X67222)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 315 678 901 704">
+     <span class='ocr_line' id='line_1_34' title="bbox 315 678 901 704; baseline 0.002 -6"><span class='ocrx_word' id='word_1_104' title='bbox 315 688 342 690; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_105' title='bbox 348 680 464 699; x_wconf 83' lang='eng' dir='ltr'><em>Rhizoblum</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 472 680 641 704; x_wconf 81' lang='eng' dir='ltr'><em>Ieguminosarum</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 651 680 718 699; x_wconf 90' lang='eng' dir='ltr'><em>USDA</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 726 678 791 699; x_wconf 86' lang='eng' dir='ltr'><em>2370T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 800 680 901 703; x_wconf 82' lang='eng' dir='ltr'>(U29386)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 284 77 362 388">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 284 77 362 388">
+     <span class='ocr_line' id='line_1_35' title="bbox 295 77 332 114; baseline 0 831"><span class='ocrx_word' id='word_1_110' title='bbox 295 77 332 114; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 295 114 314 150; baseline 0 795"><span class='ocrx_word' id='word_1_111' title='bbox 295 114 314 150; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 291 150 315 273; baseline 0 0"><span class='ocrx_word' id='word_1_112' title='bbox 291 150 315 273; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 284 273 311 341; baseline 0 -39"><span class='ocrx_word' id='word_1_113' title='bbox 284 273 311 341; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 295 341 362 388; baseline 0 557"><span class='ocrx_word' id='word_1_114' title='bbox 295 341 362 388; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 323 142 343 156">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 323 142 343 156">
+     <span class='ocr_line' id='line_1_40' title="bbox 323 142 343 156; baseline 0 0"><span class='ocrx_word' id='word_1_115' title='bbox 323 142 343 156; x_wconf 85' lang='eng'>80</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 332 81 335 274">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 332 81 335 274">
+     <span class='ocr_line' id='line_1_41' title="bbox 332 81 335 274; baseline 0 671"><span class='ocrx_word' id='word_1_116' title='bbox 332 81 335 274; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 262 367 284 369">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 262 367 284 369">
+     <span class='ocr_line' id='line_1_42' title="bbox 262 367 284 369; baseline 0 576"><span class='ocrx_word' id='word_1_117' title='bbox 262 367 284 369; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 282 310 284 425">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 282 310 284 425">
+     <span class='ocr_line' id='line_1_43' title="bbox 282 310 284 425; baseline 0 520"><span class='ocrx_word' id='word_1_118' title='bbox 282 310 284 425; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 262 367 264 652">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 262 367 264 652">
+     <span class='ocr_line' id='line_1_44' title="bbox 262 367 264 652; baseline 0 293"><span class='ocrx_word' id='word_1_119' title='bbox 262 367 264 652; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 278 691 313 709">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 278 691 313 709">
+     <span class='ocr_line' id='line_1_45' title="bbox 278 691 313 709; baseline -0.029 0"><span class='ocrx_word' id='word_1_120' title='bbox 278 691 313 709; x_wconf 45' lang='eng'>21$</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 313 688 315 728">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 313 688 315 728">
+     <span class='ocr_line' id='line_1_46' title="bbox 313 688 315 728; baseline 0 217"><span class='ocrx_word' id='word_1_121' title='bbox 313 688 315 728; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 187 735 282 737">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 187 735 282 737">
+     <span class='ocr_line' id='line_1_47' title="bbox 187 735 282 737; baseline 0 208"><span class='ocrx_word' id='word_1_122' title='bbox 187 735 282 737; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 187 735 189 821">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 187 735 189 821">
+     <span class='ocr_line' id='line_1_48' title="bbox 187 735 189 821; baseline 0 124"><span class='ocrx_word' id='word_1_123' title='bbox 187 735 189 821; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 244 868 260 886">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 244 868 260 886">
+     <span class='ocr_line' id='line_1_49' title="bbox 244 868 260 886; baseline 0 0"><span class='ocrx_word' id='word_1_124' title='bbox 244 868 260 886; x_wconf 94' lang='eng' dir='ltr'><em>A</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 315 715 832 778">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 315 715 832 778">
+     <span class='ocr_line' id='line_1_50' title="bbox 315 715 734 741; baseline 0 -5"><span class='ocrx_word' id='word_1_125' title='bbox 315 726 360 728; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_126' title='bbox 366 718 482 736; x_wconf 86' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 490 718 522 736; x_wconf 74' lang='eng' dir='ltr'><em>et/i</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 529 717 578 736; x_wconf 95' lang='eng' dir='ltr'><em>CFN</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 587 715 624 736; x_wconf 88' lang='eng' dir='ltr'><em>42T</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 633 718 734 741; x_wconf 81' lang='eng' dir='ltr'>(U28916)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 384 753 832 778; baseline 0.002 -5"><span class='ocrx_word' id='word_1_131' title='bbox 384 755 500 774; x_wconf 81' lang='eng' dir='ltr'><em>Rhizobium</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 509 755 575 778; x_wconf 71' lang='eng' dir='ltr'><em>tropic]</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 583 755 650 774; x_wconf 87' lang='eng' dir='ltr'><em>USDA</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 658 753 722 774; x_wconf 80' lang='eng' dir='ltr'><em>9030T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 731 755 832 778; x_wconf 83' lang='eng' dir='ltr'>(U89832)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 280 707 282 766">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 280 707 282 766">
+     <span class='ocr_line' id='line_1_52' title="bbox 280 707 282 766; baseline 0 120"><span class='ocrx_word' id='word_1_136' title='bbox 280 707 282 766; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 282 764 376 766">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 282 764 376 766">
+     <span class='ocr_line' id='line_1_53' title="bbox 282 764 376 766; baseline 0 179"><span class='ocrx_word' id='word_1_137' title='bbox 282 764 376 766; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 188 790 953 854">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 188 790 953 854">
+     <span class='ocr_line' id='line_1_54' title="bbox 188 790 792 841; baseline 0 -30"><span class='ocrx_word' id='word_1_138' title='bbox 188 793 454 841; x_wconf 70' lang='eng' dir='ltr'><em>_|:Rhizobium</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 462 793 550 816; x_wconf 82' lang='eng' dir='ltr'><em>ga/egae</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 559 793 610 811; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 619 790 684 811; x_wconf 80' lang='eng' dir='ltr'><em>6214T</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 692 793 792 816; x_wconf 88' lang='eng' dir='ltr'>(X67226)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 374 828 953 854; baseline 0 -5"><span class='ocrx_word' id='word_1_143' title='bbox 374 830 536 854; x_wconf 80' lang='eng' dir='ltr'><em>Agrobacterium</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 545 830 678 849; x_wconf 76' lang='eng' dir='ltr'><em>tumefaciens</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 687 830 770 849; x_wconf 86' lang='eng' dir='ltr'>NCPPB</span> <span class='ocrx_word' id='word_1_146' title='bbox 779 828 844 849; x_wconf 79' lang='eng' dir='ltr'><em>2437T</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 852 830 953 854; x_wconf 86' lang='eng' dir='ltr'>(D14500)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 262 865 920 930">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 262 865 920 930">
+     <span class='ocr_line' id='line_1_56' title="bbox 262 865 765 891; baseline 0 -5"><span class='ocrx_word' id='word_1_148' title='bbox 262 868 395 886; x_wconf 85' lang='eng' dir='ltr'><em>zorhizobium</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 404 868 536 886; x_wconf 82' lang='eng' dir='ltr'><em>cau/inodans</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 544 868 596 886; x_wconf 87' lang='eng' dir='ltr'><em>ORS</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 605 868 641 886; x_wconf 94' lang='eng'>571</span> <span class='ocrx_word' id='word_1_152' title='bbox 646 865 655 878; x_wconf 57' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_153' title='bbox 664 868 765 891; x_wconf 85' lang='eng' dir='ltr'>(D11342)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 385 904 920 930; baseline 0.002 -6"><span class='ocrx_word' id='word_1_154' title='bbox 385 906 677 930; x_wconf 83' lang='eng' dir='ltr'><em>Bradyrhlzoblumjaponlcum</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 687 906 738 925; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 747 904 812 925; x_wconf 77' lang='eng' dir='ltr'><em>6138T</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 821 906 920 929; x_wconf 85' lang='eng' dir='ltr'>(X66024)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-001.pbm.png
new file mode 100644
index 00000000..db5736fe
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-001.pbm.png.hocr
new file mode 100644
index 00000000..aecb3832
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003327-0-001.pbm.png.hocr
@@ -0,0 +1,411 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003327-0-001.pbm.png"; bbox 0 0 994 1496; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 164 261 200 280">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 164 261 200 280">
+     <span class='ocr_line' id='line_1_1' title="bbox 164 261 200 280; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 164 261 200 280; x_wconf 35' lang='eng'><em>7%</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 157 339 174 340">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 157 339 174 340">
+     <span class='ocr_line' id='line_1_2' title="bbox 157 339 174 340; baseline 0 1156"><span class='ocrx_word' id='word_1_2' title='bbox 157 339 174 340; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 200 216 203 363">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 200 216 203 363">
+     <span class='ocr_line' id='line_1_3' title="bbox 200 216 203 363; baseline 0 1133"><span class='ocrx_word' id='word_1_3' title='bbox 200 216 203 363; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 173 279 174 397">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 173 279 174 397">
+     <span class='ocr_line' id='line_1_4' title="bbox 173 279 174 397; baseline 0 1099"><span class='ocrx_word' id='word_1_4' title='bbox 173 279 174 397; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 157 338 159 434">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 157 338 159 434">
+     <span class='ocr_line' id='line_1_5' title="bbox 157 338 159 434; baseline 0 1062"><span class='ocrx_word' id='word_1_5' title='bbox 157 338 159 434; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 99 408 140 423">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 99 408 140 423">
+     <span class='ocr_line' id='line_1_6' title="bbox 99 408 140 423; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 99 408 140 423; x_wconf 85' lang='eng'>1000</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 66 426 146 428">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 66 426 146 428">
+     <span class='ocr_line' id='line_1_7' title="bbox 66 426 146 428; baseline 0 1068"><span class='ocrx_word' id='word_1_7' title='bbox 66 426 146 428; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 35 474 68 475">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 35 474 68 475">
+     <span class='ocr_line' id='line_1_8' title="bbox 35 474 68 475; baseline 0 1021"><span class='ocrx_word' id='word_1_8' title='bbox 35 474 68 475; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 66 426 68 523">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 66 426 68 523">
+     <span class='ocr_line' id='line_1_9' title="bbox 66 426 68 523; baseline 0 973"><span class='ocrx_word' id='word_1_9' title='bbox 66 426 68 523; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 84 503 115 518">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 84 503 115 518">
+     <span class='ocr_line' id='line_1_10' title="bbox 84 503 115 518; baseline 0 -1"><span class='ocrx_word' id='word_1_10' title='bbox 84 503 115 518; x_wconf 81' lang='eng'><em>784</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 66 521 121 522">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 66 521 121 522">
+     <span class='ocr_line' id='line_1_11' title="bbox 66 521 121 522; baseline 0 974"><span class='ocrx_word' id='word_1_11' title='bbox 66 521 121 522; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 120 503 121 540">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 120 503 121 540">
+     <span class='ocr_line' id='line_1_12' title="bbox 120 503 121 540; baseline 0 956"><span class='ocrx_word' id='word_1_12' title='bbox 120 503 121 540; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 0 533 37 534">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 0 533 37 534">
+     <span class='ocr_line' id='line_1_13' title="bbox 0 533 37 534; baseline 0 962"><span class='ocrx_word' id='word_1_13' title='bbox 0 533 37 534; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 1 533 2 684">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 1 533 2 684">
+     <span class='ocr_line' id='line_1_14' title="bbox 1 533 2 684; baseline 0 812"><span class='ocrx_word' id='word_1_14' title='bbox 1 533 2 684; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 35 474 37 594">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 35 474 37 594">
+     <span class='ocr_line' id='line_1_15' title="bbox 35 474 37 594; baseline 0 902"><span class='ocrx_word' id='word_1_15' title='bbox 35 474 37 594; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 107 575 138 590">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 107 575 138 590">
+     <span class='ocr_line' id='line_1_16' title="bbox 107 575 138 590; baseline -0.032 0"><span class='ocrx_word' id='word_1_16' title='bbox 107 575 138 590; x_wconf 77' lang='eng'><em>994</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 35 592 144 594">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 35 592 144 594">
+     <span class='ocr_line' id='line_1_17' title="bbox 35 592 144 594; baseline 0 902"><span class='ocrx_word' id='word_1_17' title='bbox 35 592 144 594; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 143 384 148 613">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 143 384 148 613">
+     <span class='ocr_line' id='line_1_18' title="bbox 143 384 148 613; baseline 0 883"><span class='ocrx_word' id='word_1_18' title='bbox 143 384 148 613; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 138 690 162 704">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 138 690 162 704">
+     <span class='ocr_line' id='line_1_19' title="bbox 138 690 162 704; baseline 0 0"><span class='ocrx_word' id='word_1_19' title='bbox 138 690 162 704; x_wconf 61' lang='eng'><em>01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 17 755 46 779">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 17 755 46 779">
+     <span class='ocr_line' id='line_1_20' title="bbox 17 755 46 779; baseline 0 0"><span class='ocrx_word' id='word_1_20' title='bbox 17 755 46 779; x_wconf 83' lang='eng' dir='ltr'><em>(b)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 187 1090 218 1105">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 187 1090 218 1105">
+     <span class='ocr_line' id='line_1_21' title="bbox 187 1090 218 1105; baseline 0 0"><span class='ocrx_word' id='word_1_21' title='bbox 187 1090 218 1105; x_wconf 83' lang='eng'>959</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 212 0 912 307">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 212 0 912 307">
+     <span class='ocr_line' id='line_1_22' title="bbox 251 0 894 22; baseline 0 -4"><span class='ocrx_word' id='word_1_22' title='bbox 251 3 282 18; x_wconf 86' lang='eng'><em>767</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 295 1 471 18; x_wconf 81' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 480 1 636 18; x_wconf 80' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 643 0 692 18; x_wconf 89' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_26' title='bbox 702 1 754 18; x_wconf 84' lang='eng'><strong>3297</strong></span> <span class='ocrx_word' id='word_1_27' title='bbox 762 1 894 22; x_wconf 80' lang='eng' dir='ltr'><em>(AM930387)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 247 30 898 58; baseline 0.002 -5"><span class='ocrx_word' id='word_1_28' title='bbox 247 30 279 45; x_wconf 70' lang='eng'><em>993</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 299 36 476 54; x_wconf 87' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 484 36 640 54; x_wconf 82' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 648 36 696 54; x_wconf 87' lang='eng' dir='ltr'><em>STM</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 705 36 758 54; x_wconf 84' lang='eng'><strong>3295</strong></span> <span class='ocrx_word' id='word_1_33' title='bbox 766 36 898 58; x_wconf 85' lang='eng' dir='ltr'><em>(AM930386)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 293 71 892 93; baseline 0 -4"><span class='ocrx_word' id='word_1_34' title='bbox 293 71 469 89; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 477 71 633 89; x_wconf 75' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 641 71 689 89; x_wconf 89' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_37' title='bbox 699 71 752 89; x_wconf 79' lang='eng'><em>3294</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 760 71 892 93; x_wconf 83' lang='eng' dir='ltr'><em>(AM930385)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 257 107 856 129; baseline 0.002 -5"><span class='ocrx_word' id='word_1_39' title='bbox 257 107 433 125; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 441 107 597 125; x_wconf 83' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 605 107 653 125; x_wconf 87' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_42' title='bbox 663 107 715 125; x_wconf 79' lang='eng'><strong>3292</strong></span> <span class='ocrx_word' id='word_1_43' title='bbox 723 107 856 129; x_wconf 85' lang='eng' dir='ltr'><em>(AM930383)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 212 142 866 164; baseline 0 -4"><span class='ocrx_word' id='word_1_44' title='bbox 212 159 218 161; x_wconf 61' lang='eng'><strong><em>,</em></strong></span> <span class='ocrx_word' id='word_1_45' title='bbox 267 142 443 160; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 451 142 607 160; x_wconf 85' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 615 142 664 160; x_wconf 91' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_48' title='bbox 673 142 725 160; x_wconf 86' lang='eng'><strong>3293</strong></span> <span class='ocrx_word' id='word_1_49' title='bbox 734 142 866 164; x_wconf 87' lang='eng' dir='ltr'><em>(AM930384)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 306 178 912 200; baseline 0.002 -5"><span class='ocrx_word' id='word_1_50' title='bbox 306 178 482 196; x_wconf 87' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 490 178 646 196; x_wconf 86' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 654 178 702 196; x_wconf 86' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_53' title='bbox 712 178 774 196; x_wconf 73' lang='eng' dir='ltr'><em>2683T</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 780 178 912 200; x_wconf 83' lang='eng' dir='ltr'><em>(AM930382)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 219 213 879 236; baseline 0 -5"><span class='ocrx_word' id='word_1_55' title='bbox 219 218 285 219; x_wconf 98' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 291 214 453 231; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 462 214 604 231; x_wconf 82' lang='eng' dir='ltr'><em>tianshanense</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 613 213 679 231; x_wconf 84' lang='eng' dir='ltr'><em>USDA</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 687 213 748 231; x_wconf 82' lang='eng' dir='ltr'><em>3592T</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 757 214 879 236; x_wconf 86' lang='eng' dir='ltr'><em>(AJ294368)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 216 249 899 271; baseline 0.001 -5"><span class='ocrx_word' id='word_1_61' title='bbox 216 253 285 254; x_wconf 98' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 292 249 454 267; x_wconf 77' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 463 249 624 267; x_wconf 81' lang='eng' dir='ltr'><em>mediterraneum</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 633 249 698 267; x_wconf 84' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_65' title='bbox 707 249 769 267; x_wconf 76' lang='eng' dir='ltr'><em>3392T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 777 249 899 271; x_wconf 84' lang='eng' dir='ltr'><em>(AJ294369)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 283 284 782 307; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 283 284 445 302; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 453 284 510 302; x_wconf 74' lang='eng' dir='ltr'><em>ciceri</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 518 284 583 302; x_wconf 86' lang='eng' dir='ltr'><em>USDA</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 592 284 653 302; x_wconf 84' lang='eng' dir='ltr'><em>3383T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 660 284 782 307; x_wconf 84' lang='eng' dir='ltr'><em>(AJ294367)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 216 101 221 291">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 216 101 221 291">
+     <span class='ocr_line' id='line_1_31' title="bbox 216 101 221 291; baseline 0 1205"><span class='ocrx_word' id='word_1_72' title='bbox 216 101 221 291; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 217 289 277 291">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 217 289 277 291">
+     <span class='ocr_line' id='line_1_32' title="bbox 217 289 277 291; baseline 0 1205"><span class='ocrx_word' id='word_1_73' title='bbox 217 289 277 291; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 201 320 866 378">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 201 320 866 378">
+     <span class='ocr_line' id='line_1_33' title="bbox 201 320 821 342; baseline 0 -4"><span class='ocrx_word' id='word_1_74' title='bbox 201 325 292 326; x_wconf 98' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 300 321 462 338; x_wconf 71' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 470 321 548 338; x_wconf 73' lang='eng' dir='ltr'><em>huakuf/</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 555 320 620 338; x_wconf 86' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_78' title='bbox 628 320 691 338; x_wconf 76' lang='eng' dir='ltr'><em>4779T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 699 321 821 342; x_wconf 83' lang='eng' dir='ltr'><em>(AJ294370)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 203 356 866 378; baseline 0 -5"><span class='ocrx_word' id='word_1_80' title='bbox 203 361 297 363; x_wconf 89' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 305 356 467 374; x_wconf 82' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 476 356 583 378; x_wconf 81' lang='eng' dir='ltr'><em>amorphae</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 592 356 650 374; x_wconf 88' lang='eng' dir='ltr'><em>ICMP</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 660 356 734 374; x_wconf 79' lang='eng' dir='ltr'><em>15022T</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 740 356 866 378; x_wconf 84' lang='eng' dir='ltr'><em>(AY494816)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 258 391 992 699">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 265 391 992 520">
+     <span class='ocr_line' id='line_1_35' title="bbox 278 391 751 414; baseline 0 -5"><span class='ocrx_word' id='word_1_86' title='bbox 278 392 440 409; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 448 392 480 409; x_wconf 80' lang='eng' dir='ltr'><em>Ioti</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 487 392 552 409; x_wconf 88' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_89' title='bbox 561 391 623 409; x_wconf 75' lang='eng' dir='ltr'><em>3471T</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 629 392 751 414; x_wconf 79' lang='eng' dir='ltr'><em>(AJ294371)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 265 427 833 449; baseline 0 -5"><span class='ocrx_word' id='word_1_91' title='bbox 265 427 427 445; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 435 427 547 449; x_wconf 82' lang='eng' dir='ltr'><em>plurifarium</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 557 427 614 445; x_wconf 88' lang='eng' dir='ltr'><em>ICMP</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 624 427 698 445; x_wconf 76' lang='eng' dir='ltr'><em>1364GT</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 707 427 833 449; x_wconf 85' lang='eng' dir='ltr'><em>(AY494824)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 358 462 930 484; baseline 0 -4"><span class='ocrx_word' id='word_1_96' title='bbox 358 463 520 480; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 529 463 644 480; x_wconf 80' lang='eng' dir='ltr'><em>chacoense</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 654 462 711 480; x_wconf 86' lang='eng' dir='ltr'><em>ICMP</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 721 462 795 480; x_wconf 65' lang='eng' dir='ltr'><em>14,587T</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 804 463 930 484; x_wconf 85' lang='eng' dir='ltr'><em>(AY494825)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 407 498 992 520; baseline -0.002 -4"><span class='ocrx_word' id='word_1_101' title='bbox 407 498 564 520; x_wconf 82' lang='eng' dir='ltr'><em>Agrobacterium</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 572 498 701 516; x_wconf 84' lang='eng' dir='ltr'><em>tumefaciens</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 710 498 791 516; x_wconf 88' lang='eng' dir='ltr'>NCPPB</span> <span class='ocrx_word' id='word_1_104' title='bbox 800 498 862 516; x_wconf 76' lang='eng' dir='ltr'><em>2437T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 870 498 992 520; x_wconf 83' lang='eng' dir='ltr'><em>(AJ294377)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 335 533 971 591">
+     <span class='ocr_line' id='line_1_39' title="bbox 341 533 971 556; baseline 0 -5"><span class='ocrx_word' id='word_1_106' title='bbox 341 534 512 556; x_wconf 82' lang='eng' dir='ltr'><em>Phyllobacterium</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 520 534 684 556; x_wconf 85' lang='eng' dir='ltr'><em>myrsinacearum</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 691 534 756 551; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 764 533 841 551; x_wconf 81' lang='eng' dir='ltr'><em>43590T</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 849 534 971 556; x_wconf 84' lang='eng' dir='ltr'><em>(AJ294365)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 335 569 844 591; baseline 0 -4"><span class='ocrx_word' id='word_1_111' title='bbox 335 569 486 587; x_wconf 84' lang='eng' dir='ltr'><em>Sinorhizob/‘um</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 495 569 570 587; x_wconf 77' lang='eng' dir='ltr'><em>meliloti</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 578 569 643 587; x_wconf 89' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_114' title='bbox 653 569 713 587; x_wconf 88' lang='eng' dir='ltr'><em>1002T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 722 569 844 591; x_wconf 84' lang='eng' dir='ltr'><em>(AJ294382)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 258 605 741 627">
+     <span class='ocr_line' id='line_1_41' title="bbox 258 605 741 627; baseline 0 -5"><span class='ocrx_word' id='word_1_116' title='bbox 258 605 409 623; x_wconf 83' lang='eng' dir='ltr'><em>Sinorhizobium</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 418 605 481 623; x_wconf 85' lang='eng' dir='ltr'><em>saheli</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 489 605 562 622; x_wconf 91' lang='eng' dir='ltr'>HAMBI</span> <span class='ocrx_word' id='word_1_119' title='bbox 571 605 610 622; x_wconf 88' lang='eng'><strong>217</strong></span> <span class='ocrx_word' id='word_1_120' title='bbox 619 605 741 627; x_wconf 83' lang='eng' dir='ltr'>(AJ294380)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 265 640 823 662">
+     <span class='ocr_line' id='line_1_42' title="bbox 265 640 823 662; baseline 0 -4"><span class='ocrx_word' id='word_1_121' title='bbox 265 641 411 658; x_wconf 73' lang='eng' dir='ltr'><em>Azorhizob/‘um</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 420 641 548 658; x_wconf 79' lang='eng' dir='ltr'><em>caulinodans</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 557 640 622 658; x_wconf 85' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_124' title='bbox 630 640 693 658; x_wconf 78' lang='eng' dir='ltr'><em>4892T</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 701 641 823 662; x_wconf 80' lang='eng' dir='ltr'><em>(AJ294363)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 290 676 852 699">
+     <span class='ocr_line' id='line_1_43' title="bbox 290 676 852 699; baseline 0 -5"><span class='ocrx_word' id='word_1_126' title='bbox 290 676 457 699; x_wconf 74' lang='eng' dir='ltr'><em>Bradyrhizobium</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 462 676 575 699; x_wconf 82' lang='eng' dir='ltr'><em>japonicum</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 584 676 634 694; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_129' title='bbox 644 676 852 698; x_wconf 65' lang='eng' dir='ltr'><em>30131T(AY591555)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 225 752 899 1109">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 225 752 899 1109">
+     <span class='ocr_line' id='line_1_44' title="bbox 243 752 896 774; baseline 0 -5"><span class='ocrx_word' id='word_1_130' title='bbox 243 757 285 772; x_wconf 84' lang='eng'>1000</span> <span class='ocrx_word' id='word_1_131' title='bbox 297 752 474 769; x_wconf 87' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 481 752 638 769; x_wconf 77' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 645 752 694 769; x_wconf 88' lang='eng' dir='ltr'><em>STM</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 704 752 756 769; x_wconf 84' lang='eng'><em>3297</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 764 752 896 774; x_wconf 81' lang='eng' dir='ltr'><em>(AM930389)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 235 789 894 811; baseline 0.002 -5"><span class='ocrx_word' id='word_1_136' title='bbox 235 796 266 811; x_wconf 76' lang='eng'><em>753</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 295 789 471 807; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 479 789 635 807; x_wconf 82' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 643 789 691 807; x_wconf 87' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_140' title='bbox 701 789 754 807; x_wconf 81' lang='eng'><strong>3294</strong></span> <span class='ocrx_word' id='word_1_141' title='bbox 762 789 894 811; x_wconf 82' lang='eng' dir='ltr'><em>(AM930393)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 296 826 895 848; baseline 0.002 -5"><span class='ocrx_word' id='word_1_142' title='bbox 296 826 472 844; x_wconf 87' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 480 826 636 844; x_wconf 84' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 644 826 692 844; x_wconf 90' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_145' title='bbox 702 826 754 844; x_wconf 81' lang='eng'><strong>3292</strong></span> <span class='ocrx_word' id='word_1_146' title='bbox 763 826 895 848; x_wconf 81' lang='eng' dir='ltr'><em>(AM930392)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 286 863 885 885; baseline 0 -4"><span class='ocrx_word' id='word_1_147' title='bbox 286 864 462 881; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizabium</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 470 864 626 881; x_wconf 78' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 634 863 682 881; x_wconf 87' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_150' title='bbox 692 864 744 881; x_wconf 83' lang='eng'><em>3293</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 753 864 885 885; x_wconf 84' lang='eng' dir='ltr'><em>(AM930390)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 225 901 882 923; baseline -0.002 -3"><span class='ocrx_word' id='word_1_152' title='bbox 225 906 257 920; x_wconf 80' lang='eng'><em>840</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 282 901 459 919; x_wconf 85' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 467 901 623 919; x_wconf 79' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 631 901 679 919; x_wconf 87' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_156' title='bbox 689 901 741 919; x_wconf 81' lang='eng'><em>3310</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 749 901 882 923; x_wconf 80' lang='eng' dir='ltr'><em>(AM930391)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 277 938 883 960; baseline 0 -4"><span class='ocrx_word' id='word_1_158' title='bbox 277 938 453 956; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 461 938 617 956; x_wconf 82' lang='eng' dir='ltr'><em>metallidurans</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 625 938 674 956; x_wconf 90' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_161' title='bbox 684 938 745 956; x_wconf 65' lang='eng' dir='ltr'><em>2683Y</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 751 938 883 960; x_wconf 82' lang='eng' dir='ltr'><em>(AM930388)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 318 975 864 998; baseline 0 -5"><span class='ocrx_word' id='word_1_163' title='bbox 318 976 480 993; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 488 975 600 998; x_wconf 73' lang='eng' dir='ltr'><em>plurifar/um</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 609 975 658 993; x_wconf 88' lang='eng' dir='ltr'>ORS</span> <span class='ocrx_word' id='word_1_166' title='bbox 669 975 730 993; x_wconf 82' lang='eng' dir='ltr'><em>1032T</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 738 976 864 998; x_wconf 84' lang='eng' dir='ltr'><em>(AY785350)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 251 1012 899 1035; baseline 0 -5"><span class='ocrx_word' id='word_1_168' title='bbox 251 1017 285 1019; x_wconf 86' lang='eng'>—</span> <span class='ocrx_word' id='word_1_169' title='bbox 292 1013 454 1030; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 463 1013 624 1030; x_wconf 75' lang='eng' dir='ltr'><em>mediterraneum</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 633 1013 698 1030; x_wconf 90' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_172' title='bbox 707 1012 768 1030; x_wconf 71' lang='eng' dir='ltr'><em>3392T</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 777 1013 899 1035; x_wconf 83' lang='eng' dir='ltr'><em>(AJ294391)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 245 1050 858 1072; baseline 0.002 -5"><span class='ocrx_word' id='word_1_174' title='bbox 245 1055 265 1056; x_wconf 49' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 272 1050 434 1068; x_wconf 82' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 443 1050 586 1068; x_wconf 75' lang='eng' dir='ltr'><em>lianshanense</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 595 1050 660 1068; x_wconf 85' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_178' title='bbox 668 1050 730 1068; x_wconf 79' lang='eng' dir='ltr'><em>3592T</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 736 1050 858 1072; x_wconf 82' lang='eng' dir='ltr'><em>(AJ294392)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 297 1087 818 1109; baseline 0 -5"><span class='ocrx_word' id='word_1_180' title='bbox 297 1087 459 1105; x_wconf 83' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 467 1087 544 1105; x_wconf 77' lang='eng' dir='ltr'><em>huakuii</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 552 1087 617 1105; x_wconf 86' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_183' title='bbox 624 1087 688 1105; x_wconf 78' lang='eng' dir='ltr'><em>4779T</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 696 1087 818 1109; x_wconf 83' lang='eng' dir='ltr'><em>(AJ294394)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 256 822 315 986">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 256 822 315 986">
+     <span class='ocr_line' id='line_1_54' title="bbox 256 822 294 859; baseline 0 -7"><span class='ocrx_word' id='word_1_185' title='bbox 256 822 294 859; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 256 859 285 890; baseline 0 606"><span class='ocrx_word' id='word_1_186' title='bbox 256 859 285 890; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 256 934 315 986; baseline 0 0"><span class='ocrx_word' id='word_1_187' title='bbox 256 934 315 986; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 209 994 240 1008">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 209 994 240 1008">
+     <span class='ocr_line' id='line_1_57' title="bbox 209 994 240 1008; baseline 0 0"><span class='ocrx_word' id='word_1_188' title='bbox 209 994 240 1008; x_wconf 89' lang='eng'><em>770</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 225 1013 245 1014">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 225 1013 245 1014">
+     <span class='ocr_line' id='line_1_58' title="bbox 225 1013 245 1014; baseline 0 482"><span class='ocrx_word' id='word_1_189' title='bbox 225 1013 245 1014; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 244 971 245 1057">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 244 971 245 1057">
+     <span class='ocr_line' id='line_1_59' title="bbox 244 971 245 1057; baseline 0 439"><span class='ocrx_word' id='word_1_190' title='bbox 244 971 245 1057; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 150 1109 226 1111">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 150 1109 226 1111">
+     <span class='ocr_line' id='line_1_60' title="bbox 150 1109 226 1111; baseline 0 385"><span class='ocrx_word' id='word_1_191' title='bbox 150 1109 226 1111; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 110 1217 141 1231">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 110 1217 141 1231">
+     <span class='ocr_line' id='line_1_61' title="bbox 110 1217 141 1231; baseline 0 0"><span class='ocrx_word' id='word_1_192' title='bbox 110 1217 141 1231; x_wconf 82' lang='eng'><em>728</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 4 1234 151 1236">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 4 1234 151 1236">
+     <span class='ocr_line' id='line_1_62' title="bbox 4 1234 151 1236; baseline 0 260"><span class='ocrx_word' id='word_1_193' title='bbox 4 1234 151 1236; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 4 1234 5 1467">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 4 1234 5 1467">
+     <span class='ocr_line' id='line_1_63' title="bbox 4 1234 5 1467; baseline 0 29"><span class='ocrx_word' id='word_1_194' title='bbox 4 1234 5 1467; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 150 1109 151 1360">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 150 1109 151 1360">
+     <span class='ocr_line' id='line_1_64' title="bbox 150 1109 151 1360; baseline 0 136"><span class='ocrx_word' id='word_1_195' title='bbox 150 1109 151 1360; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 191 1339 222 1354">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 191 1339 222 1354">
+     <span class='ocr_line' id='line_1_65' title="bbox 191 1339 222 1354; baseline 0 0"><span class='ocrx_word' id='word_1_196' title='bbox 191 1339 222 1354; x_wconf 59' lang='eng'><em>812</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 261 1124 901 1333">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 297 1124 901 1222">
+     <span class='ocr_line' id='line_1_66' title="bbox 352 1124 901 1147; baseline 0 -5"><span class='ocrx_word' id='word_1_197' title='bbox 352 1125 514 1142; x_wconf 84' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 523 1125 638 1142; x_wconf 76' lang='eng' dir='ltr'><em>chacoense</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 646 1125 694 1142; x_wconf 91' lang='eng' dir='ltr'><em>STM</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 704 1124 766 1142; x_wconf 89' lang='eng' dir='ltr'><em>2154T</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 775 1125 901 1147; x_wconf 82' lang='eng' dir='ltr'><em>(AY785351)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 299 1161 800 1184; baseline 0 -5"><span class='ocrx_word' id='word_1_202' title='bbox 299 1162 461 1179; x_wconf 81' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_203' title='bbox 469 1162 526 1179; x_wconf 73' lang='eng' dir='ltr'><em>ciceri</em></span> <span class='ocrx_word' id='word_1_204' title='bbox 534 1161 599 1179; x_wconf 86' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_205' title='bbox 607 1161 669 1179; x_wconf 78' lang='eng' dir='ltr'><em>3383T</em></span> <span class='ocrx_word' id='word_1_206' title='bbox 678 1162 800 1184; x_wconf 81' lang='eng' dir='ltr'><em>(AJ294395)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_68' title="bbox 297 1199 824 1222; baseline 0 -5"><span class='ocrx_word' id='word_1_207' title='bbox 297 1199 459 1217; x_wconf 76' lang='eng' dir='ltr'><em>Mesorh/zobium</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 467 1199 575 1222; x_wconf 74' lang='eng' dir='ltr'><em>amorphae</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 583 1199 631 1217; x_wconf 92' lang='eng' dir='ltr'>STM</span> <span class='ocrx_word' id='word_1_210' title='bbox 641 1199 689 1217; x_wconf 83' lang='eng' dir='ltr'><em>291T</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 697 1199 824 1222; x_wconf 85' lang='eng' dir='ltr'><em>(AY785352)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 261 1236 872 1333">
+     <span class='ocr_line' id='line_1_69' title="bbox 261 1236 733 1259; baseline 0 -5"><span class='ocrx_word' id='word_1_212' title='bbox 261 1237 423 1254; x_wconf 70' lang='eng' dir='ltr'><em>Mesorhizobium</em></span> <span class='ocrx_word' id='word_1_213' title='bbox 431 1237 462 1254; x_wconf 81' lang='eng' dir='ltr'><em>Ioti</em></span> <span class='ocrx_word' id='word_1_214' title='bbox 470 1236 535 1254; x_wconf 87' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_215' title='bbox 544 1236 606 1254; x_wconf 86' lang='eng' dir='ltr'><em>3471T</em></span> <span class='ocrx_word' id='word_1_216' title='bbox 612 1237 733 1259; x_wconf 82' lang='eng' dir='ltr'><em>(AJ294393)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_70' title="bbox 363 1273 872 1296; baseline 0 -5"><span class='ocrx_word' id='word_1_217' title='bbox 363 1274 515 1291; x_wconf 84' lang='eng' dir='ltr'><em>Sinorhizobium</em></span> <span class='ocrx_word' id='word_1_218' title='bbox 523 1274 599 1291; x_wconf 77' lang='eng' dir='ltr'><em>me/i/oti</em></span> <span class='ocrx_word' id='word_1_219' title='bbox 606 1274 671 1291; x_wconf 87' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_220' title='bbox 681 1273 742 1291; x_wconf 88' lang='eng' dir='ltr'><em>1002T</em></span> <span class='ocrx_word' id='word_1_221' title='bbox 750 1274 872 1296; x_wconf 86' lang='eng' dir='ltr'><em>(AJ294400)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 280 1311 794 1333; baseline 0 -5"><span class='ocrx_word' id='word_1_222' title='bbox 280 1316 303 1317; x_wconf 62' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_223' title='bbox 310 1311 462 1329; x_wconf 84' lang='eng' dir='ltr'><em>Sinorhizobium</em></span> <span class='ocrx_word' id='word_1_224' title='bbox 470 1311 534 1329; x_wconf 86' lang='eng' dir='ltr'><em>saheli</em></span> <span class='ocrx_word' id='word_1_225' title='bbox 542 1311 614 1328; x_wconf 92' lang='eng' dir='ltr'>HAMBI</span> <span class='ocrx_word' id='word_1_226' title='bbox 624 1311 662 1328; x_wconf 91' lang='eng'><strong>217</strong></span> <span class='ocrx_word' id='word_1_227' title='bbox 672 1311 794 1333; x_wconf 78' lang='eng' dir='ltr'><em>(AJ294399)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 225 1013 226 1208">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 225 1013 226 1208">
+     <span class='ocr_line' id='line_1_72' title="bbox 225 1013 226 1208; baseline 0 288"><span class='ocrx_word' id='word_1_228' title='bbox 225 1013 226 1208; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 220 1214 252 1229">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 220 1214 252 1229">
+     <span class='ocr_line' id='line_1_73' title="bbox 220 1214 252 1229; baseline 0 0"><span class='ocrx_word' id='word_1_229' title='bbox 220 1214 252 1229; x_wconf 59' lang='eng'><em>810</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 280 1279 356 1280">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 280 1279 356 1280">
+     <span class='ocr_line' id='line_1_74' title="bbox 280 1279 356 1280; baseline 0 216"><span class='ocrx_word' id='word_1_230' title='bbox 280 1279 356 1280; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 244 1280 275 1294">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 244 1280 275 1294">
+     <span class='ocr_line' id='line_1_75' title="bbox 244 1280 275 1294; baseline 0 0"><span class='ocrx_word' id='word_1_231' title='bbox 244 1280 275 1294; x_wconf 80' lang='eng'>859</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 279 1279 280 1317">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 279 1279 280 1317">
+     <span class='ocr_line' id='line_1_76' title="bbox 279 1279 280 1317; baseline 0 179"><span class='ocrx_word' id='word_1_232' title='bbox 279 1279 280 1317; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 246 1298 280 1299">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 246 1298 280 1299">
+     <span class='ocr_line' id='line_1_77' title="bbox 246 1298 280 1299; baseline 0 197"><span class='ocrx_word' id='word_1_233' title='bbox 246 1298 280 1299; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 228 1325 247 1326">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 228 1325 247 1326">
+     <span class='ocr_line' id='line_1_78' title="bbox 228 1325 247 1326; baseline 0 170"><span class='ocrx_word' id='word_1_234' title='bbox 228 1325 247 1326; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 246 1298 247 1355">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 246 1298 247 1355">
+     <span class='ocr_line' id='line_1_79' title="bbox 246 1298 247 1355; baseline 0 141"><span class='ocrx_word' id='word_1_235' title='bbox 246 1298 247 1355; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 150 1358 230 1360">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 150 1358 230 1360">
+     <span class='ocr_line' id='line_1_80' title="bbox 150 1358 230 1360; baseline 0 136"><span class='ocrx_word' id='word_1_236' title='bbox 150 1358 230 1360; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 247 1348 994 1408">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 247 1348 994 1408">
+     <span class='ocr_line' id='line_1_81' title="bbox 247 1348 906 1370; baseline 0 -4"><span class='ocrx_word' id='word_1_237' title='bbox 247 1353 343 1355; x_wconf 84' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_238' title='bbox 348 1348 505 1370; x_wconf 75' lang='eng' dir='ltr'><em>Agmbacterium</em></span> <span class='ocrx_word' id='word_1_239' title='bbox 514 1348 643 1366; x_wconf 81' lang='eng' dir='ltr'><em>tumefaciens</em></span> <span class='ocrx_word' id='word_1_240' title='bbox 651 1348 700 1366; x_wconf 88' lang='eng' dir='ltr'><em>ORS</em></span> <span class='ocrx_word' id='word_1_241' title='bbox 711 1348 758 1366; x_wconf 88' lang='eng'><em>1351</em></span> <span class='ocrx_word' id='word_1_242' title='bbox 763 1348 772 1359; x_wconf 62' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_243' title='bbox 780 1348 906 1370; x_wconf 88' lang='eng' dir='ltr'><em>(AY785348)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_82' title="bbox 364 1385 994 1408; baseline 0 -5"><span class='ocrx_word' id='word_1_244' title='bbox 364 1386 535 1408; x_wconf 79' lang='eng' dir='ltr'><em>Phyllobacterium</em></span> <span class='ocrx_word' id='word_1_245' title='bbox 543 1386 706 1408; x_wconf 81' lang='eng' dir='ltr'><em>myrsinacearum</em></span> <span class='ocrx_word' id='word_1_246' title='bbox 714 1385 779 1403; x_wconf 79' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_247' title='bbox 787 1385 864 1403; x_wconf 81' lang='eng' dir='ltr'><em>43590T</em></span> <span class='ocrx_word' id='word_1_248' title='bbox 872 1386 994 1408; x_wconf 85' lang='eng' dir='ltr'><em>(AJ294387)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 228 1013 230 1393">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 228 1013 230 1393">
+     <span class='ocr_line' id='line_1_83' title="bbox 228 1013 230 1393; baseline 0 103"><span class='ocrx_word' id='word_1_249' title='bbox 228 1013 230 1393; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 190 1422 708 1445">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 190 1422 708 1445">
+     <span class='ocr_line' id='line_1_84' title="bbox 190 1422 708 1445; baseline 0 -5"><span class='ocrx_word' id='word_1_250' title='bbox 190 1423 356 1445; x_wconf 85' lang='eng' dir='ltr'><em>Bradyrhizobium</em></span> <span class='ocrx_word' id='word_1_251' title='bbox 361 1423 474 1445; x_wconf 84' lang='eng' dir='ltr'><em>japonicum</em></span> <span class='ocrx_word' id='word_1_252' title='bbox 483 1423 548 1440; x_wconf 91' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_253' title='bbox 556 1422 578 1440; x_wconf 87' lang='eng' dir='ltr'><em>6T</em></span> <span class='ocrx_word' id='word_1_254' title='bbox 587 1423 708 1445; x_wconf 84' lang='eng' dir='ltr'><em>(AJ294388)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 4 1465 146 1496">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 39 1476 62 1490">
+     <span class='ocr_line' id='line_1_85' title="bbox 39 1476 62 1490; baseline 0 0"><span class='ocrx_word' id='word_1_255' title='bbox 39 1476 62 1490; x_wconf 89' lang='eng'><em>0.1</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 150 1460 708 1482">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 150 1460 708 1482">
+     <span class='ocr_line' id='line_1_86' title="bbox 150 1460 708 1482; baseline 0.002 -5"><span class='ocrx_word' id='word_1_256' title='bbox 150 1460 297 1478; x_wconf 83' lang='eng' dir='ltr'><em>Azorhizobium</em></span> <span class='ocrx_word' id='word_1_257' title='bbox 305 1460 433 1478; x_wconf 82' lang='eng' dir='ltr'><em>cau/inodans</em></span> <span class='ocrx_word' id='word_1_258' title='bbox 442 1460 507 1478; x_wconf 85' lang='eng' dir='ltr'>USDA</span> <span class='ocrx_word' id='word_1_259' title='bbox 515 1460 578 1478; x_wconf 84' lang='eng' dir='ltr'><em>4892T</em></span> <span class='ocrx_word' id='word_1_260' title='bbox 586 1460 708 1482; x_wconf 83' lang='eng' dir='ltr'><em>(AJ294389)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003368-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003368-0-000.pbm.png
new file mode 100644
index 00000000..2db7920d
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003368-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003368-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003368-0-000.pbm.png.hocr
new file mode 100644
index 00000000..52175170
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003368-0-000.pbm.png.hocr
@@ -0,0 +1,113 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003368-0-000.pbm.png"; bbox 0 0 994 804; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 62 0 993 803">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 100 2 593 28">
+     <span class='ocr_line' id='line_1_1' title="bbox 100 2 593 28; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 100 2 255 23; x_wconf 90' lang='eng' dir='ltr'><em>Burkholderia</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 264 2 357 28; x_wconf 86' lang='eng' dir='ltr'><em>cepacia</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 367 2 436 23; x_wconf 85' lang='eng' dir='ltr'><em>B7aM</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 447 2 593 28; x_wconf 85' lang='eng' dir='ltr'><em>(AB164394)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 62 47 837 174">
+     <span class='ocr_line' id='line_1_2' title="bbox 62 47 837 78; baseline 0 -5"><span class='ocrx_word' id='word_1_5' title='bbox 62 56 104 77; x_wconf 89' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 228 53 366 73; x_wconf 83' lang='eng' dir='ltr'><em>Pe/omonas</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 375 53 545 78; x_wconf 80' lang='eng' dir='ltr'><em>saccharophi/a</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 556 52 613 73; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 624 47 681 73; x_wconf 87' lang='eng' dir='ltr'><em>654T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 691 52 837 78; x_wconf 80' lang='eng' dir='ltr'><em>(ABOZ1407)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 229 98 777 124; baseline 0 -5"><span class='ocrx_word' id='word_1_11' title='bbox 229 98 366 119; x_wconf 84' lang='eng' dir='ltr'><em>Roseate/es</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 375 98 549 124; x_wconf 83' lang='eng' dir='ltr'><em>depolymerans</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 558 98 582 119; x_wconf 84' lang='eng'>61</span> <span class='ocrx_word' id='word_1_14' title='bbox 589 98 620 118; x_wconf 92' lang='eng' dir='ltr'><em>B2</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 631 98 777 124; x_wconf 86' lang='eng' dir='ltr'><em>(AB003625)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 280 142 723 174; baseline 0 -6"><span class='ocrx_word' id='word_1_16' title='bbox 280 148 401 173; x_wconf 80' lang='eng' dir='ltr'><em>Leptothrix</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 410 148 495 168; x_wconf 89' lang='eng' dir='ltr'><em>mobilis</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 506 142 602 168; x_wconf 91' lang='eng' dir='ltr'><em>Feox-1T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 612 147 723 174; x_wconf 84' lang='eng' dir='ltr'><em>(X97071)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 220 193 752 273">
+     <span class='ocr_line' id='line_1_5' title="bbox 223 193 723 219; baseline 0 -5"><span class='ocrx_word' id='word_1_20' title='bbox 223 194 345 219; x_wconf 77' lang='eng' dir='ltr'><em>Leptothrix</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 354 194 463 214; x_wconf 87' lang='eng' dir='ltr'><em>cholodnii</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 471 193 531 214; x_wconf 81' lang='eng' dir='ltr'><em>COM</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 544 194 601 214; x_wconf 88' lang='eng'><em>1827</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 612 193 723 219; x_wconf 86' lang='eng' dir='ltr'><em>(X97070)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 220 242 752 273; baseline 0.002 -6"><span class='ocrx_word' id='word_1_25' title='bbox 220 247 422 273; x_wconf 86' lang='eng' dir='ltr'><em>Azohydromonas</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 430 247 473 268; x_wconf 82' lang='eng' dir='ltr'><em>lata</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 484 247 529 267; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 542 242 629 268; x_wconf 81' lang='eng' dir='ltr'><em>12599T</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 638 247 752 273; x_wconf 88' lang='eng' dir='ltr'><em>(D88007)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 225 296 907 468">
+     <span class='ocr_line' id='line_1_7' title="bbox 308 296 817 324; baseline 0.002 -7"><span class='ocrx_word' id='word_1_30' title='bbox 308 296 437 317; x_wconf 83' lang='eng' dir='ltr'><em>Rubrivivax</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 445 297 585 323; x_wconf 82' lang='eng' dir='ltr'><em>gelatinosus</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 595 297 661 318; x_wconf 93' lang='eng' dir='ltr'><em>|L144</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 671 298 817 324; x_wconf 88' lang='eng' dir='ltr'><em>(ABO16167)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 370 341 907 372; baseline 0.002 -6"><span class='ocrx_word' id='word_1_34' title='bbox 370 346 498 367; x_wconf 86' lang='eng' dir='ltr'><em>Rubrivivax</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 507 346 688 372; x_wconf 78' lang='eng' dir='ltr'><em>benzoati/yticus</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 696 341 756 367; x_wconf 77' lang='eng' dir='ltr'><em>JA2T</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 766 346 907 372; x_wconf 86' lang='eng' dir='ltr'><em>(AJ888903)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 225 388 842 418; baseline 0.002 -6"><span class='ocrx_word' id='word_1_38' title='bbox 225 388 254 409; x_wconf 81' lang='eng'><em>69</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 370 392 505 413; x_wconf 81' lang='eng' dir='ltr'><em>‘Rubrivivax</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 513 392 625 413; x_wconf 78' lang='eng' dir='ltr'><em>indolicus’</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 635 392 690 413; x_wconf 91' lang='eng' dir='ltr'>OU5</span> <span class='ocrx_word' id='word_1_42' title='bbox 700 392 842 418; x_wconf 84' lang='eng' dir='ltr'><em>(AJ620346)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 251 441 793 468; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 251 442 373 467; x_wconf 84' lang='eng' dir='ltr'><em>Aquinco/a</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 383 442 564 462; x_wconf 78' lang='eng' dir='ltr'><em>tertiaricarbonis</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 573 442 632 462; x_wconf 88' lang='eng' dir='ltr'><em>L108</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 643 441 793 468; x_wconf 83' lang='eng' dir='ltr'><em>(DQ436455)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 257 487 543 513">
+     <span class='ocr_line' id='line_1_11' title="bbox 257 487 543 513; baseline 0 -5"><span class='ocrx_word' id='word_1_47' title='bbox 257 487 317 508; x_wconf 88' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 329 488 387 508; x_wconf 92' lang='eng'><em>1005</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 397 487 543 513; x_wconf 80' lang='eng' dir='ltr'><em>(ABZ71046)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 311 532 628 563">
+     <span class='ocr_line' id='line_1_12' title="bbox 311 532 628 563; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 311 537 387 557; x_wconf 88' lang='eng' dir='ltr'><em>Strain</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 399 532 471 557; x_wconf 90' lang='eng' dir='ltr'><em>1a22T</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 480 537 628 563; x_wconf 89' lang='eng' dir='ltr'><em>(EU542576)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 278 583 568 610">
+     <span class='ocr_line' id='line_1_13' title="bbox 278 583 568 610; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 278 583 407 604; x_wconf 88' lang='eng' dir='ltr'><em>|MCC1722</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 418 583 568 610; x_wconf 87' lang='eng' dir='ltr'><em>(DQ664241)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 413 633 993 710">
+     <span class='ocr_line' id='line_1_14' title="bbox 413 633 993 664; baseline 0 -6"><span class='ocrx_word' id='word_1_55' title='bbox 413 638 523 658; x_wconf 81' lang='eng' dir='ltr'><em>Ideone/la</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 533 638 691 658; x_wconf 80' lang='eng' dir='ltr'><em>dechloratans</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 699 638 773 658; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 783 633 872 658; x_wconf 82' lang='eng' dir='ltr'><em>51718T</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 881 638 993 664; x_wconf 89' lang='eng' dir='ltr'><em>(X72724)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 483 683 701 710; baseline 0 -6"><span class='ocrx_word' id='word_1_60' title='bbox 483 684 541 704; x_wconf 79' lang='eng'>8511</span> <span class='ocrx_word' id='word_1_61' title='bbox 555 683 701 710; x_wconf 85' lang='eng' dir='ltr'><em>(AB049106)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 518 729 735 755">
+     <span class='ocr_line' id='line_1_16' title="bbox 518 729 735 755; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 518 730 579 750; x_wconf 77' lang='eng'>8513</span> <span class='ocrx_word' id='word_1_63' title='bbox 590 729 735 755; x_wconf 86' lang='eng' dir='ltr'><em>(ABO49107)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 518 776 757 802">
+     <span class='ocr_line' id='line_1_17' title="bbox 518 776 757 802; baseline -0.017 -3"><span class='ocrx_word' id='word_1_64' title='bbox 518 779 600 800; x_wconf 76' lang='eng'>8508-1</span> <span class='ocrx_word' id='word_1_65' title='bbox 611 776 757 802; x_wconf 87' lang='eng' dir='ltr'><em>(ABO49105)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 7 510 797">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 0 7 510 797">
+     <span class='ocr_line' id='line_1_18' title="bbox 0 7 96 46; baseline 0 -3"><span class='ocrx_word' id='word_1_66' title='bbox 0 7 96 46; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 0 46 229 137; baseline 0 -50"><span class='ocrx_word' id='word_1_67' title='bbox 0 46 229 137; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 0 137 274 232; baseline 0 -52"><span class='ocrx_word' id='word_1_68' title='bbox 0 137 274 232; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 0 232 308 338; baseline 0 0"><span class='ocrx_word' id='word_1_69' title='bbox 0 232 308 338; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 2 338 364 387; baseline 0 0"><span class='ocrx_word' id='word_1_70' title='bbox 2 338 364 387; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_71' title='bbox 254 378 364 387; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 2 387 364 481; baseline 0 -62"><span class='ocrx_word' id='word_1_72' title='bbox 2 387 364 481; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> <span class='ocrx_word' id='word_1_73' title='bbox 265 387 364 419; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 40 481 257 526; baseline 0 0"><span class='ocrx_word' id='word_1_74' title='bbox 40 481 257 526; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 40 526 305 623; baseline 0 0"><span class='ocrx_word' id='word_1_75' title='bbox 40 526 305 623; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 68 623 413 679; baseline 0 125"><span class='ocrx_word' id='word_1_76' title='bbox 68 623 413 679; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 125 679 483 723; baseline 0 81"><span class='ocrx_word' id='word_1_77' title='bbox 125 679 483 723; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 170 723 510 797; baseline 0 7"><span class='ocrx_word' id='word_1_78' title='bbox 170 723 510 797; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 56 767 186 797">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 95 767 143 787">
+     <span class='ocr_line' id='line_1_29' title="bbox 95 767 143 787; baseline 0 0"><span class='ocrx_word' id='word_1_79' title='bbox 95 767 143 787; x_wconf 92' lang='eng'>0.01</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003376-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003376-0-000.pbm.png
new file mode 100644
index 00000000..64c8f2dc
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003376-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003376-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003376-0-000.pbm.png.hocr
new file mode 100644
index 00000000..fbedc4e1
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003376-0-000.pbm.png.hocr
@@ -0,0 +1,117 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003376-0-000.pbm.png"; bbox 0 0 1302 591; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 0 7 669 570">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 0 7 669 570">
+     <span class='ocr_line' id='line_1_1' title="bbox 449 7 583 47; baseline 0 -17"><span class='ocrx_word' id='word_1_1' title='bbox 449 7 583 47; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 434 47 668 109; baseline 0 -23"><span class='ocrx_word' id='word_1_2' title='bbox 434 47 668 109; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 399 109 618 205; baseline 0 -18"><span class='ocrx_word' id='word_1_3' title='bbox 399 109 618 205; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 271 205 587 262; baseline 0 -18"><span class='ocrx_word' id='word_1_4' title='bbox 271 205 587 262; x_wconf 95' lang='eng' dir='ltr'><em>     </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 271 262 540 283; baseline 0 308"><span class='ocrx_word' id='word_1_5' title='bbox 271 262 540 283; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 245 283 542 323; baseline 0 268"><span class='ocrx_word' id='word_1_6' title='bbox 245 283 542 323; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 0 323 561 402; baseline 0 0"><span class='ocrx_word' id='word_1_7' title='bbox 0 323 561 402; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 0 402 282 442; baseline 0 149"><span class='ocrx_word' id='word_1_8' title='bbox 0 402 282 442; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 0 442 472 481; baseline 0 110"><span class='ocrx_word' id='word_1_9' title='bbox 0 442 472 481; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 0 481 491 520; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 0 481 491 520; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 0 520 669 570; baseline 0 0"><span class='ocrx_word' id='word_1_11' title='bbox 0 520 669 570; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 443 5 1295 585">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 587 5 1108 33">
+     <span class='ocr_line' id='line_1_12' title="bbox 587 5 1108 33; baseline 0 -5"><span class='ocrx_word' id='word_1_12' title='bbox 587 7 611 28; x_wconf 94' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 622 7 783 33; x_wconf 76' lang='eng' dir='ltr'><em>Xinjiangensis</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 793 7 851 28; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 864 5 951 28; x_wconf 88' lang='eng' dir='ltr'><em>15475T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 961 7 1108 33; x_wconf 85' lang='eng' dir='ltr'><em>(AY226510)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 547 44 1035 72">
+     <span class='ocr_line' id='line_1_13' title="bbox 547 44 1035 72; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 547 46 571 67; x_wconf 91' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 583 46 710 72; x_wconf 81' lang='eng' dir='ltr'><em>aethiopica</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 721 46 779 67; x_wconf 86' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 792 44 879 67; x_wconf 71' lang='eng' dir='ltr'><em>17733T</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 889 46 1035 72; x_wconf 87' lang='eng' dir='ltr'><em>(AY574575)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 670 83 1071 111">
+     <span class='ocr_line' id='line_1_14' title="bbox 670 83 1071 111; baseline 0 -5"><span class='ocrx_word' id='word_1_22' title='bbox 670 86 695 106; x_wconf 96' lang='eng' dir='ltr'><strong><em>N.</em></strong></span> <span class='ocrx_word' id='word_1_23' title='bbox 707 86 761 106; x_wconf 86' lang='eng' dir='ltr'><em>alba</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 771 85 848 106; x_wconf 90' lang='eng' dir='ltr'><em>CAAS</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 858 83 916 106; x_wconf 92' lang='eng' dir='ltr'><em>252T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 923 85 1071 111; x_wconf 83' lang='eng' dir='ltr'><em>(EU566871)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 582 123 995 151">
+     <span class='ocr_line' id='line_1_15' title="bbox 582 123 995 151; baseline 0 -5"><span class='ocrx_word' id='word_1_27' title='bbox 582 125 606 146; x_wconf 94' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 618 125 676 146; x_wconf 82' lang='eng' dir='ltr'><em>flava</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 685 125 740 146; x_wconf 85' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 753 123 840 146; x_wconf 89' lang='eng' dir='ltr'><em>14814T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 850 125 995 151; x_wconf 85' lang='eng' dir='ltr'><em>(EF680886)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 582 162 1163 230">
+     <span class='ocr_line' id='line_1_16' title="bbox 620 162 1163 191; baseline 0 -5"><span class='ocrx_word' id='word_1_32' title='bbox 620 165 643 185; x_wconf 93' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 655 165 847 186; x_wconf 82' lang='eng' dir='ltr'><em>Iacusekhoensis</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 860 165 915 186; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 929 162 1163 191; x_wconf 77' lang='eng' dir='ltr'><em>11953T(AJ290397)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 582 201 994 230; baseline -0.002 -5"><span class='ocrx_word' id='word_1_36' title='bbox 582 204 606 224; x_wconf 92' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 618 204 707 225; x_wconf 85' lang='eng' dir='ltr'><em>halobia</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 716 204 771 225; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 784 201 871 225; x_wconf 85' lang='eng' dir='ltr'><em>11483T</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 882 204 994 230; x_wconf 88' lang='eng' dir='ltr'><em>(X80747)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 589 241 1047 269">
+     <span class='ocr_line' id='line_1_18' title="bbox 589 241 1047 269; baseline 0 -5"><span class='ocrx_word' id='word_1_41' title='bbox 589 244 612 264; x_wconf 94' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 625 244 735 269; x_wconf 83' lang='eng' dir='ltr'><em>ha/ophila</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 743 244 790 264; x_wconf 93' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 802 241 891 264; x_wconf 80' lang='eng' dir='ltr'><em>70179T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 901 244 1047 269; x_wconf 81' lang='eng' dir='ltr'><em>(AY820953)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 542 280 953 309">
+     <span class='ocr_line' id='line_1_19' title="bbox 542 280 953 309; baseline 0 -5"><span class='ocrx_word' id='word_1_46' title='bbox 542 283 567 304; x_wconf 93' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 578 283 637 304; x_wconf 84' lang='eng' dir='ltr'><em>Iutea</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 651 283 699 304; x_wconf 92' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 710 280 798 304; x_wconf 90' lang='eng' dir='ltr'><em>70081T</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 806 283 953 309; x_wconf 90' lang='eng' dir='ltr'><em>(AY588278)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 562 320 1062 349">
+     <span class='ocr_line' id='line_1_20' title="bbox 562 320 1062 349; baseline 0.002 -6"><span class='ocrx_word' id='word_1_51' title='bbox 562 323 586 343; x_wconf 95' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 598 323 751 344; x_wconf 82' lang='eng' dir='ltr'><em>halotolerans</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 759 323 806 343; x_wconf 93' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 818 320 906 344; x_wconf 81' lang='eng' dir='ltr'><em>70084T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 916 323 1062 349; x_wconf 86' lang='eng' dir='ltr'><em>(AY226508)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 565 359 958 388">
+     <span class='ocr_line' id='line_1_21' title="bbox 565 359 958 388; baseline -0.003 -5"><span class='ocrx_word' id='word_1_56' title='bbox 565 362 589 382; x_wconf 97' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 597 362 691 388; x_wconf 82' lang='eng' dir='ltr'><em>jeotgali</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 698 359 801 383; x_wconf 79' lang='eng' dir='ltr'><em>.JG—241T</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 811 362 958 388; x_wconf 84' lang='eng' dir='ltr'><em>(AY928901)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 443 399 1295 585">
+     <span class='ocr_line' id='line_1_22' title="bbox 521 399 1061 428; baseline 0 -6"><span class='ocrx_word' id='word_1_60' title='bbox 521 399 540 413; x_wconf 69' lang='eng'>35</span> <span class='ocrx_word' id='word_1_61' title='bbox 560 402 584 422; x_wconf 77' lang='eng' dir='ltr'><em>N.</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 596 402 748 422; x_wconf 83' lang='eng' dir='ltr'><em>sandarakina</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 758 402 804 422; x_wconf 93' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 816 399 904 422; x_wconf 77' lang='eng' dir='ltr'><em>70009T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 915 402 1061 428; x_wconf 86' lang='eng' dir='ltr'><em>(AY588277)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 472 438 1051 467; baseline 0 -6"><span class='ocrx_word' id='word_1_66' title='bbox 472 441 630 461; x_wconf 70' lang='eng' dir='ltr'><em>Arthrobacter</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 636 441 762 461; x_wconf 87' lang='eng' dir='ltr'><em>cumminsii</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 771 440 828 461; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 842 438 928 461; x_wconf 73' lang='eng' dir='ltr'><em>10493T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 939 441 1051 467; x_wconf 84' lang='eng' dir='ltr'><em>(X93354)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 494 478 1083 506; baseline -0.002 -5"><span class='ocrx_word' id='word_1_71' title='bbox 494 480 652 501; x_wconf 80' lang='eng' dir='ltr'><em>Arthrobacter</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 657 480 793 506; x_wconf 86' lang='eng' dir='ltr'><em>globiformis</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 803 480 861 501; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 872 478 961 501; x_wconf 88' lang='eng' dir='ltr'><em>20124T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 971 480 1083 506; x_wconf 85' lang='eng' dir='ltr'><em>(X80736)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 443 517 1040 546; baseline 0.002 -6"><span class='ocrx_word' id='word_1_76' title='bbox 443 520 601 541; x_wconf 78' lang='eng' dir='ltr'><em>Arthrobacter</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 607 520 750 541; x_wconf 84' lang='eng' dir='ltr'><em>wo/uwensis</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 760 520 818 541; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 831 517 918 541; x_wconf 75' lang='eng' dir='ltr'><em>10495T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 929 520 1040 546; x_wconf 87' lang='eng' dir='ltr'>(X93353)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 673 557 1295 585; baseline -0.002 -5"><span class='ocrx_word' id='word_1_81' title='bbox 673 559 843 585; x_wconf 78' lang='eng' dir='ltr'><em>Streptomyces</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 852 564 1007 585; x_wconf 84' lang='eng' dir='ltr'><em>megasporus</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1017 559 1074 580; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 1085 557 1175 580; x_wconf 74' lang='eng' dir='ltr'><em>41476T</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1185 559 1295 585; x_wconf 85' lang='eng'><em>(268100)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 76 79 108 92">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 76 79 108 92">
+     <span class='ocr_line' id='line_1_27' title="bbox 76 79 108 92; baseline 0 0"><span class='ocrx_word' id='word_1_86' title='bbox 76 79 108 92; x_wconf 58' lang='eng'><em>001</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 364 225 559 255">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 364 225 559 255">
+     <span class='ocr_line' id='line_1_28' title="bbox 364 225 393 239; baseline 0 0"><span class='ocrx_word' id='word_1_87' title='bbox 364 225 393 239; x_wconf 85' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 530 241 559 255; baseline 0 0"><span class='ocrx_word' id='word_1_88' title='bbox 530 241 559 255; x_wconf 84' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003384-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003384-0-000.pbm.png
new file mode 100644
index 00000000..89f734e0
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003384-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003384-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003384-0-000.pbm.png.hocr
new file mode 100644
index 00000000..a2bc9c34
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003384-0-000.pbm.png.hocr
@@ -0,0 +1,390 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003384-0-000.pbm.png"; bbox 0 0 994 911; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 86 549 105 565">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 86 549 105 565">
+     <span class='ocr_line' id='line_1_1' title="bbox 86 549 105 565; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 86 549 105 565; x_wconf 82' lang='eng'><em>91</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 708 91 710">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 708 91 710">
+     <span class='ocr_line' id='line_1_2' title="bbox 0 708 91 710; baseline 0 201"><span class='ocrx_word' id='word_1_2' title='bbox 0 708 91 710; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 0 708 3 896">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 0 708 3 896">
+     <span class='ocr_line' id='line_1_3' title="bbox 0 708 3 896; baseline 0 15"><span class='ocrx_word' id='word_1_3' title='bbox 0 708 3 896; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 88 566 92 852">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 88 566 92 852">
+     <span class='ocr_line' id='line_1_4' title="bbox 88 566 92 852; baseline 0 59"><span class='ocrx_word' id='word_1_4' title='bbox 88 566 92 852; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 233 38 255 54">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 233 38 255 54">
+     <span class='ocr_line' id='line_1_5' title="bbox 233 38 255 54; baseline 0 0"><span class='ocrx_word' id='word_1_5' title='bbox 233 38 255 54; x_wconf 78' lang='eng'>79</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 219 97 275 116">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 219 97 275 116">
+     <span class='ocr_line' id='line_1_6' title="bbox 219 97 275 116; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 219 100 241 116; x_wconf 78' lang='eng'>99</span> <span class='ocrx_word' id='word_1_7' title='bbox 253 97 275 113; x_wconf 70' lang='eng'>93</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 230 190 252 206">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 230 190 252 206">
+     <span class='ocr_line' id='line_1_7' title="bbox 230 190 252 206; baseline 0 0"><span class='ocrx_word' id='word_1_8' title='bbox 230 190 252 206; x_wconf 87' lang='eng'>79</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 218 120 222 277">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 218 120 222 277">
+     <span class='ocr_line' id='line_1_8' title="bbox 218 120 222 277; baseline 0 634"><span class='ocrx_word' id='word_1_9' title='bbox 218 120 222 277; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 213 333 234 349">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 213 333 234 349">
+     <span class='ocr_line' id='line_1_9' title="bbox 213 333 234 349; baseline 0 0"><span class='ocrx_word' id='word_1_10' title='bbox 213 333 234 349; x_wconf 79' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 239 305 241 351">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 239 305 241 351">
+     <span class='ocr_line' id='line_1_10' title="bbox 239 305 241 351; baseline 0 560"><span class='ocrx_word' id='word_1_11' title='bbox 239 305 241 351; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 221 275 309 277">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 221 275 309 277">
+     <span class='ocr_line' id='line_1_11' title="bbox 221 275 309 277; baseline 0 634"><span class='ocrx_word' id='word_1_12' title='bbox 221 275 309 277; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 294 10 371 12">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 294 10 371 12">
+     <span class='ocr_line' id='line_1_12' title="bbox 294 10 371 12; baseline 0 899"><span class='ocrx_word' id='word_1_13' title='bbox 294 10 371 12; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 263 0 993 294">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 263 0 992 292">
+     <span class='ocr_line' id='line_1_13' title="bbox 263 0 917 27; baseline 0.002 -6"><span class='ocrx_word' id='word_1_14' title='bbox 263 5 285 21; x_wconf 86' lang='eng'>99</span> <span class='ocrx_word' id='word_1_15' title='bbox 383 3 570 27; x_wconf 76' lang='eng' dir='ltr'><em>Parapedobacter</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 576 3 687 22; x_wconf 77' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 695 0 767 27; x_wconf 57' lang='eng' dir='ltr'><em>\Jip14T</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 777 2 917 27; x_wconf 85' lang='eng' dir='ltr'><em>(DQ680836)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 420 30 876 56; baseline 0 -5"><span class='ocrx_word' id='word_1_19' title='bbox 420 32 544 51; x_wconf 75' lang='eng' dir='ltr'><em>Olivibacter</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 550 32 642 51; x_wconf 82' lang='eng' dir='ltr'><em>sltiensis</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 649 30 726 51; x_wconf 75' lang='eng' dir='ltr'><em>AW-GT</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 735 32 876 56; x_wconf 89' lang='eng' dir='ltr'>(DQ421387)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 283 59 895 86; baseline 0 -5"><span class='ocrx_word' id='word_1_23' title='bbox 283 69 335 71; x_wconf 92' lang='eng'>—</span> <span class='ocrx_word' id='word_1_24' title='bbox 341 61 551 86; x_wconf 77' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 559 62 664 86; x_wconf 79' lang='eng' dir='ltr'><em>composti</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 671 59 749 81; x_wconf 89' lang='eng' dir='ltr'><em>T5-12T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 759 62 895 86; x_wconf 84' lang='eng' dir='ltr'><em>(ABZ44764)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 339 89 931 115; baseline 0 -5"><span class='ocrx_word' id='word_1_28' title='bbox 339 91 548 115; x_wconf 84' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 556 91 645 110; x_wconf 81' lang='eng' dir='ltr'><em>mizutaii</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 651 91 721 110; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 732 89 813 110; x_wconf 78' lang='eng' dir='ltr'><em>33299T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 823 91 931 115; x_wconf 86' lang='eng' dir='ltr'>(M58796)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 338 118 955 145; baseline 0 -5"><span class='ocrx_word' id='word_1_33' title='bbox 338 120 547 145; x_wconf 76' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 556 121 704 145; x_wconf 79' lang='eng' dir='ltr'><em>daejeonense</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 712 118 810 140; x_wconf 72' lang='eng' dir='ltr'><em>TRE5-04T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 819 121 955 145; x_wconf 83' lang='eng' dir='ltr'><em>(ABZ49372)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 348 150 968 174; baseline 0 -5"><span class='ocrx_word' id='word_1_37' title='bbox 348 150 557 174; x_wconf 78' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 566 150 698 174; x_wconf 80' lang='eng' dir='ltr'><em>spiritivorum</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 708 150 763 169; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 772 150 828 169; x_wconf 89' lang='eng'>2582</span> <span class='ocrx_word' id='word_1_41' title='bbox 836 150 942 174; x_wconf 85' lang='eng' dir='ltr'><em>(AJ45941</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 950 150 968 174; x_wconf 93' lang='eng'>1)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 274 177 949 204; baseline 0.001 -6"><span class='ocrx_word' id='word_1_43' title='bbox 274 187 340 188; x_wconf 40' lang='eng'><em>7</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 346 179 555 204; x_wconf 81' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 564 179 654 199; x_wconf 81' lang='eng' dir='ltr'><em>faecium</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 664 179 718 199; x_wconf 85' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_47' title='bbox 730 177 811 199; x_wconf 82' lang='eng' dir='ltr'><em>11690T</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 818 180 949 204; x_wconf 84' lang='eng' dir='ltr'><em>(AJ438176)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 294 207 992 233; baseline 0 -5"><span class='ocrx_word' id='word_1_49' title='bbox 294 209 541 233; x_wconf 79' lang='eng' dir='ltr'><em>—Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 550 209 696 233; x_wconf 80' lang='eng' dir='ltr'><em>thalpophi/um</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 706 209 761 228; x_wconf 92' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_52' title='bbox 773 207 853 228; x_wconf 82' lang='eng' dir='ltr'><em>11723T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 860 209 992 233; x_wconf 87' lang='eng' dir='ltr'>(AJ438177)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 294 238 919 263; baseline 0 -5"><span class='ocrx_word' id='word_1_54' title='bbox 294 246 332 248; x_wconf 92' lang='eng'>—</span> <span class='ocrx_word' id='word_1_55' title='bbox 338 238 547 263; x_wconf 81' lang='eng' dir='ltr'><em>Sphingobacterium</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 556 239 682 258; x_wconf 79' lang='eng' dir='ltr'><em>multivorum</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 691 238 773 258; x_wconf 86' lang='eng' dir='ltr'><em>OM—A8</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 782 239 919 263; x_wconf 82' lang='eng' dir='ltr'><em>(ABOZOZOS)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 311 266 829 292; baseline 0 -5"><span class='ocrx_word' id='word_1_59' title='bbox 311 268 446 287; x_wconf 85' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 452 268 534 287; x_wconf 82' lang='eng' dir='ltr'><em>sa/tans</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 544 268 598 287; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_62' title='bbox 610 266 690 287; x_wconf 71' lang='eng' dir='ltr'><em>12145T</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 697 268 829 292; x_wconf 83' lang='eng' dir='ltr'><em>(AJ438173)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 261 25 294 27">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 261 25 294 27">
+     <span class='ocr_line' id='line_1_23' title="bbox 261 25 294 27; baseline 0 884"><span class='ocrx_word' id='word_1_64' title='bbox 261 25 294 27; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 292 10 294 41">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 292 10 294 41">
+     <span class='ocr_line' id='line_1_24' title="bbox 292 10 294 41; baseline 0 870"><span class='ocrx_word' id='word_1_65' title='bbox 292 10 294 41; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 281 69 283 115">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 281 69 283 115">
+     <span class='ocr_line' id='line_1_25' title="bbox 281 69 283 115; baseline 0 796"><span class='ocrx_word' id='word_1_66' title='bbox 281 69 283 115; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 264 119 297 135">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 264 119 297 135">
+     <span class='ocr_line' id='line_1_26' title="bbox 264 119 297 135; baseline 0 0"><span class='ocrx_word' id='word_1_67' title='bbox 264 119 297 135; x_wconf 89' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 260 157 342 159">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 260 157 342 159">
+     <span class='ocr_line' id='line_1_27' title="bbox 260 157 342 159; baseline 0 752"><span class='ocrx_word' id='word_1_68' title='bbox 260 157 342 159; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 259 25 264 210">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 259 25 264 210">
+     <span class='ocr_line' id='line_1_28' title="bbox 259 25 264 210; baseline 0 701"><span class='ocrx_word' id='word_1_69' title='bbox 259 25 264 210; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 265 237 287 253">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 265 237 287 253">
+     <span class='ocr_line' id='line_1_29' title="bbox 265 237 287 253; baseline 0 0"><span class='ocrx_word' id='word_1_70' title='bbox 265 237 287 253; x_wconf 83' lang='eng'>98</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 273 231 294 233">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 273 231 294 233">
+     <span class='ocr_line' id='line_1_30' title="bbox 273 231 294 233; baseline 0 678"><span class='ocrx_word' id='word_1_71' title='bbox 273 231 294 233; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 291 216 295 248">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 291 216 295 248">
+     <span class='ocr_line' id='line_1_31' title="bbox 291 216 295 248; baseline 0 663"><span class='ocrx_word' id='word_1_72' title='bbox 291 216 295 248; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 241 294 926 324">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 241 294 926 322">
+     <span class='ocr_line' id='line_1_32' title="bbox 241 294 926 322; baseline 0 -5"><span class='ocrx_word' id='word_1_73' title='bbox 241 305 299 307; x_wconf 92' lang='eng'>—</span> <span class='ocrx_word' id='word_1_74' title='bbox 304 297 513 322; x_wconf 85' lang='eng' dir='ltr'><em>Mucilaginibacter</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 520 297 685 322; x_wconf 85' lang='eng' dir='ltr'><em>daejeonensis</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 692 297 729 322; x_wconf 87' lang='eng' dir='ltr'>Jip</span> <span class='ocrx_word' id='word_1_77' title='bbox 739 294 777 317; x_wconf 59' lang='eng'><em>101&#39;</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 786 297 926 322; x_wconf 82' lang='eng' dir='ltr'>(A3267717)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 276 324 841 353">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 276 324 841 351">
+     <span class='ocr_line' id='line_1_33' title="bbox 276 324 841 351; baseline 0 -6"><span class='ocrx_word' id='word_1_79' title='bbox 276 334 311 336; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_80' title='bbox 316 326 506 351; x_wconf 84' lang='eng' dir='ltr'><em>Muci/aginibacter</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 511 326 594 351; x_wconf 85' lang='eng' dir='ltr'><em>paludis</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 602 324 690 346; x_wconf 81' lang='eng' dir='ltr'><em>TPT56T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 700 326 841 351; x_wconf 84' lang='eng' dir='ltr'><em>(AM490402)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 239 349 276 351">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 239 349 276 351">
+     <span class='ocr_line' id='line_1_34' title="bbox 239 349 276 351; baseline 0 560"><span class='ocrx_word' id='word_1_84' title='bbox 239 349 276 351; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 166 355 256 403">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 166 355 256 403">
+     <span class='ocr_line' id='line_1_35' title="bbox 166 355 199 371; baseline 0 0"><span class='ocrx_word' id='word_1_85' title='bbox 166 355 199 371; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 223 387 256 403; baseline 0 0"><span class='ocrx_word' id='word_1_86' title='bbox 223 387 256 403; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 247 468 257 484">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 247 468 257 484">
+     <span class='ocr_line' id='line_1_37' title="bbox 247 468 257 484; baseline 0 0"><span class='ocrx_word' id='word_1_87' title='bbox 247 468 257 484; x_wconf 82' lang='eng'><em>9</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 196 493 252 509">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 196 493 252 509">
+     <span class='ocr_line' id='line_1_38' title="bbox 196 493 252 509; baseline 0 0"><span class='ocrx_word' id='word_1_88' title='bbox 196 493 218 509; x_wconf 80' lang='eng'>88</span> <span class='ocrx_word' id='word_1_89' title='bbox 230 493 252 509; x_wconf 85' lang='eng'>70</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 222 408 226 562">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 222 408 226 562">
+     <span class='ocr_line' id='line_1_39' title="bbox 222 408 226 562; baseline 0 349"><span class='ocrx_word' id='word_1_90' title='bbox 222 408 226 562; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 212 569 255 630">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 212 569 255 630">
+     <span class='ocr_line' id='line_1_40' title="bbox 212 569 245 585; baseline 0.03 -1"><span class='ocrx_word' id='word_1_91' title='bbox 212 569 245 585; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 235 614 255 630; baseline 0 0"><span class='ocrx_word' id='word_1_92' title='bbox 235 614 255 630; x_wconf 81' lang='eng'><em>91</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 213 711 246 727">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 213 711 246 727">
+     <span class='ocr_line' id='line_1_42' title="bbox 213 711 246 727; baseline 0 0"><span class='ocrx_word' id='word_1_93' title='bbox 213 711 246 727; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 155 732 258 734">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 155 732 258 734">
+     <span class='ocr_line' id='line_1_43' title="bbox 155 732 258 734; baseline 0 177"><span class='ocrx_word' id='word_1_94' title='bbox 155 732 258 734; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 256 717 258 749">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 256 717 258 749">
+     <span class='ocr_line' id='line_1_44' title="bbox 256 717 258 749; baseline 0 162"><span class='ocrx_word' id='word_1_95' title='bbox 256 717 258 749; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 154 732 158 793">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 154 732 158 793">
+     <span class='ocr_line' id='line_1_45' title="bbox 154 732 158 793; baseline 0 118"><span class='ocrx_word' id='word_1_96' title='bbox 154 732 158 793; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 123 770 147 787">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 124 771 146 787">
+     <span class='ocr_line' id='line_1_46' title="bbox 124 771 146 787; baseline 0 0"><span class='ocrx_word' id='word_1_97' title='bbox 124 771 146 787; x_wconf 84' lang='eng'><em>97</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 155 791 185 793">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 155 791 185 793">
+     <span class='ocr_line' id='line_1_47' title="bbox 155 791 185 793; baseline 0 118"><span class='ocrx_word' id='word_1_98' title='bbox 155 791 185 793; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 183 776 185 808">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 183 776 185 808">
+     <span class='ocr_line' id='line_1_48' title="bbox 183 776 185 808; baseline 0 103"><span class='ocrx_word' id='word_1_99' title='bbox 183 776 185 808; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 155 801 177 817">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 155 801 177 817">
+     <span class='ocr_line' id='line_1_49' title="bbox 155 801 177 817; baseline 0 0"><span class='ocrx_word' id='word_1_100' title='bbox 155 801 177 817; x_wconf 84' lang='eng'><em>95</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 89 849 231 853">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 89 849 231 853">
+     <span class='ocr_line' id='line_1_50' title="bbox 89 849 231 853; baseline 0 58"><span class='ocrx_word' id='word_1_101' title='bbox 89 849 231 853; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 229 835 231 867">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 229 835 231 867">
+     <span class='ocr_line' id='line_1_51' title="bbox 229 835 231 867; baseline 0 44"><span class='ocrx_word' id='word_1_102' title='bbox 229 835 231 867; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 190 857 223 873">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 190 857 223 873">
+     <span class='ocr_line' id='line_1_52' title="bbox 190 857 223 873; baseline 0 0"><span class='ocrx_word' id='word_1_103' title='bbox 190 857 223 873; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 234 356 267 372">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 234 356 267 372">
+     <span class='ocr_line' id='line_1_53' title="bbox 234 356 267 372; baseline 0 0"><span class='ocrx_word' id='word_1_104' title='bbox 234 356 267 372; x_wconf 87' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 258 717 332 719">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 258 717 332 719">
+     <span class='ocr_line' id='line_1_54' title="bbox 258 717 332 719; baseline 0 192"><span class='ocrx_word' id='word_1_105' title='bbox 258 717 332 719; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 273 187 276 366">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 273 187 276 366">
+     <span class='ocr_line' id='line_1_55' title="bbox 273 187 276 366; baseline 0 545"><span class='ocrx_word' id='word_1_106' title='bbox 273 187 276 366; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 259 351 994 882">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 276 353 836 438">
+     <span class='ocr_line' id='line_1_56' title="bbox 276 353 836 380; baseline 0 -5"><span class='ocrx_word' id='word_1_107' title='bbox 276 364 307 366; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_108' title='bbox 313 356 503 380; x_wconf 79' lang='eng' dir='ltr'><em>Muci/aginibacter</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 509 356 589 380; x_wconf 77' lang='eng' dir='ltr'><em>gracilis</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 597 353 686 375; x_wconf 88' lang='eng' dir='ltr'><em>TPT18T</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 695 356 836 380; x_wconf 80' lang='eng' dir='ltr'><em>(AM490403)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 294 382 741 409; baseline -0.002 -5"><span class='ocrx_word' id='word_1_112' title='bbox 294 385 504 404; x_wconf 77' lang='eng' dir='ltr'><em>Pedobacterlentus</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 514 382 596 404; x_wconf 82' lang='eng' dir='ltr'><em>DS-40T</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 606 384 741 409; x_wconf 86' lang='eng' dir='ltr'><em>(EF446146)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 304 411 774 438; baseline 0 -5"><span class='ocrx_word' id='word_1_115' title='bbox 304 414 439 433; x_wconf 79' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 446 414 537 433; x_wconf 84' lang='eng' dir='ltr'><em>terrico/a</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 547 411 630 433; x_wconf 79' lang='eng' dir='ltr'><em>DS-45T</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 639 414 774 438; x_wconf 85' lang='eng' dir='ltr'>(EF446147)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 260 440 765 467">
+     <span class='ocr_line' id='line_1_59' title="bbox 260 440 765 467; baseline 0 -5"><span class='ocrx_word' id='word_1_119' title='bbox 260 446 282 462; x_wconf 88' lang='eng'><em>75</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 314 443 449 462; x_wconf 83' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 456 443 523 462; x_wconf 71' lang='eng' dir='ltr'><em>tenae</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 533 440 615 462; x_wconf 65' lang='eng' dir='ltr'><em>DS»57T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 624 443 765 467; x_wconf 78' lang='eng' dir='ltr'>(D0889723)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 259 468 800 496">
+     <span class='ocr_line' id='line_1_60' title="bbox 259 468 800 496; baseline 0 -5"><span class='ocrx_word' id='word_1_124' title='bbox 259 468 269 484; x_wconf 86' lang='eng'>5</span> <span class='ocrx_word' id='word_1_125' title='bbox 304 472 439 491; x_wconf 80' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 445 477 523 491; x_wconf 84' lang='eng' dir='ltr'><em>roseus</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 532 470 650 491; x_wconf 89' lang='eng' dir='ltr'><em>CL-GP80T</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 659 472 800 496; x_wconf 82' lang='eng' dir='ltr'><em>(DQ112353)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 278 499 852 585">
+     <span class='ocr_line' id='line_1_61' title="bbox 278 499 852 526; baseline 0 -5"><span class='ocrx_word' id='word_1_129' title='bbox 278 502 449 521; x_wconf 83' lang='eng' dir='ltr'><em>—Pedobacter</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 455 502 610 521; x_wconf 84' lang='eng' dir='ltr'><em>sandarakinus</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 620 499 702 521; x_wconf 88' lang='eng' dir='ltr'><em>DS-27T</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 711 502 852 526; x_wconf 77' lang='eng' dir='ltr'>(D0235228)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 310 529 791 555; baseline 0 -5"><span class='ocrx_word' id='word_1_133' title='bbox 310 531 445 550; x_wconf 82' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 451 531 546 555; x_wconf 83' lang='eng' dir='ltr'><em>aquatilis</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 553 529 643 550; x_wconf 85' lang='eng' dir='ltr'><em>AR1O7T</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 650 531 706 555; x_wconf 84' lang='eng' dir='ltr'>(AM1</span> <span class='ocrx_word' id='word_1_137' title='bbox 714 531 791 555; x_wconf 83' lang='eng'><em>14396)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 309 558 784 585; baseline 0 -5"><span class='ocrx_word' id='word_1_138' title='bbox 309 561 444 580; x_wconf 81' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 450 561 532 580; x_wconf 84' lang='eng' dir='ltr'><em>insulae</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 542 561 595 580; x_wconf 86' lang='eng' dir='ltr'><em>DS-1</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 601 558 639 580; x_wconf 76' lang='eng' dir='ltr'><em>39T</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 648 561 784 585; x_wconf 85' lang='eng' dir='ltr'>(EF100697)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 272 588 860 644">
+     <span class='ocr_line' id='line_1_64' title="bbox 272 588 860 615; baseline -0.002 -5"><span class='ocrx_word' id='word_1_143' title='bbox 272 597 277 613; x_wconf 69' lang='eng'><strong>1</strong></span> <span class='ocrx_word' id='word_1_144' title='bbox 301 590 436 610; x_wconf 82' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 441 590 586 615; x_wconf 80' lang='eng' dir='ltr'><em>panaciterrae</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 595 590 652 610; x_wconf 81' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 662 588 714 610; x_wconf 88' lang='eng' dir='ltr'><em>042T</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 723 590 860 614; x_wconf 77' lang='eng' dir='ltr'><em>(ABZ45368)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_65' title="bbox 306 618 842 644; baseline 0 -5"><span class='ocrx_word' id='word_1_149' title='bbox 306 620 441 639; x_wconf 81' lang='eng' dir='ltr'><em>Pedobacter</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 447 620 561 644; x_wconf 83' lang='eng' dir='ltr'><em>heparinus</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 571 620 625 639; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_152' title='bbox 635 618 842 644; x_wconf 61' lang='eng' dir='ltr'><em>2366T(AJ438172)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 279 647 852 674">
+     <span class='ocr_line' id='line_1_66' title="bbox 279 647 852 674; baseline 0 -5"><span class='ocrx_word' id='word_1_153' title='bbox 279 650 436 669; x_wconf 38' lang='eng' dir='ltr'><em>*Pedobacter</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 442 650 579 674; x_wconf 63' lang='eng' dir='ltr'><em>ginseng/&#39;50”</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 586 649 643 669; x_wconf 84' lang='eng' dir='ltr'><em>Gsoil</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 655 647 706 669; x_wconf 82' lang='eng' dir='ltr'><em>104T</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 715 650 852 674; x_wconf 82' lang='eng' dir='ltr'><em>(ABZ45371)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 279 677 865 704">
+     <span class='ocr_line' id='line_1_67' title="bbox 279 677 865 704; baseline 0 -6"><span class='ocrx_word' id='word_1_158' title='bbox 279 679 460 698; x_wconf 83' lang='eng' dir='ltr'><em>—Pedobaoter</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 467 679 617 704; x_wconf 84' lang='eng' dir='ltr'><em>himalayensis</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 626 679 678 698; x_wconf 91' lang='eng' dir='ltr'><em>HHS</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 688 677 726 698; x_wconf 92' lang='eng' dir='ltr'><em>22T</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 733 679 865 703; x_wconf 88' lang='eng' dir='ltr'><em>(AJ583425)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 338 709 708 733">
+     <span class='ocr_line' id='line_1_68' title="bbox 338 709 708 733; baseline 0 -5"><span class='ocrx_word' id='word_1_163' title='bbox 338 709 426 728; x_wconf 79' lang='eng' dir='ltr'><em>Bel/fella</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 435 709 510 728; x_wconf 72' lang='eng' dir='ltr'><em>ballica</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 520 709 563 728; x_wconf 91' lang='eng' dir='ltr'><em>BA1</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 576 709 708 733; x_wconf 87' lang='eng' dir='ltr'><em>(AJ564642)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 321 738 994 822">
+     <span class='ocr_line' id='line_1_69' title="bbox 380 738 944 763; baseline 0 -6"><span class='ocrx_word' id='word_1_167' title='bbox 380 738 558 763; x_wconf 84' lang='eng' dir='ltr'><em>Cyclobacterium</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 566 738 667 757; x_wconf 77' lang='eng' dir='ltr'><em>marinum</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 675 738 744 757; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 754 738 825 757; x_wconf 87' lang='eng'><em>43824</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 835 738 944 762; x_wconf 88' lang='eng' dir='ltr'><em>(M62788)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_70' title="bbox 341 765 897 792; baseline 0 -5"><span class='ocrx_word' id='word_1_172' title='bbox 341 767 464 792; x_wconf 79' lang='eng' dir='ltr'><em>Cytophaga</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 473 767 611 787; x_wconf 78' lang='eng' dir='ltr'><em>hutchinsonii</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 618 767 687 787; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 698 765 779 787; x_wconf 77' lang='eng' dir='ltr'><em>33406T</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 789 767 897 792; x_wconf 88' lang='eng' dir='ltr'><em>(M58768)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 321 795 994 822; baseline 0 -6"><span class='ocrx_word' id='word_1_177' title='bbox 321 797 510 822; x_wconf 81' lang='eng' dir='ltr'><em>Sporocytophaga</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 519 797 696 822; x_wconf 81' lang='eng' dir='ltr'><em>myxococcoides</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 706 797 760 816; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_180' title='bbox 773 795 853 816; x_wconf 73' lang='eng' dir='ltr'><em>11118T</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 862 797 994 821; x_wconf 85' lang='eng' dir='ltr'><em>(AJ310654)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 368 824 932 851">
+     <span class='ocr_line' id='line_1_72' title="bbox 368 824 932 851; baseline -0.002 -5"><span class='ocrx_word' id='word_1_182' title='bbox 368 827 545 846; x_wconf 76' lang='eng' dir='ltr'><em>Flavobacterium</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 555 827 645 851; x_wconf 79' lang='eng' dir='ltr'><em>aquatile</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 653 826 722 846; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 734 824 815 846; x_wconf 75' lang='eng' dir='ltr'><em>11947T</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 824 827 932 851; x_wconf 85' lang='eng' dir='ltr'>(M62797)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 341 856 865 881">
+     <span class='ocr_line' id='line_1_73' title="bbox 341 856 865 881; baseline 0 -6"><span class='ocrx_word' id='word_1_187' title='bbox 341 856 490 881; x_wconf 75' lang='eng' dir='ltr'><em>Cellulophaga</em></span> <span class='ocrx_word' id='word_1_188' title='bbox 499 856 557 881; x_wconf 79' lang='eng' dir='ltr'><em>lytioa</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 567 856 638 875; x_wconf 90' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 649 856 718 875; x_wconf 87' lang='eng'>16022</span> <span class='ocrx_word' id='word_1_191' title='bbox 728 856 865 880; x_wconf 85' lang='eng' dir='ltr'><em>(AB032513)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 273 187 278 513">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 273 187 278 513">
+     <span class='ocr_line' id='line_1_74' title="bbox 273 187 278 513; baseline 0 398"><span class='ocrx_word' id='word_1_192' title='bbox 273 187 278 513; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 277 659 279 690">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 277 659 279 690">
+     <span class='ocr_line' id='line_1_75' title="bbox 277 659 279 690; baseline 0 221"><span class='ocrx_word' id='word_1_193' title='bbox 277 659 279 690; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 205 882 712 911">
+    <p class='ocr_par' dir='ltr' id='par_1_58' title="bbox 205 883 712 911">
+     <span class='ocr_line' id='line_1_76' title="bbox 205 883 712 911; baseline 0 -6"><span class='ocrx_word' id='word_1_194' title='bbox 205 885 342 905; x_wconf 79' lang='eng' dir='ltr'><em>Bacteroides</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 351 885 425 911; x_wconf 76' lang='eng' dir='ltr'><em>fragi/is</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 435 885 489 905; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_197' title='bbox 499 883 567 905; x_wconf 82' lang='eng' dir='ltr'><em>2151T</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 576 885 712 911; x_wconf 79' lang='eng' dir='ltr'><em>(ABOSO106)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003400-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003400-0-000.pbm.png
new file mode 100644
index 00000000..b31ebf8d
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003400-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003400-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003400-0-000.pbm.png.hocr
new file mode 100644
index 00000000..e69e93fa
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003400-0-000.pbm.png.hocr
@@ -0,0 +1,208 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003400-0-000.pbm.png"; bbox 0 0 1183 716; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 177 10 287 12">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 177 10 287 12">
+     <span class='ocr_line' id='line_1_1' title="bbox 177 10 287 12; baseline 0 704"><span class='ocrx_word' id='word_1_1' title='bbox 177 10 287 12; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 7 166 53">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 7 166 53">
+     <span class='ocr_line' id='line_1_2' title="bbox 8 7 166 25; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 8 7 45 25; x_wconf 70' lang='eng' dir='ltr'><em>I—l</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 143 7 166 22; x_wconf 82' lang='eng'>42</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 0 32 142 53; baseline 0 -6"><span class='ocrx_word' id='word_1_4' title='bbox 0 32 52 47; x_wconf 86' lang='eng'>0.005</span> <span class='ocrx_word' id='word_1_5' title='bbox 120 37 142 53; x_wconf 80' lang='eng'><strong>34</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 103 72 125 88">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 103 72 125 88">
+     <span class='ocr_line' id='line_1_4' title="bbox 103 72 125 88; baseline -0.045 0"><span class='ocrx_word' id='word_1_6' title='bbox 103 72 125 88; x_wconf 89' lang='eng'><em>59</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 41 0 1183 716">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 41 0 1183 716">
+     <span class='ocr_line' id='line_1_5' title="bbox 299 0 960 33; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 299 3 455 27; x_wconf 85' lang='eng' dir='ltr'><em>Oceanico/a</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 466 3 600 27; x_wconf 84' lang='eng' dir='ltr'><em>batsensis</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 612 0 782 27; x_wconf 87' lang='eng' dir='ltr'><em>HTCC2597T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 793 3 960 33; x_wconf 86' lang='eng' dir='ltr'><em>(AY424898)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 177 41 1039 73; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 177 43 472 67; x_wconf 87' lang='eng' dir='ltr'><em>—Oceanicola</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 483 44 652 67; x_wconf 84' lang='eng' dir='ltr'><em>nanhaiensis</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 663 41 855 67; x_wconf 82' lang='eng' dir='ltr'><em>SSO11B1-20T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 866 43 1039 73; x_wconf 90' lang='eng' dir='ltr'><em>(DQ414420)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 337 81 922 113; baseline 0 -6"><span class='ocrx_word' id='word_1_15' title='bbox 337 83 493 107; x_wconf 86' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 504 84 617 107; x_wconf 83' lang='eng' dir='ltr'><em>marinus</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 626 81 738 107; x_wconf 92' lang='eng' dir='ltr'><em>AZO-CT</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 749 83 922 113; x_wconf 85' lang='eng' dir='ltr'><em>(DQ822569)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 86 121 950 153; baseline 0 -6"><span class='ocrx_word' id='word_1_19' title='bbox 86 127 109 143; x_wconf 86' lang='eng'><em>60</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 136 130 299 132; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_21' title='bbox 311 123 478 147; x_wconf 86' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 488 123 627 153; x_wconf 87' lang='eng' dir='ltr'><em>pacificus</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 637 121 766 147; x_wconf 82' lang='eng' dir='ltr'><em>W11-ZBT</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 777 123 950 153; x_wconf 81' lang='eng' dir='ltr'><em>(DQS59449)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 186 161 928 194; baseline 0 -7"><span class='ocrx_word' id='word_1_25' title='bbox 186 163 595 187; x_wconf 78' lang='eng' dir='ltr'><em>—Octadecabacter</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 603 164 712 187; x_wconf 84' lang='eng' dir='ltr'><em>arcticus</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 722 161 787 187; x_wconf 84' lang='eng' dir='ltr'><em>238T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 798 163 928 194; x_wconf 87' lang='eng' dir='ltr'><em>(U73725)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 120 201 1006 235; baseline 0 -8"><span class='ocrx_word' id='word_1_29' title='bbox 120 205 183 235; x_wconf 46' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_30' title='bbox 212 210 292 212; x_wconf 90' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_31' title='bbox 305 204 489 227; x_wconf 85' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 499 204 689 233; x_wconf 83' lang='eng' dir='ltr'><em>gelatinovorus</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 700 204 752 227; x_wconf 93' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 767 201 865 227; x_wconf 79' lang='eng' dir='ltr'><em>12617T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 876 203 1006 234; x_wconf 86' lang='eng' dir='ltr'><em>(D88523)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 41 241 957 274; baseline 0 -7"><span class='ocrx_word' id='word_1_36' title='bbox 41 257 63 273; x_wconf 69' lang='eng'><em>59</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 179 255 201 270; x_wconf 81' lang='eng'>75</span> <span class='ocrx_word' id='word_1_38' title='bbox 333 244 517 267; x_wconf 85' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 527 244 649 267; x_wconf 83' lang='eng' dir='ltr'><em>aestuarii</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 657 241 779 267; x_wconf 79' lang='eng' dir='ltr'><em>JC2049T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 790 244 957 274; x_wconf 91' lang='eng' dir='ltr'><em>(AY442178)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 200 281 1104 314; baseline 0.001 -7"><span class='ocrx_word' id='word_1_42' title='bbox 200 285 219 300; x_wconf 76' lang='eng'><strong>71</strong></span> <span class='ocrx_word' id='word_1_43' title='bbox 344 284 528 308; x_wconf 89' lang='eng' dir='ltr'><em>Thalassobius</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 538 284 742 308; x_wconf 84' lang='eng' dir='ltr'><em>mediterraneus</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 752 284 837 308; x_wconf 90' lang='eng' dir='ltr'><em>CECT</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 848 281 931 308; x_wconf 83' lang='eng' dir='ltr'><em>5383T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 942 284 1104 314; x_wconf 89' lang='eng' dir='ltr'><em>(AJ878874)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 321 321 992 354; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 321 324 480 348; x_wconf 85' lang='eng' dir='ltr'><em>Jannaschia</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 491 324 703 354; x_wconf 86' lang='eng' dir='ltr'><em>helgo/andensis</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 714 324 758 348; x_wconf 93' lang='eng' dir='ltr'><em>Hel</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 772 321 817 348; x_wconf 77' lang='eng' dir='ltr'><em>1OT</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 829 324 992 354; x_wconf 88' lang='eng' dir='ltr'><em>(AJ438157)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 407 361 1183 394; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 407 364 702 388; x_wconf 86' lang='eng' dir='ltr'><em>Marinosulfonomonas</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 712 365 913 394; x_wconf 86' lang='eng' dir='ltr'><em>methylotropha</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 925 361 1042 388; x_wconf 90' lang='eng' dir='ltr'><em>PSCH4T</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 1053 364 1183 394; x_wconf 85' lang='eng' dir='ltr'><em>(U62894)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 293 402 1082 434; baseline 0 -6"><span class='ocrx_word' id='word_1_57' title='bbox 293 408 326 424; x_wconf 83' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 342 405 618 434; x_wconf 86' lang='eng' dir='ltr'><em>Ketogu/onicigenium</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 630 405 732 434; x_wconf 89' lang='eng' dir='ltr'><em>vulgare</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 744 404 810 428; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 822 402 905 428; x_wconf 90' lang='eng' dir='ltr'><em>4025T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 917 404 1082 434; x_wconf 86' lang='eng' dir='ltr'><em>(AF136846)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 337 442 1033 474; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 337 445 634 474; x_wconf 61' lang='eng' dir='ltr'><em>‘Ketogulonicigenium</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 645 445 777 468; x_wconf 85' lang='eng' dir='ltr'><em>robustum</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 786 442 856 468; x_wconf 89' lang='eng' dir='ltr'><em>X6LT</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 867 444 1033 474; x_wconf 88' lang='eng' dir='ltr'><em>(AF136850)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 173 482 990 514; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 173 491 296 493; x_wconf 90' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_68' title='bbox 308 484 464 508; x_wconf 85' lang='eng' dir='ltr'><em>Oceanicola</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 475 485 630 514; x_wconf 88' lang='eng' dir='ltr'><em>granulosus</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 642 482 811 508; x_wconf 80' lang='eng' dir='ltr'><em>HTCCZS16T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 823 484 990 514; x_wconf 86' lang='eng' dir='ltr'><em>(AY424896)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 303 522 927 555; baseline 0 -7"><span class='ocrx_word' id='word_1_72' title='bbox 303 525 483 548; x_wconf 87' lang='eng' dir='ltr'><em>Roseisalinus</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 493 525 646 548; x_wconf 79' lang='eng' dir='ltr'><em>antarcticus</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 658 522 753 548; x_wconf 89' lang='eng' dir='ltr'><em>EL-88T</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 765 524 927 555; x_wconf 88' lang='eng' dir='ltr'><em>(AJ605747)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 291 562 933 595; baseline 0 -7"><span class='ocrx_word' id='word_1_76' title='bbox 291 565 460 595; x_wconf 83' lang='eng' dir='ltr'><em>Roseicyclus</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 470 565 675 595; x_wconf 86' lang='eng' dir='ltr'><em>mahoneyensis</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 687 562 759 588; x_wconf 84' lang='eng' dir='ltr'><em>ML6T</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 770 564 933 595; x_wconf 86' lang='eng' dir='ltr'><em>(AJ315682)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 299 602 986 635; baseline -0.001 -6"><span class='ocrx_word' id='word_1_80' title='bbox 299 605 476 629; x_wconf 87' lang='eng' dir='ltr'><em>Rhodovulum</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 486 605 671 635; x_wconf 88' lang='eng' dir='ltr'><em>sulﬁdophilum</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 683 605 749 629; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 764 602 844 629; x_wconf 80' lang='eng' dir='ltr'><em>1374T</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 855 605 986 635; x_wconf 84' lang='eng' dir='ltr'><em>(D16423)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 414 642 1098 675; baseline 0.001 -7"><span class='ocrx_word' id='word_1_85' title='bbox 414 645 587 669; x_wconf 89' lang='eng' dir='ltr'><em>Albidovulum</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 598 645 787 675; x_wconf 85' lang='eng' dir='ltr'><em>inexpectatum</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 799 642 921 669; x_wconf 80' lang='eng' dir='ltr'><em>FRR-10T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 932 645 1098 675; x_wconf 84' lang='eng' dir='ltr'><em>(AF465833)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 363 682 910 716; baseline 0 -7"><span class='ocrx_word' id='word_1_89' title='bbox 363 685 547 709; x_wconf 83' lang='eng' dir='ltr'><em>Rhodobacter</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 555 685 706 715; x_wconf 85' lang='eng' dir='ltr'><em>capsulatus</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 717 682 768 709; x_wconf 74' lang='eng' dir='ltr'><em>CST</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 780 685 910 716; x_wconf 86' lang='eng' dir='ltr'><em>(D16427)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 151 30 177 32">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 151 30 177 32">
+     <span class='ocr_line' id='line_1_23' title="bbox 151 30 177 32; baseline 0 684"><span class='ocrx_word' id='word_1_93' title='bbox 151 30 177 32; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 175 10 177 52">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 175 10 177 52">
+     <span class='ocr_line' id='line_1_24' title="bbox 175 10 177 52; baseline 0 664"><span class='ocrx_word' id='word_1_94' title='bbox 175 10 177 52; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 134 60 153 62">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 134 60 153 62">
+     <span class='ocr_line' id='line_1_25' title="bbox 134 60 153 62; baseline 0 654"><span class='ocrx_word' id='word_1_95' title='bbox 134 60 153 62; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 151 30 153 92">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 151 30 153 92">
+     <span class='ocr_line' id='line_1_26' title="bbox 151 30 153 92; baseline 0 624"><span class='ocrx_word' id='word_1_96' title='bbox 151 30 153 92; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 118 95 136 97">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 118 95 136 97">
+     <span class='ocr_line' id='line_1_27' title="bbox 118 95 136 97; baseline 0 619"><span class='ocrx_word' id='word_1_97' title='bbox 118 95 136 97; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 134 60 136 132">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 134 60 136 132">
+     <span class='ocr_line' id='line_1_28' title="bbox 134 60 136 132; baseline 0 584"><span class='ocrx_word' id='word_1_98' title='bbox 134 60 136 132; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 118 95 120 207">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 118 95 120 207">
+     <span class='ocr_line' id='line_1_29' title="bbox 118 95 120 207; baseline 0 509"><span class='ocrx_word' id='word_1_99' title='bbox 118 95 120 207; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 184 170 186 242">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 184 170 186 242">
+     <span class='ocr_line' id='line_1_30' title="bbox 184 170 186 242; baseline 0 474"><span class='ocrx_word' id='word_1_100' title='bbox 184 170 186 242; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 184 240 212 242">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 184 240 212 242">
+     <span class='ocr_line' id='line_1_31' title="bbox 184 240 212 242; baseline 0 474"><span class='ocrx_word' id='word_1_101' title='bbox 184 240 212 242; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 210 210 212 270">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 210 210 212 270">
+     <span class='ocr_line' id='line_1_32' title="bbox 210 210 212 270; baseline 0 446"><span class='ocrx_word' id='word_1_102' title='bbox 210 210 212 270; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 72 150 74 413">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 72 150 74 413">
+     <span class='ocr_line' id='line_1_33' title="bbox 72 150 74 413; baseline 0 303"><span class='ocrx_word' id='word_1_103' title='bbox 72 150 74 413; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 105 431 337 433">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 105 431 337 433">
+     <span class='ocr_line' id='line_1_34' title="bbox 105 431 337 433; baseline 0 283"><span class='ocrx_word' id='word_1_104' title='bbox 105 431 337 433; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 335 411 337 453">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 335 411 337 453">
+     <span class='ocr_line' id='line_1_35' title="bbox 335 411 337 453; baseline 0 263"><span class='ocrx_word' id='word_1_105' title='bbox 335 411 337 453; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 76 351 78 473">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 76 351 78 473">
+     <span class='ocr_line' id='line_1_36' title="bbox 76 351 78 473; baseline 0 243"><span class='ocrx_word' id='word_1_106' title='bbox 76 351 78 473; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 76 471 107 473">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 76 471 107 473">
+     <span class='ocr_line' id='line_1_37' title="bbox 76 471 107 473; baseline 0 243"><span class='ocrx_word' id='word_1_107' title='bbox 76 471 107 473; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 105 511 173 513">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 105 511 173 513">
+     <span class='ocr_line' id='line_1_38' title="bbox 105 511 173 513; baseline 0 203"><span class='ocrx_word' id='word_1_108' title='bbox 105 511 173 513; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 171 491 173 533">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 171 491 173 533">
+     <span class='ocr_line' id='line_1_39' title="bbox 171 491 173 533; baseline 0 183"><span class='ocrx_word' id='word_1_109' title='bbox 171 491 173 533; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 173 531 292 533">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 173 531 292 533">
+     <span class='ocr_line' id='line_1_40' title="bbox 173 531 292 533; baseline 0 183"><span class='ocrx_word' id='word_1_110' title='bbox 173 531 292 533; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 104 331 108 674">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 104 331 108 674">
+     <span class='ocr_line' id='line_1_41' title="bbox 104 331 108 674; baseline -2082.75 -19959"><span class='ocrx_word' id='word_1_111' title='bbox 104 331 108 674; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 104 672 146 674">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 104 672 146 674">
+     <span class='ocr_line' id='line_1_42' title="bbox 104 672 146 674; baseline 1037.976 -19958"><span class='ocrx_word' id='word_1_112' title='bbox 104 672 146 674; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 0 277 284 702">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 0 277 284 702">
+     <span class='ocr_line' id='line_1_43' title="bbox 0 277 284 702; baseline 0 14"><span class='ocrx_word' id='word_1_113' title='bbox 0 277 284 702; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 144 652 146 694">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 144 652 146 694">
+     <span class='ocr_line' id='line_1_44' title="bbox 144 652 146 694; baseline -2083 27783"><span class='ocrx_word' id='word_1_114' title='bbox 144 652 146 694; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-000.pbm.png
new file mode 100644
index 00000000..1384adc9
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-000.pbm.png.hocr
new file mode 100644
index 00000000..27608046
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-000.pbm.png.hocr
@@ -0,0 +1,161 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003434-0-000.pbm.png"; bbox 0 0 1302 1350; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 269 1 1302 1216">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 397 2 1300 646">
+     <span class='ocr_line' id='line_1_1' title="bbox 626 2 1043 30; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 626 2 647 24; x_wconf 94' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_2' title='bbox 661 7 753 24; x_wconf 87' lang='eng' dir='ltr'>ezurae</span> <span class='ocrx_word' id='word_1_3' title='bbox 765 2 866 24; x_wconf 83' lang='eng' dir='ltr'>HDV1—1</span> <span class='ocrx_word' id='word_1_4' title='bbox 883 2 1043 30; x_wconf 86' lang='eng' dir='ltr'>(AY426982)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 642 49 1058 78; baseline 0 -7"><span class='ocrx_word' id='word_1_5' title='bbox 642 49 663 71; x_wconf 93' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_6' title='bbox 676 55 768 72; x_wconf 87' lang='eng' dir='ltr'>ezurae</span> <span class='ocrx_word' id='word_1_7' title='bbox 780 49 886 72; x_wconf 78' lang='eng' dir='ltr'>HDS1-2</span> <span class='ocrx_word' id='word_1_8' title='bbox 898 49 1058 78; x_wconf 83' lang='eng' dir='ltr'>(AY426981)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 625 94 1054 125; baseline 0.002 -7"><span class='ocrx_word' id='word_1_9' title='bbox 625 96 646 118; x_wconf 91' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_10' title='bbox 659 102 751 119; x_wconf 86' lang='eng' dir='ltr'>ezurae</span> <span class='ocrx_word' id='word_1_11' title='bbox 763 94 884 119; x_wconf 81' lang='eng' dir='ltr'>HDS1-1T</span> <span class='ocrx_word' id='word_1_12' title='bbox 894 96 1054 125; x_wconf 87' lang='eng' dir='ltr'>(AY426980)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 570 141 1034 172; baseline 0 -6"><span class='ocrx_word' id='word_1_13' title='bbox 570 144 591 166; x_wconf 94' lang='eng' dir='ltr'><em>V.</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 604 144 729 166; x_wconf 79' lang='eng' dir='ltr'>neonatus</span> <span class='ocrx_word' id='word_1_15' title='bbox 741 141 863 166; x_wconf 83' lang='eng' dir='ltr'>HDD3—1T</span> <span class='ocrx_word' id='word_1_16' title='bbox 874 144 1034 172; x_wconf 86' lang='eng' dir='ltr'>(AY426979)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 505 191 993 220; baseline 0.002 -7"><span class='ocrx_word' id='word_1_17' title='bbox 505 191 526 213; x_wconf 94' lang='eng' dir='ltr'><em>V.</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 539 191 666 214; x_wconf 85' lang='eng' dir='ltr'>halioticoli</span> <span class='ocrx_word' id='word_1_19' title='bbox 676 191 726 213; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_20' title='bbox 740 191 821 214; x_wconf 81' lang='eng'>14599</span> <span class='ocrx_word' id='word_1_21' title='bbox 832 191 993 220; x_wconf 90' lang='eng' dir='ltr'>(AB000393)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 476 238 963 267; baseline 0.002 -7"><span class='ocrx_word' id='word_1_22' title='bbox 476 238 496 260; x_wconf 95' lang='eng' dir='ltr'><em>V.</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 510 238 637 261; x_wconf 82' lang='eng' dir='ltr'>halioticoli</span> <span class='ocrx_word' id='word_1_24' title='bbox 647 238 697 260; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_25' title='bbox 711 238 791 261; x_wconf 87' lang='eng'>14597</span> <span class='ocrx_word' id='word_1_26' title='bbox 803 238 963 267; x_wconf 80' lang='eng' dir='ltr'>(ABOOO391)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 399 283 954 314; baseline 0.002 -6"><span class='ocrx_word' id='word_1_27' title='bbox 399 293 440 295; x_wconf 90' lang='eng'>—</span> <span class='ocrx_word' id='word_1_28' title='bbox 453 286 474 308; x_wconf 94' lang='eng' dir='ltr'><em>V.</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 488 286 614 309; x_wconf 83' lang='eng' dir='ltr'>halioticoli</span> <span class='ocrx_word' id='word_1_30' title='bbox 624 286 674 308; x_wconf 93' lang='eng' dir='ltr'>IAM</span> <span class='ocrx_word' id='word_1_31' title='bbox 689 283 783 309; x_wconf 81' lang='eng' dir='ltr'>14596T</span> <span class='ocrx_word' id='word_1_32' title='bbox 794 286 954 314; x_wconf 86' lang='eng' dir='ltr'>(AB000390)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 810 333 1287 362; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 810 334 831 356; x_wconf 93' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_34' title='bbox 844 334 946 362; x_wconf 83' lang='eng' dir='ltr'>gal/icus</span> <span class='ocrx_word' id='word_1_35' title='bbox 956 333 1004 356; x_wconf 89' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_36' title='bbox 1017 334 1115 356; x_wconf 87' lang='eng'>107867</span> <span class='ocrx_word' id='word_1_37' title='bbox 1127 334 1287 362; x_wconf 88' lang='eng' dir='ltr'>(AY257975)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 810 378 1300 410; baseline 0 -7"><span class='ocrx_word' id='word_1_38' title='bbox 810 381 830 403; x_wconf 95' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_39' title='bbox 844 381 946 410; x_wconf 80' lang='eng' dir='ltr'>gal/icus</span> <span class='ocrx_word' id='word_1_40' title='bbox 956 381 1004 404; x_wconf 93' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_41' title='bbox 1017 378 1130 404; x_wconf 78' lang='eng' dir='ltr'>107863T</span> <span class='ocrx_word' id='word_1_42' title='bbox 1140 381 1300 410; x_wconf 89' lang='eng' dir='ltr'>(AY257972)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 810 428 1287 457; baseline 0 -6"><span class='ocrx_word' id='word_1_43' title='bbox 810 428 831 451; x_wconf 92' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_44' title='bbox 844 428 946 457; x_wconf 79' lang='eng' dir='ltr'>gall/Gus</span> <span class='ocrx_word' id='word_1_45' title='bbox 956 428 1004 451; x_wconf 93' lang='eng' dir='ltr'>CIP</span> <span class='ocrx_word' id='word_1_46' title='bbox 1017 428 1115 451; x_wconf 88' lang='eng'>107865</span> <span class='ocrx_word' id='word_1_47' title='bbox 1127 428 1287 457; x_wconf 88' lang='eng' dir='ltr'>(AY257973)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 397 473 867 504; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 397 475 418 498; x_wconf 86' lang='eng' dir='ltr'>V</span> <span class='ocrx_word' id='word_1_49' title='bbox 432 475 554 498; x_wconf 84' lang='eng' dir='ltr'>comitans</span> <span class='ocrx_word' id='word_1_50' title='bbox 564 473 690 498; x_wconf 92' lang='eng' dir='ltr'>GHG2-1T</span> <span class='ocrx_word' id='word_1_51' title='bbox 701 475 867 504; x_wconf 77' lang='eng' dir='ltr'>(D0922915)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 402 523 859 551; baseline 0 -5"><span class='ocrx_word' id='word_1_52' title='bbox 402 523 423 545; x_wconf 95' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_53' title='bbox 437 523 559 546; x_wconf 80' lang='eng' dir='ltr'>comitans</span> <span class='ocrx_word' id='word_1_54' title='bbox 570 523 681 545; x_wconf 83' lang='eng' dir='ltr'>NHM1—4</span> <span class='ocrx_word' id='word_1_55' title='bbox 693 523 859 551; x_wconf 79' lang='eng' dir='ltr'>(D0922919)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 425 570 897 599; baseline 0 -6"><span class='ocrx_word' id='word_1_56' title='bbox 425 570 447 592; x_wconf 98' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_57' title='bbox 460 570 582 593; x_wconf 80' lang='eng' dir='ltr'>comitans</span> <span class='ocrx_word' id='word_1_58' title='bbox 593 570 716 593; x_wconf 83' lang='eng' dir='ltr'>NHG1-11</span> <span class='ocrx_word' id='word_1_59' title='bbox 732 570 897 599; x_wconf 87' lang='eng' dir='ltr'>(DQ922918)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 450 615 895 646; baseline 0 -5"><span class='ocrx_word' id='word_1_60' title='bbox 450 618 471 640; x_wconf 93' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_61' title='bbox 484 618 617 646; x_wconf 85' lang='eng' dir='ltr'>superstes</span> <span class='ocrx_word' id='word_1_62' title='bbox 626 615 724 641; x_wconf 83' lang='eng' dir='ltr'>G3—29T</span> <span class='ocrx_word' id='word_1_63' title='bbox 734 618 895 646; x_wconf 79' lang='eng' dir='ltr'>(AY155585)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 270 665 1125 1216">
+     <span class='ocr_line' id='line_1_15' title="bbox 368 665 874 699; baseline 0 -11"><span class='ocrx_word' id='word_1_64' title='bbox 368 679 392 699; x_wconf 65' lang='eng'>51</span> <span class='ocrx_word' id='word_1_65' title='bbox 442 665 463 688; x_wconf 97' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_66' title='bbox 477 666 609 694; x_wconf 80' lang='eng' dir='ltr'>superstes</span> <span class='ocrx_word' id='word_1_67' title='bbox 619 665 698 688; x_wconf 76' lang='eng'>63-11</span> <span class='ocrx_word' id='word_1_68' title='bbox 713 665 874 694; x_wconf 82' lang='eng' dir='ltr'>(AY155583)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 377 713 854 741; baseline 0 -6"><span class='ocrx_word' id='word_1_69' title='bbox 377 715 405 735; x_wconf 90' lang='eng'>58</span> <span class='ocrx_word' id='word_1_70' title='bbox 445 713 466 735; x_wconf 97' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_71' title='bbox 480 713 612 741; x_wconf 83' lang='eng' dir='ltr'>superstes</span> <span class='ocrx_word' id='word_1_72' title='bbox 623 713 684 735; x_wconf 88' lang='eng' dir='ltr'>B1—5</span> <span class='ocrx_word' id='word_1_73' title='bbox 696 713 854 741; x_wconf 80' lang='eng' dir='ltr'>(AF519806)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 439 758 887 789; baseline 0 -7"><span class='ocrx_word' id='word_1_74' title='bbox 439 767 487 769; x_wconf 88' lang='eng'>—</span> <span class='ocrx_word' id='word_1_75' title='bbox 500 760 521 782; x_wconf 98' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_76' title='bbox 535 766 603 783; x_wconf 88' lang='eng' dir='ltr'>rarus</span> <span class='ocrx_word' id='word_1_77' title='bbox 614 758 711 782; x_wconf 90' lang='eng' dir='ltr'>RW22T</span> <span class='ocrx_word' id='word_1_78' title='bbox 722 760 887 789; x_wconf 88' lang='eng' dir='ltr'>(DQ914239)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 499 805 946 836; baseline 0 -6"><span class='ocrx_word' id='word_1_79' title='bbox 499 808 520 830; x_wconf 97' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_80' title='bbox 534 808 663 830; x_wconf 78' lang='eng' dir='ltr'>inusitatus</span> <span class='ocrx_word' id='word_1_81' title='bbox 674 805 770 830; x_wconf 88' lang='eng' dir='ltr'>RW14T</span> <span class='ocrx_word' id='word_1_82' title='bbox 781 807 946 836; x_wconf 84' lang='eng' dir='ltr'>(DQ922920)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 437 855 933 884; baseline 0 -7"><span class='ocrx_word' id='word_1_83' title='bbox 437 857 466 877; x_wconf 86' lang='eng'>94</span> <span class='ocrx_word' id='word_1_84' title='bbox 499 855 520 877; x_wconf 88' lang='eng' dir='ltr'>v.</span> <span class='ocrx_word' id='word_1_85' title='bbox 533 855 662 878; x_wconf 82' lang='eng' dir='ltr'>inusitatus</span> <span class='ocrx_word' id='word_1_86' title='bbox 673 855 751 877; x_wconf 83' lang='eng' dir='ltr'>RW21</span> <span class='ocrx_word' id='word_1_87' title='bbox 767 855 933 884; x_wconf 86' lang='eng' dir='ltr'>(DQ922921)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 285 900 644 931; baseline -0.006 -4"><span class='ocrx_word' id='word_1_88' title='bbox 285 906 315 927; x_wconf 87' lang='eng'>64</span> <span class='ocrx_word' id='word_1_89' title='bbox 334 903 375 925; x_wconf 94' lang='eng' dir='ltr'><strong>RD</strong></span> <span class='ocrx_word' id='word_1_90' title='bbox 387 900 644 931; x_wconf 77' lang='eng' dir='ltr'>15.11T(EF599161)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 333 950 638 979; baseline 0.003 -7"><span class='ocrx_word' id='word_1_91' title='bbox 333 950 395 973; x_wconf 92' lang='eng' dir='ltr'>CMJ</span> <span class='ocrx_word' id='word_1_92' title='bbox 408 950 464 973; x_wconf 89' lang='eng'>13.7</span> <span class='ocrx_word' id='word_1_93' title='bbox 475 950 638 979; x_wconf 85' lang='eng' dir='ltr'>(EU541610)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 324 998 607 1026; baseline 0 -6"><span class='ocrx_word' id='word_1_94' title='bbox 324 998 365 1020; x_wconf 96' lang='eng' dir='ltr'><em>VB</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 377 998 433 1020; x_wconf 88' lang='eng'><strong>16.3</strong></span> <span class='ocrx_word' id='word_1_96' title='bbox 445 998 607 1026; x_wconf 89' lang='eng' dir='ltr'>(EU541611)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 270 1035 1125 1077; baseline 0.006 -10"><span class='ocrx_word' id='word_1_97' title='bbox 270 1035 299 1055; x_wconf 77' lang='eng'>95</span> <span class='ocrx_word' id='word_1_98' title='bbox 326 1045 366 1067; x_wconf 92' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_99' title='bbox 378 1044 607 1073; x_wconf 80' lang='eng' dir='ltr'>265(EU541609)</span> <span class='ocrx_word' id='word_1_100' title='bbox 830 1048 852 1071; x_wconf 94' lang='eng' dir='ltr'>v.</span> <span class='ocrx_word' id='word_1_101' title='bbox 864 1048 1053 1077; x_wconf 89' lang='eng' dir='ltr'>breoganiisp.</span> <span class='ocrx_word' id='word_1_102' title='bbox 1066 1054 1125 1071; x_wconf 93' lang='eng' dir='ltr'>nov.</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 325 1092 570 1121; baseline 0.004 -7"><span class='ocrx_word' id='word_1_103' title='bbox 325 1092 344 1114; x_wconf 90' lang='eng' dir='ltr'><strong>C</strong></span> <span class='ocrx_word' id='word_1_104' title='bbox 355 1092 396 1115; x_wconf 92' lang='eng'>5.5</span> <span class='ocrx_word' id='word_1_105' title='bbox 407 1092 570 1121; x_wconf 87' lang='eng' dir='ltr'>(EU541608)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 325 1139 587 1168; baseline 0 -7"><span class='ocrx_word' id='word_1_106' title='bbox 325 1139 344 1161; x_wconf 91' lang='eng' dir='ltr'><strong>C</strong></span> <span class='ocrx_word' id='word_1_107' title='bbox 355 1139 413 1162; x_wconf 91' lang='eng'>4.15</span> <span class='ocrx_word' id='word_1_108' title='bbox 424 1139 587 1168; x_wconf 88' lang='eng' dir='ltr'>(EU931112)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 326 1187 606 1216; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 326 1187 366 1210; x_wconf 94' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_110' title='bbox 378 1187 432 1210; x_wconf 80' lang='eng'>232</span> <span class='ocrx_word' id='word_1_111' title='bbox 444 1187 606 1216; x_wconf 89' lang='eng' dir='ltr'>(EU931113)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 395 4 633 251">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 395 4 633 251">
+     <span class='ocr_line' id='line_1_27' title="bbox 551 4 626 44; baseline 0 1306"><span class='ocrx_word' id='word_1_112' title='bbox 551 4 626 44; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 486 44 633 79; baseline 0 1271"><span class='ocrx_word' id='word_1_113' title='bbox 486 44 633 79; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 449 79 625 140; baseline 0 -14"><span class='ocrx_word' id='word_1_114' title='bbox 449 79 625 140; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 395 140 561 177; baseline 0 1173"><span class='ocrx_word' id='word_1_115' title='bbox 395 140 561 177; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 395 177 505 251; baseline 0 0"><span class='ocrx_word' id='word_1_116' title='bbox 395 177 505 251; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 397 199 400 295">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 397 199 400 295">
+     <span class='ocr_line' id='line_1_32' title="bbox 397 199 400 295; baseline 0 1055"><span class='ocrx_word' id='word_1_117' title='bbox 397 199 400 295; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 0 246 801 851">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 0 246 801 851">
+     <span class='ocr_line' id='line_1_33' title="bbox 330 246 399 329; baseline 0 -48"><span class='ocrx_word' id='word_1_118' title='bbox 330 246 399 329; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 310 329 801 458; baseline 0 -17"><span class='ocrx_word' id='word_1_119' title='bbox 310 329 801 458; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 277 458 336 565; baseline 0 -46"><span class='ocrx_word' id='word_1_120' title='bbox 277 458 336 565; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 271 565 320 669; baseline 0 0"><span class='ocrx_word' id='word_1_121' title='bbox 271 565 320 669; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 276 669 320 709; baseline 0 641"><span class='ocrx_word' id='word_1_122' title='bbox 276 669 320 709; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 276 709 320 755; baseline 0 595"><span class='ocrx_word' id='word_1_123' title='bbox 276 709 320 755; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 0 755 443 811; baseline 0 -7"><span class='ocrx_word' id='word_1_124' title='bbox 0 755 443 811; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 0 811 399 851; baseline 0 499"><span class='ocrx_word' id='word_1_125' title='bbox 0 811 399 851; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 331 316 335 530">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 331 316 335 530">
+     <span class='ocr_line' id='line_1_41' title="bbox 331 316 335 530; baseline 0 820"><span class='ocrx_word' id='word_1_126' title='bbox 331 316 335 530; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 437 767 439 840">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 437 767 439 840">
+     <span class='ocr_line' id='line_1_42' title="bbox 437 767 439 840; baseline 0 510"><span class='ocrx_word' id='word_1_127' title='bbox 437 767 439 840; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 0 811 443 1245">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 0 811 443 1245">
+     <span class='ocr_line' id='line_1_43' title="bbox 0 811 443 946; baseline 0 0"><span class='ocrx_word' id='word_1_128' title='bbox 0 851 287 946; x_wconf 95' lang='eng' dir='ltr'>  </span> <span class='ocrx_word' id='word_1_129' title='bbox 427 811 443 841; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 0 946 323 1092; baseline 0 -76"><span class='ocrx_word' id='word_1_130' title='bbox 0 946 323 1092; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 0 1092 319 1245; baseline 0 105"><span class='ocrx_word' id='word_1_131' title='bbox 0 1092 319 1245; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 399 821 427 841">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 399 821 427 841">
+     <span class='ocr_line' id='line_1_46' title="bbox 399 821 427 841; baseline 0 0"><span class='ocrx_word' id='word_1_132' title='bbox 399 821 427 841; x_wconf 88' lang='eng'>97</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 5 1241 796 1245">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 5 1241 796 1245">
+     <span class='ocr_line' id='line_1_47' title="bbox 5 1241 796 1245; baseline 0 105"><span class='ocrx_word' id='word_1_133' title='bbox 5 1241 796 1245; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 809 1232 1293 1264">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 809 1232 1293 1263">
+     <span class='ocr_line' id='line_1_48' title="bbox 809 1232 1293 1263; baseline 0 -6"><span class='ocrx_word' id='word_1_134' title='bbox 809 1235 829 1257; x_wconf 96' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_135' title='bbox 844 1235 960 1257; x_wconf 88' lang='eng' dir='ltr'>cholerae</span> <span class='ocrx_word' id='word_1_136' title='bbox 969 1234 1051 1257; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_137' title='bbox 1065 1232 1159 1257; x_wconf 89' lang='eng' dir='ltr'>14035T</span> <span class='ocrx_word' id='word_1_138' title='bbox 1170 1235 1293 1263; x_wconf 86' lang='eng' dir='ltr'>(X74695)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 153 1328 221 1348">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 153 1328 221 1348">
+     <span class='ocr_line' id='line_1_49' title="bbox 153 1328 221 1348; baseline 0 0"><span class='ocrx_word' id='word_1_139' title='bbox 153 1328 221 1348; x_wconf 90' lang='eng'>0.005</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-001.pbm.png
new file mode 100644
index 00000000..dabca4b0
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-001.pbm.png.hocr
new file mode 100644
index 00000000..911da5a7
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003434-0-001.pbm.png.hocr
@@ -0,0 +1,368 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003434-0-001.pbm.png"; bbox 0 0 1243 2260; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 60 27 1204 629">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 60 27 1204 629">
+     <span class='ocr_line' id='line_1_1' title="bbox 529 27 769 52; baseline 0 -5"><span class='ocrx_word' id='word_1_1' title='bbox 529 28 564 47; x_wconf 91' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_2' title='bbox 573 27 621 47; x_wconf 89' lang='eng' dir='ltr'>2G5</span> <span class='ocrx_word' id='word_1_3' title='bbox 631 28 769 52; x_wconf 88' lang='eng' dir='ltr'>(EU541576)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 529 63 762 88; baseline 0.004 -6"><span class='ocrx_word' id='word_1_4' title='bbox 529 63 564 82; x_wconf 93' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_5' title='bbox 573 63 618 82; x_wconf 81' lang='eng'>282</span> <span class='ocrx_word' id='word_1_6' title='bbox 629 63 762 88; x_wconf 83' lang='eng' dir='ltr'>(FJ214964)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 528 98 783 123; baseline 0 -5"><span class='ocrx_word' id='word_1_7' title='bbox 528 98 581 118; x_wconf 92' lang='eng' dir='ltr'>CMJ</span> <span class='ocrx_word' id='word_1_8' title='bbox 592 99 640 118; x_wconf 81' lang='eng'>13.7</span> <span class='ocrx_word' id='word_1_9' title='bbox 650 99 783 123; x_wconf 82' lang='eng' dir='ltr'>(FJ214963)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 60 132 1173 162; baseline 0.006 -12"><span class='ocrx_word' id='word_1_10' title='bbox 60 143 99 160; x_wconf 61' lang='eng'>001</span> <span class='ocrx_word' id='word_1_11' title='bbox 529 134 564 153; x_wconf 94' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_12' title='bbox 575 132 649 154; x_wconf 84' lang='eng' dir='ltr'>15.11T</span> <span class='ocrx_word' id='word_1_13' title='bbox 658 134 797 159; x_wconf 79' lang='eng' dir='ltr'>(EU541565)</span> <span class='ocrx_word' id='word_1_14' title='bbox 920 137 940 156; x_wconf 96' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_15' title='bbox 951 137 1111 162; x_wconf 85' lang='eng' dir='ltr'>breoganiisp.</span> <span class='ocrx_word' id='word_1_16' title='bbox 1123 142 1173 157; x_wconf 90' lang='eng' dir='ltr'>nov.</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 485 169 737 195; baseline 0.004 -6"><span class='ocrx_word' id='word_1_17' title='bbox 485 169 505 186; x_wconf 82' lang='eng'>61</span> <span class='ocrx_word' id='word_1_18' title='bbox 528 170 589 190; x_wconf 83' lang='eng'>05.5</span> <span class='ocrx_word' id='word_1_19' title='bbox 598 170 737 195; x_wconf 87' lang='eng' dir='ltr'>(EU541575)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 478 206 774 230; baseline 0 -5"><span class='ocrx_word' id='word_1_20' title='bbox 478 213 501 230; x_wconf 69' lang='eng'>99</span> <span class='ocrx_word' id='word_1_21' title='bbox 537 206 572 225; x_wconf 88' lang='eng' dir='ltr'>VB</span> <span class='ocrx_word' id='word_1_22' title='bbox 583 206 631 225; x_wconf 84' lang='eng'>16.3</span> <span class='ocrx_word' id='word_1_23' title='bbox 641 206 774 230; x_wconf 84' lang='eng' dir='ltr'>(FJ214965)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 410 245 757 272; baseline 0.006 -9"><span class='ocrx_word' id='word_1_24' title='bbox 410 256 434 272; x_wconf 70' lang='eng'>95</span> <span class='ocrx_word' id='word_1_25' title='bbox 539 245 555 264; x_wconf 89' lang='eng' dir='ltr'>c</span> <span class='ocrx_word' id='word_1_26' title='bbox 564 245 614 265; x_wconf 86' lang='eng'>4.15</span> <span class='ocrx_word' id='word_1_27' title='bbox 624 245 757 270; x_wconf 85' lang='eng' dir='ltr'>(FJ214962)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 539 280 985 307; baseline -0.002 -5"><span class='ocrx_word' id='word_1_28' title='bbox 539 282 557 301; x_wconf 82' lang='eng' dir='ltr'>V</span> <span class='ocrx_word' id='word_1_29' title='bbox 568 282 682 307; x_wconf 86' lang='eng' dir='ltr'>superstes</span> <span class='ocrx_word' id='word_1_30' title='bbox 692 281 744 302; x_wconf 88' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_31' title='bbox 755 280 838 301; x_wconf 76' lang='eng' dir='ltr'>213st</span> <span class='ocrx_word' id='word_1_32' title='bbox 847 282 985 307; x_wconf 86' lang='eng' dir='ltr'>(EU541580)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 346 316 1010 343; baseline 0.003 -8"><span class='ocrx_word' id='word_1_33' title='bbox 346 318 380 335; x_wconf 81' lang='eng'>100</span> <span class='ocrx_word' id='word_1_34' title='bbox 448 321 562 323; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_35' title='bbox 573 318 591 337; x_wconf 93' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_36' title='bbox 603 318 707 338; x_wconf 87' lang='eng' dir='ltr'>comitans</span> <span class='ocrx_word' id='word_1_37' title='bbox 717 318 770 338; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_38' title='bbox 780 316 864 337; x_wconf 80' lang='eng' dir='ltr'>23416T</span> <span class='ocrx_word' id='word_1_39' title='bbox 873 318 1010 343; x_wconf 85' lang='eng' dir='ltr'>(EU541577)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 570 352 1012 379; baseline -0.002 -5"><span class='ocrx_word' id='word_1_40' title='bbox 570 354 587 373; x_wconf 94' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_41' title='bbox 599 354 709 374; x_wconf 78' lang='eng' dir='ltr'>inus/tatus</span> <span class='ocrx_word' id='word_1_42' title='bbox 719 354 772 374; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_43' title='bbox 782 352 865 373; x_wconf 78' lang='eng' dir='ltr'>23434T</span> <span class='ocrx_word' id='word_1_44' title='bbox 875 354 1012 379; x_wconf 89' lang='eng' dir='ltr'>(EU541579)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 812 388 1204 414; baseline 0 -5"><span class='ocrx_word' id='word_1_45' title='bbox 812 390 829 409; x_wconf 89' lang='eng' dir='ltr'><em>V.</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 841 394 900 409; x_wconf 84' lang='eng' dir='ltr'><em>rarus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 910 389 963 409; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_48' title='bbox 974 388 1057 409; x_wconf 82' lang='eng' dir='ltr'>23674T</span> <span class='ocrx_word' id='word_1_49' title='bbox 1066 390 1204 414; x_wconf 88' lang='eng' dir='ltr'>(EU541578)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 403 416 1094 467; baseline -0.001 -22"><span class='ocrx_word' id='word_1_50' title='bbox 403 416 427 432; x_wconf 76' lang='eng'>74</span> <span class='ocrx_word' id='word_1_51' title='bbox 639 426 663 442; x_wconf 83' lang='eng'>89</span> <span class='ocrx_word' id='word_1_52' title='bbox 663 429 676 467; x_wconf 73' lang='eng'>_|</span> <span class='ocrx_word' id='word_1_53' title='bbox 688 425 705 444; x_wconf 92' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_54' title='bbox 717 430 796 445; x_wconf 88' lang='eng' dir='ltr'>ezurae</span> <span class='ocrx_word' id='word_1_55' title='bbox 806 425 859 445; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_56' title='bbox 871 423 953 444; x_wconf 83' lang='eng' dir='ltr'>19970T</span> <span class='ocrx_word' id='word_1_57' title='bbox 962 425 1094 450; x_wconf 87' lang='eng' dir='ltr'>(AJ842600)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 484 460 1083 486; baseline -0.002 -5"><span class='ocrx_word' id='word_1_58' title='bbox 484 460 508 477; x_wconf 82' lang='eng'>90</span> <span class='ocrx_word' id='word_1_59' title='bbox 688 461 705 480; x_wconf 95' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_60' title='bbox 717 466 796 481; x_wconf 84' lang='eng' dir='ltr'>ezurae</span> <span class='ocrx_word' id='word_1_61' title='bbox 806 461 859 481; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_62' title='bbox 871 462 940 480; x_wconf 88' lang='eng'>19979</span> <span class='ocrx_word' id='word_1_63' title='bbox 951 461 1083 486; x_wconf 86' lang='eng' dir='ltr'>(AJ842601)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 712 495 1146 521; baseline 0 -5"><span class='ocrx_word' id='word_1_64' title='bbox 712 497 729 516; x_wconf 94' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_65' title='bbox 741 498 848 516; x_wconf 74' lang='eng' dir='ltr'>neonatus</span> <span class='ocrx_word' id='word_1_66' title='bbox 858 496 911 516; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_67' title='bbox 923 495 1004 516; x_wconf 81' lang='eng' dir='ltr'>19973T</span> <span class='ocrx_word' id='word_1_68' title='bbox 1014 497 1146 521; x_wconf 87' lang='eng' dir='ltr'>(AJ842660)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 712 532 1134 557; baseline 0 -6"><span class='ocrx_word' id='word_1_69' title='bbox 712 532 729 551; x_wconf 90' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_70' title='bbox 741 532 849 552; x_wconf 81' lang='eng' dir='ltr'>halioticoli</span> <span class='ocrx_word' id='word_1_71' title='bbox 857 532 910 552; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_72' title='bbox 922 533 991 551; x_wconf 86' lang='eng'>19963</span> <span class='ocrx_word' id='word_1_73' title='bbox 1002 532 1134 557; x_wconf 85' lang='eng' dir='ltr'>(AJ842619)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 664 566 1156 593; baseline 0.004 -8"><span class='ocrx_word' id='word_1_74' title='bbox 664 568 687 585; x_wconf 83' lang='eng'>99</span> <span class='ocrx_word' id='word_1_75' title='bbox 722 568 740 587; x_wconf 86' lang='eng' dir='ltr'>V</span> <span class='ocrx_word' id='word_1_76' title='bbox 752 568 860 588; x_wconf 76' lang='eng' dir='ltr'>haliot/co/i</span> <span class='ocrx_word' id='word_1_77' title='bbox 868 568 921 588; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_78' title='bbox 933 566 1014 587; x_wconf 79' lang='eng' dir='ltr'>18542T</span> <span class='ocrx_word' id='word_1_79' title='bbox 1023 568 1156 593; x_wconf 85' lang='eng' dir='ltr'>(AJ842617)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 712 604 1135 629; baseline 0 -5"><span class='ocrx_word' id='word_1_80' title='bbox 712 605 729 624; x_wconf 90' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_81' title='bbox 742 605 849 624; x_wconf 82' lang='eng' dir='ltr'>neonatus</span> <span class='ocrx_word' id='word_1_82' title='bbox 858 604 911 624; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_83' title='bbox 923 605 992 624; x_wconf 87' lang='eng'>19976</span> <span class='ocrx_word' id='word_1_84' title='bbox 1003 605 1135 629; x_wconf 87' lang='eng' dir='ltr'>(AJ842661)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 551 654 970 680">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 551 654 970 680">
+     <span class='ocr_line' id='line_1_18' title="bbox 551 654 970 680; baseline 0 -5"><span class='ocrx_word' id='word_1_85' title='bbox 551 656 569 675; x_wconf 82' lang='eng' dir='ltr'>V</span> <span class='ocrx_word' id='word_1_86' title='bbox 580 656 667 680; x_wconf 71' lang='eng' dir='ltr'>gall/Gus</span> <span class='ocrx_word' id='word_1_87' title='bbox 676 655 729 675; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_88' title='bbox 739 654 823 675; x_wconf 84' lang='eng' dir='ltr'>21330T</span> <span class='ocrx_word' id='word_1_89' title='bbox 832 656 970 680; x_wconf 84' lang='eng' dir='ltr'>(EU541581)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 446 235 448 323">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 446 235 448 323">
+     <span class='ocr_line' id='line_1_19' title="bbox 446 235 448 323; baseline 0 1937"><span class='ocrx_word' id='word_1_90' title='bbox 446 235 448 323; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 438 357 440 449">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 438 357 440 449">
+     <span class='ocr_line' id='line_1_20' title="bbox 438 357 440 449; baseline 0 1811"><span class='ocrx_word' id='word_1_91' title='bbox 438 357 440 449; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 438 447 521 449">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 438 447 521 449">
+     <span class='ocr_line' id='line_1_21' title="bbox 438 447 521 449; baseline 0 1811"><span class='ocrx_word' id='word_1_92' title='bbox 438 447 521 449; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 519 393 521 503">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 519 393 521 503">
+     <span class='ocr_line' id='line_1_22' title="bbox 519 393 521 503; baseline 0 1757"><span class='ocrx_word' id='word_1_93' title='bbox 519 393 521 503; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 132 501 169 503">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 132 501 169 503">
+     <span class='ocr_line' id='line_1_23' title="bbox 132 501 169 503; baseline 0 1757"><span class='ocrx_word' id='word_1_94' title='bbox 132 501 169 503; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 519 501 663 503">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 519 501 663 503">
+     <span class='ocr_line' id='line_1_24' title="bbox 519 501 663 503; baseline 0 1757"><span class='ocrx_word' id='word_1_95' title='bbox 519 501 663 503; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 626 515 650 531">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 626 515 650 531">
+     <span class='ocr_line' id='line_1_25' title="bbox 626 515 650 531; baseline 0 0"><span class='ocrx_word' id='word_1_96' title='bbox 626 515 650 531; x_wconf 91' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 661 447 663 557">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 661 447 663 557">
+     <span class='ocr_line' id='line_1_26' title="bbox 661 447 663 557; baseline 0 1703"><span class='ocrx_word' id='word_1_97' title='bbox 661 447 663 557; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 167 340 169 665">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 167 340 169 665">
+     <span class='ocr_line' id='line_1_27' title="bbox 167 340 169 665; baseline 0 1595"><span class='ocrx_word' id='word_1_98' title='bbox 167 340 169 665; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 132 501 133 719">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 132 501 133 719">
+     <span class='ocr_line' id='line_1_28' title="bbox 132 501 133 719; baseline 0 1541"><span class='ocrx_word' id='word_1_99' title='bbox 132 501 133 719; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 132 717 800 719">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 132 717 800 719">
+     <span class='ocr_line' id='line_1_29' title="bbox 132 717 800 719; baseline 0 1541"><span class='ocrx_word' id='word_1_100' title='bbox 132 717 800 719; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 812 712 1227 737">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 812 712 1227 737">
+     <span class='ocr_line' id='line_1_30' title="bbox 812 712 1227 737; baseline -0.002 -5"><span class='ocrx_word' id='word_1_101' title='bbox 812 712 829 731; x_wconf 92' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_102' title='bbox 842 712 941 732; x_wconf 85' lang='eng' dir='ltr'>cholerae</span> <span class='ocrx_word' id='word_1_103' title='bbox 951 712 1003 732; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_104' title='bbox 1014 713 1084 731; x_wconf 88' lang='eng'>21698</span> <span class='ocrx_word' id='word_1_105' title='bbox 1095 712 1227 737; x_wconf 85' lang='eng' dir='ltr'>(AJ842573)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 523 797 1240 1508">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 523 797 1240 1508">
+     <span class='ocr_line' id='line_1_31' title="bbox 581 797 849 823; baseline 0 -5"><span class='ocrx_word' id='word_1_106' title='bbox 581 799 616 818; x_wconf 91' lang='eng' dir='ltr'><strong>RD</strong></span> <span class='ocrx_word' id='word_1_107' title='bbox 627 797 702 818; x_wconf 90' lang='eng' dir='ltr'>15.11T</span> <span class='ocrx_word' id='word_1_108' title='bbox 711 799 849 823; x_wconf 90' lang='eng' dir='ltr'>(EU541585)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 569 838 823 863; baseline 0 -5"><span class='ocrx_word' id='word_1_109' title='bbox 569 838 622 858; x_wconf 89' lang='eng' dir='ltr'>CMJ</span> <span class='ocrx_word' id='word_1_110' title='bbox 633 839 680 858; x_wconf 83' lang='eng'>13.7</span> <span class='ocrx_word' id='word_1_111' title='bbox 691 839 823 863; x_wconf 87' lang='eng' dir='ltr'>(FJ214959)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 554 878 771 918; baseline 0 -20"><span class='ocrx_word' id='word_1_112' title='bbox 554 878 578 918; x_wconf 62' lang='eng'>4%</span> <span class='ocrx_word' id='word_1_113' title='bbox 588 879 623 898; x_wconf 90' lang='eng'>5.5</span> <span class='ocrx_word' id='word_1_114' title='bbox 633 879 771 904; x_wconf 84' lang='eng' dir='ltr'>(EU541595)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 562 919 1166 951; baseline 0.003 -7"><span class='ocrx_word' id='word_1_115' title='bbox 562 919 578 939; x_wconf 79' lang='eng' dir='ltr'>c</span> <span class='ocrx_word' id='word_1_116' title='bbox 588 920 638 939; x_wconf 83' lang='eng'>4-15</span> <span class='ocrx_word' id='word_1_117' title='bbox 648 920 780 944; x_wconf 78' lang='eng' dir='ltr'>(FJ214958)</span> <span class='ocrx_word' id='word_1_118' title='bbox 920 926 940 945; x_wconf 98' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_119' title='bbox 950 926 1069 951; x_wconf 88' lang='eng' dir='ltr'>breoganii</span> <span class='ocrx_word' id='word_1_120' title='bbox 1076 931 1111 951; x_wconf 88' lang='eng' dir='ltr'><strong>sp.</strong></span> <span class='ocrx_word' id='word_1_121' title='bbox 1123 931 1166 946; x_wconf 91' lang='eng' dir='ltr'>nov</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 574 959 815 984; baseline 0.004 -6"><span class='ocrx_word' id='word_1_122' title='bbox 574 959 609 978; x_wconf 95' lang='eng' dir='ltr'><strong>RD</strong></span> <span class='ocrx_word' id='word_1_123' title='bbox 619 959 667 979; x_wconf 78' lang='eng'>265</span> <span class='ocrx_word' id='word_1_124' title='bbox 676 959 815 984; x_wconf 81' lang='eng' dir='ltr'>(EU541596)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 596 1000 829 1024; baseline 0 -5"><span class='ocrx_word' id='word_1_125' title='bbox 596 1000 631 1019; x_wconf 91' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_126' title='bbox 641 1000 687 1019; x_wconf 89' lang='eng' dir='ltr'>2B2</span> <span class='ocrx_word' id='word_1_127' title='bbox 697 1000 829 1024; x_wconf 87' lang='eng' dir='ltr'>(FJ214960)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 551 1040 840 1065; baseline 0.007 -8"><span class='ocrx_word' id='word_1_128' title='bbox 551 1041 574 1057; x_wconf 87' lang='eng'>98</span> <span class='ocrx_word' id='word_1_129' title='bbox 603 1040 639 1059; x_wconf 89' lang='eng' dir='ltr'><em>VB</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 649 1040 697 1060; x_wconf 85' lang='eng'><strong>16.3</strong></span> <span class='ocrx_word' id='word_1_131' title='bbox 707 1040 840 1065; x_wconf 85' lang='eng' dir='ltr'>(FJ214961)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 523 1078 960 1104; baseline 0 -5"><span class='ocrx_word' id='word_1_132' title='bbox 523 1080 540 1099; x_wconf 96' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_133' title='bbox 553 1080 657 1099; x_wconf 70' lang='eng' dir='ltr'>comitans</span> <span class='ocrx_word' id='word_1_134' title='bbox 667 1080 720 1099; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_135' title='bbox 730 1078 813 1099; x_wconf 77' lang='eng' dir='ltr'>2341GT</span> <span class='ocrx_word' id='word_1_136' title='bbox 823 1080 960 1104; x_wconf 86' lang='eng' dir='ltr'>(EU541597)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 632 1118 1075 1145; baseline -0.002 -5"><span class='ocrx_word' id='word_1_137' title='bbox 632 1120 649 1139; x_wconf 91' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_138' title='bbox 662 1120 771 1140; x_wconf 83' lang='eng' dir='ltr'>inusitatus</span> <span class='ocrx_word' id='word_1_139' title='bbox 781 1120 834 1140; x_wconf 89' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_140' title='bbox 845 1118 928 1139; x_wconf 74' lang='eng' dir='ltr'>23434T</span> <span class='ocrx_word' id='word_1_141' title='bbox 937 1120 1075 1145; x_wconf 87' lang='eng' dir='ltr'>(EU541600)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 614 1159 1053 1185; baseline 0 -5"><span class='ocrx_word' id='word_1_142' title='bbox 614 1161 632 1180; x_wconf 97' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_143' title='bbox 643 1161 752 1180; x_wconf 74' lang='eng' dir='ltr'><em>halioticoli</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 760 1160 812 1180; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_145' title='bbox 825 1159 906 1180; x_wconf 78' lang='eng' dir='ltr'>18542T</span> <span class='ocrx_word' id='word_1_146' title='bbox 916 1161 1053 1185; x_wconf 85' lang='eng' dir='ltr'>(EU871966)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 630 1201 1052 1226; baseline 0 -6"><span class='ocrx_word' id='word_1_147' title='bbox 630 1201 647 1220; x_wconf 95' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_148' title='bbox 658 1202 766 1221; x_wconf 82' lang='eng' dir='ltr'>halloticoll</span> <span class='ocrx_word' id='word_1_149' title='bbox 774 1201 827 1221; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_150' title='bbox 840 1202 909 1220; x_wconf 87' lang='eng'>19963</span> <span class='ocrx_word' id='word_1_151' title='bbox 919 1201 1052 1226; x_wconf 83' lang='eng' dir='ltr'>(AJ842432)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 554 1239 1013 1265; baseline -0.002 -4"><span class='ocrx_word' id='word_1_152' title='bbox 554 1245 577 1261; x_wconf 86' lang='eng'>95</span> <span class='ocrx_word' id='word_1_153' title='bbox 607 1241 625 1260; x_wconf 94' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_154' title='bbox 637 1246 715 1261; x_wconf 85' lang='eng' dir='ltr'><em>ezurae</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 725 1241 779 1261; x_wconf 89' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_156' title='bbox 791 1239 872 1260; x_wconf 78' lang='eng' dir='ltr'>19970T</span> <span class='ocrx_word' id='word_1_157' title='bbox 881 1241 1013 1265; x_wconf 83' lang='eng' dir='ltr'>(AJ842413)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 619 1281 1014 1306; baseline 0 -5"><span class='ocrx_word' id='word_1_158' title='bbox 619 1282 637 1301; x_wconf 88' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_159' title='bbox 649 1286 728 1301; x_wconf 89' lang='eng' dir='ltr'>ezurae</span> <span class='ocrx_word' id='word_1_160' title='bbox 738 1281 791 1301; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_161' title='bbox 803 1282 872 1301; x_wconf 88' lang='eng'>19979</span> <span class='ocrx_word' id='word_1_162' title='bbox 883 1282 1014 1306; x_wconf 88' lang='eng' dir='ltr'>(AJ842414)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 657 1322 1080 1346; baseline -0.002 -4"><span class='ocrx_word' id='word_1_163' title='bbox 657 1322 675 1341; x_wconf 93' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_164' title='bbox 687 1322 794 1342; x_wconf 86' lang='eng' dir='ltr'>neonatus</span> <span class='ocrx_word' id='word_1_165' title='bbox 804 1322 857 1342; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_166' title='bbox 869 1323 938 1341; x_wconf 88' lang='eng'>19976</span> <span class='ocrx_word' id='word_1_167' title='bbox 949 1322 1080 1346; x_wconf 84' lang='eng' dir='ltr'>(AJ842476)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 637 1361 1060 1386; baseline 0 -5"><span class='ocrx_word' id='word_1_168' title='bbox 637 1362 654 1381; x_wconf 96' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_169' title='bbox 666 1362 773 1381; x_wconf 80' lang='eng' dir='ltr'>neonatus</span> <span class='ocrx_word' id='word_1_170' title='bbox 783 1361 836 1381; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_171' title='bbox 849 1362 917 1381; x_wconf 86' lang='eng'>19978</span> <span class='ocrx_word' id='word_1_172' title='bbox 928 1362 1060 1386; x_wconf 86' lang='eng' dir='ltr'>(AJ842477)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 694 1400 1086 1427; baseline 0 -6"><span class='ocrx_word' id='word_1_173' title='bbox 694 1402 712 1421; x_wconf 92' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_174' title='bbox 723 1407 783 1422; x_wconf 85' lang='eng' dir='ltr'><em>rarus</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 792 1402 846 1422; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_176' title='bbox 856 1400 939 1421; x_wconf 77' lang='eng' dir='ltr'>23674T</span> <span class='ocrx_word' id='word_1_177' title='bbox 949 1402 1086 1427; x_wconf 84' lang='eng' dir='ltr'>(EU541599)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 781 1440 1201 1467; baseline -0.002 -5"><span class='ocrx_word' id='word_1_178' title='bbox 781 1442 799 1461; x_wconf 92' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_179' title='bbox 810 1442 897 1467; x_wconf 82' lang='eng' dir='ltr'>gallicus</span> <span class='ocrx_word' id='word_1_180' title='bbox 906 1442 960 1462; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_181' title='bbox 972 1440 1054 1461; x_wconf 82' lang='eng' dir='ltr'>16639T</span> <span class='ocrx_word' id='word_1_182' title='bbox 1064 1442 1201 1467; x_wconf 85' lang='eng' dir='ltr'>(EU541601)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 781 1480 1240 1508; baseline -0.002 -5"><span class='ocrx_word' id='word_1_183' title='bbox 781 1483 799 1502; x_wconf 70' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_184' title='bbox 810 1483 957 1508; x_wconf 82' lang='eng' dir='ltr'>proteolyticus</span> <span class='ocrx_word' id='word_1_185' title='bbox 967 1482 1020 1503; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_186' title='bbox 1030 1480 1099 1502; x_wconf 77' lang='eng' dir='ltr'>3772T</span> <span class='ocrx_word' id='word_1_187' title='bbox 1109 1483 1240 1508; x_wconf 84' lang='eng' dir='ltr'>(AJ842499)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 3 801 541 863">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 3 801 541 863">
+     <span class='ocr_line' id='line_1_49' title="bbox 3 801 541 828; baseline -0.011 0"><span class='ocrx_word' id='word_1_188' title='bbox 3 801 36 828; x_wconf 81' lang='eng' dir='ltr'>(b)</span> <span class='ocrx_word' id='word_1_189' title='bbox 517 806 541 822; x_wconf 89' lang='eng'>55</span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 511 847 535 863; baseline 0 0"><span class='ocrx_word' id='word_1_190' title='bbox 511 847 535 863; x_wconf 87' lang='eng'>45</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 26 802 650 1453">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 26 802 650 1453">
+     <span class='ocr_line' id='line_1_51' title="bbox 539 802 576 836; baseline 0 0"><span class='ocrx_word' id='word_1_191' title='bbox 539 802 576 836; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 532 836 561 917; baseline 0 0"><span class='ocrx_word' id='word_1_192' title='bbox 532 836 561 917; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 128 917 574 996; baseline 0 -31"><span class='ocrx_word' id='word_1_193' title='bbox 128 917 574 996; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 128 996 591 1036; baseline 0 0"><span class='ocrx_word' id='word_1_194' title='bbox 128 996 591 1036; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 128 1036 516 1077; baseline 0 1183"><span class='ocrx_word' id='word_1_195' title='bbox 128 1036 516 1077; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 89 1077 523 1117; baseline 0 1143"><span class='ocrx_word' id='word_1_196' title='bbox 89 1077 523 1117; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 89 1117 625 1158; baseline 0 0"><span class='ocrx_word' id='word_1_197' title='bbox 89 1117 625 1158; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 89 1158 614 1198; baseline 0 1062"><span class='ocrx_word' id='word_1_198' title='bbox 89 1158 614 1198; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 89 1198 622 1238; baseline 0 0"><span class='ocrx_word' id='word_1_199' title='bbox 89 1198 622 1238; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 49 1238 554 1278; baseline 0 982"><span class='ocrx_word' id='word_1_200' title='bbox 49 1238 554 1278; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 49 1278 619 1318; baseline 0 942"><span class='ocrx_word' id='word_1_201' title='bbox 49 1278 619 1318; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 26 1318 650 1349; baseline 0 911"><span class='ocrx_word' id='word_1_202' title='bbox 26 1318 650 1349; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 26 1349 637 1398; baseline 0 862"><span class='ocrx_word' id='word_1_203' title='bbox 26 1349 637 1398; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 26 1398 630 1453; baseline 0 807"><span class='ocrx_word' id='word_1_204' title='bbox 26 1398 630 1453; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 76 908 526 925">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 76 908 526 925">
+     <span class='ocr_line' id='line_1_65' title="bbox 76 908 526 925; baseline 0.002 -1"><span class='ocrx_word' id='word_1_205' title='bbox 76 908 118 924; x_wconf 87' lang='eng'>0.02</span> <span class='ocrx_word' id='word_1_206' title='bbox 491 909 526 925; x_wconf 90' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 96 1409 683 1411">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 96 1409 683 1411">
+     <span class='ocr_line' id='line_1_66' title="bbox 96 1409 683 1411; baseline 0 849"><span class='ocrx_word' id='word_1_207' title='bbox 96 1409 683 1411; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 53 1449 770 1451">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 53 1449 770 1451">
+     <span class='ocr_line' id='line_1_67' title="bbox 53 1449 770 1451; baseline 0 809"><span class='ocrx_word' id='word_1_208' title='bbox 53 1449 770 1451; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 28 1360 30 1491">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 28 1360 30 1491">
+     <span class='ocr_line' id='line_1_68' title="bbox 28 1360 30 1491; baseline 0 769"><span class='ocrx_word' id='word_1_209' title='bbox 28 1360 30 1491; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 28 1489 770 1491">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 28 1489 770 1491">
+     <span class='ocr_line' id='line_1_69' title="bbox 28 1489 770 1491; baseline 0 769"><span class='ocrx_word' id='word_1_210' title='bbox 28 1489 770 1491; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 385 1564 587 1907">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 385 1670 576 1907">
+     <span class='ocr_line' id='line_1_70' title="bbox 483 1670 576 1832; baseline 0 -105"><span class='ocrx_word' id='word_1_211' title='bbox 483 1670 576 1832; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 385 1832 498 1907; baseline 0 0"><span class='ocrx_word' id='word_1_212' title='bbox 385 1832 498 1907; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 3 1561 1173 2166">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 3 1561 1173 2166">
+     <span class='ocr_line' id='line_1_72' title="bbox 3 1561 861 1598; baseline 0 -15"><span class='ocrx_word' id='word_1_213' title='bbox 3 1570 34 1598; x_wconf 70' lang='eng' dir='ltr'>(c)</span> <span class='ocrx_word' id='word_1_214' title='bbox 534 1570 557 1586; x_wconf 75' lang='eng'>78</span> <span class='ocrx_word' id='word_1_215' title='bbox 593 1564 628 1583; x_wconf 93' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_216' title='bbox 639 1561 713 1583; x_wconf 91' lang='eng' dir='ltr'>15.11T</span> <span class='ocrx_word' id='word_1_217' title='bbox 722 1564 861 1588; x_wconf 90' lang='eng' dir='ltr'>(EU541550)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_73' title="bbox 527 1596 784 1623; baseline 0 -5"><span class='ocrx_word' id='word_1_218' title='bbox 527 1596 551 1612; x_wconf 74' lang='eng'>68</span> <span class='ocrx_word' id='word_1_219' title='bbox 576 1598 592 1617; x_wconf 91' lang='eng' dir='ltr'><strong>C</strong></span> <span class='ocrx_word' id='word_1_220' title='bbox 602 1599 636 1618; x_wconf 88' lang='eng'><strong>5.5</strong></span> <span class='ocrx_word' id='word_1_221' title='bbox 646 1598 784 1623; x_wconf 90' lang='eng' dir='ltr'>(EU541552)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_74' title="bbox 521 1633 791 1658; baseline 0.004 -6"><span class='ocrx_word' id='word_1_222' title='bbox 521 1639 545 1656; x_wconf 78' lang='eng'>79</span> <span class='ocrx_word' id='word_1_223' title='bbox 573 1633 589 1652; x_wconf 89' lang='eng' dir='ltr'><strong>C</strong></span> <span class='ocrx_word' id='word_1_224' title='bbox 598 1633 649 1653; x_wconf 90' lang='eng'>4.15</span> <span class='ocrx_word' id='word_1_225' title='bbox 658 1633 791 1658; x_wconf 84' lang='eng' dir='ltr'>(FJ214954)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_75' title="bbox 585 1668 1173 1694; baseline 0.003 -7"><span class='ocrx_word' id='word_1_226' title='bbox 585 1668 620 1688; x_wconf 92' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_227' title='bbox 630 1668 677 1688; x_wconf 82' lang='eng'>265</span> <span class='ocrx_word' id='word_1_228' title='bbox 687 1668 825 1693; x_wconf 89' lang='eng' dir='ltr'>(EU541551)</span> <span class='ocrx_word' id='word_1_229' title='bbox 920 1670 940 1689; x_wconf 95' lang='eng' dir='ltr'><em>V.</em></span> <span class='ocrx_word' id='word_1_230' title='bbox 950 1670 1069 1694; x_wconf 86' lang='eng' dir='ltr'>breoganii</span> <span class='ocrx_word' id='word_1_231' title='bbox 1076 1674 1111 1694; x_wconf 87' lang='eng' dir='ltr'>sp.</span> <span class='ocrx_word' id='word_1_232' title='bbox 1123 1674 1173 1689; x_wconf 91' lang='eng' dir='ltr'><strong>nov.</strong></span> 
+     </span>
+     <span class='ocr_line' id='line_1_76' title="bbox 577 1703 810 1728; baseline 0.004 -6"><span class='ocrx_word' id='word_1_233' title='bbox 577 1703 612 1722; x_wconf 94' lang='eng' dir='ltr'>RD</span> <span class='ocrx_word' id='word_1_234' title='bbox 622 1703 667 1722; x_wconf 81' lang='eng'>232</span> <span class='ocrx_word' id='word_1_235' title='bbox 678 1703 810 1728; x_wconf 85' lang='eng' dir='ltr'>(FJ214956)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_77' title="bbox 576 1739 811 1763; baseline 0 -5"><span class='ocrx_word' id='word_1_236' title='bbox 576 1739 610 1758; x_wconf 92' lang='eng' dir='ltr'><em>VB</em></span> <span class='ocrx_word' id='word_1_237' title='bbox 621 1739 669 1758; x_wconf 87' lang='eng'><strong>16.3</strong></span> <span class='ocrx_word' id='word_1_238' title='bbox 679 1739 811 1763; x_wconf 85' lang='eng' dir='ltr'>(FJ214957)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_78' title="bbox 575 1773 830 1798; baseline 0 -5"><span class='ocrx_word' id='word_1_239' title='bbox 575 1773 628 1793; x_wconf 91' lang='eng' dir='ltr'>CMJ</span> <span class='ocrx_word' id='word_1_240' title='bbox 639 1774 687 1793; x_wconf 87' lang='eng'>13.7</span> <span class='ocrx_word' id='word_1_241' title='bbox 697 1774 830 1798; x_wconf 88' lang='eng' dir='ltr'>(FJ214955)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_79' title="bbox 584 1807 1025 1833; baseline 0 -5"><span class='ocrx_word' id='word_1_242' title='bbox 584 1809 602 1828; x_wconf 91' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_243' title='bbox 613 1809 727 1833; x_wconf 80' lang='eng' dir='ltr'>superstes</span> <span class='ocrx_word' id='word_1_244' title='bbox 737 1808 789 1828; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_245' title='bbox 800 1807 1025 1833; x_wconf 64' lang='eng' dir='ltr'>21323T(EF601344)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_80' title="bbox 518 1844 1015 1868; baseline 0.004 -7"><span class='ocrx_word' id='word_1_246' title='bbox 518 1844 552 1861; x_wconf 70' lang='eng'>100</span> <span class='ocrx_word' id='word_1_247' title='bbox 584 1844 601 1863; x_wconf 94' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_248' title='bbox 613 1844 726 1868; x_wconf 83' lang='eng' dir='ltr'>superstes</span> <span class='ocrx_word' id='word_1_249' title='bbox 736 1844 789 1863; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_250' title='bbox 799 1844 870 1863; x_wconf 80' lang='eng'>21319</span> <span class='ocrx_word' id='word_1_251' title='bbox 881 1844 1015 1868; x_wconf 80' lang='eng' dir='ltr'>(EF601348)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_81' title="bbox 584 1877 1020 1903; baseline -0.002 -4"><span class='ocrx_word' id='word_1_252' title='bbox 584 1879 601 1898; x_wconf 95' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_253' title='bbox 613 1879 717 1899; x_wconf 87' lang='eng' dir='ltr'>comitans</span> <span class='ocrx_word' id='word_1_254' title='bbox 727 1879 780 1899; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_255' title='bbox 791 1877 874 1898; x_wconf 74' lang='eng' dir='ltr'>23416T</span> <span class='ocrx_word' id='word_1_256' title='bbox 883 1879 1020 1903; x_wconf 78' lang='eng' dir='ltr'>(EU541553)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_82' title="bbox 460 1912 1030 1938; baseline 0 -5"><span class='ocrx_word' id='word_1_257' title='bbox 460 1914 484 1930; x_wconf 87' lang='eng'>50</span> <span class='ocrx_word' id='word_1_258' title='bbox 588 1914 605 1933; x_wconf 94' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_259' title='bbox 617 1914 727 1933; x_wconf 76' lang='eng' dir='ltr'>inusitatus</span> <span class='ocrx_word' id='word_1_260' title='bbox 737 1913 790 1933; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_261' title='bbox 801 1912 884 1933; x_wconf 82' lang='eng' dir='ltr'>23434T</span> <span class='ocrx_word' id='word_1_262' title='bbox 893 1914 1030 1938; x_wconf 88' lang='eng' dir='ltr'>(EU541555)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_83' title="bbox 677 1947 1069 1973; baseline 0 -5"><span class='ocrx_word' id='word_1_263' title='bbox 677 1949 695 1968; x_wconf 85' lang='eng' dir='ltr'>V</span> <span class='ocrx_word' id='word_1_264' title='bbox 706 1953 766 1968; x_wconf 85' lang='eng' dir='ltr'><em>rarus</em></span> <span class='ocrx_word' id='word_1_265' title='bbox 775 1948 829 1968; x_wconf 94' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_266' title='bbox 839 1947 922 1968; x_wconf 83' lang='eng' dir='ltr'>23674T</span> <span class='ocrx_word' id='word_1_267' title='bbox 931 1949 1069 1973; x_wconf 89' lang='eng' dir='ltr'>(EU541554)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_84' title="bbox 576 1982 985 2008; baseline 0 -5"><span class='ocrx_word' id='word_1_268' title='bbox 576 1984 594 2003; x_wconf 96' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_269' title='bbox 606 1988 685 2003; x_wconf 89' lang='eng' dir='ltr'>ezurae</span> <span class='ocrx_word' id='word_1_270' title='bbox 695 1983 748 2003; x_wconf 95' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_271' title='bbox 760 1982 842 2003; x_wconf 81' lang='eng' dir='ltr'>1997GT</span> <span class='ocrx_word' id='word_1_272' title='bbox 851 1984 985 2008; x_wconf 81' lang='eng' dir='ltr'>(EF601309)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_85' title="bbox 572 2018 969 2043; baseline 0 -5"><span class='ocrx_word' id='word_1_273' title='bbox 572 2019 589 2038; x_wconf 95' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_274' title='bbox 601 2023 680 2038; x_wconf 76' lang='eng' dir='ltr'>ezurae</span> <span class='ocrx_word' id='word_1_275' title='bbox 690 2018 743 2038; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_276' title='bbox 755 2019 824 2038; x_wconf 85' lang='eng'>19979</span> <span class='ocrx_word' id='word_1_277' title='bbox 835 2019 969 2043; x_wconf 82' lang='eng' dir='ltr'>(EF601313)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_86' title="bbox 561 2054 1011 2079; baseline 0 -6"><span class='ocrx_word' id='word_1_278' title='bbox 561 2059 575 2061; x_wconf 77' lang='eng'>—</span> <span class='ocrx_word' id='word_1_279' title='bbox 586 2054 604 2073; x_wconf 87' lang='eng' dir='ltr'>V</span> <span class='ocrx_word' id='word_1_280' title='bbox 616 2054 723 2074; x_wconf 82' lang='eng' dir='ltr'>haliotico/i</span> <span class='ocrx_word' id='word_1_281' title='bbox 732 2054 785 2074; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_282' title='bbox 797 2055 866 2073; x_wconf 87' lang='eng'>19700</span> <span class='ocrx_word' id='word_1_283' title='bbox 877 2054 1011 2079; x_wconf 86' lang='eng' dir='ltr'>(EF601267)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_87' title="bbox 525 2087 1041 2166; baseline 0 -57"><span class='ocrx_word' id='word_1_284' title='bbox 525 2102 549 2119; x_wconf 72' lang='eng'>95</span> <span class='ocrx_word' id='word_1_285' title='bbox 560 2089 623 2166; x_wconf 45' lang='eng' dir='ltr'><em>ﬁV.</em></span> <span class='ocrx_word' id='word_1_286' title='bbox 635 2089 803 2109; x_wconf 69' lang='eng' dir='ltr'>halioticol/‘LMG</span> <span class='ocrx_word' id='word_1_287' title='bbox 816 2087 897 2109; x_wconf 78' lang='eng' dir='ltr'>18542T</span> <span class='ocrx_word' id='word_1_288' title='bbox 907 2089 1041 2114; x_wconf 85' lang='eng' dir='ltr'>(EF601260)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 440 1816 475 1832">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 440 1816 475 1832">
+     <span class='ocr_line' id='line_1_88' title="bbox 440 1816 475 1832; baseline 0 0"><span class='ocrx_word' id='word_1_289' title='bbox 440 1816 475 1832; x_wconf 90' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 496 1883 572 1885">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 496 1883 572 1885">
+     <span class='ocr_line' id='line_1_89' title="bbox 496 1883 572 1885; baseline 0 375"><span class='ocrx_word' id='word_1_290' title='bbox 496 1883 572 1885; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 494 1883 496 1921">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 494 1883 496 1921">
+     <span class='ocr_line' id='line_1_90' title="bbox 494 1883 496 1921; baseline 0 339"><span class='ocrx_word' id='word_1_291' title='bbox 494 1883 496 1921; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 335 1898 370 1914">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 335 1898 370 1914">
+     <span class='ocr_line' id='line_1_91' title="bbox 335 1898 370 1914; baseline 0 0"><span class='ocrx_word' id='word_1_292' title='bbox 335 1898 370 1914; x_wconf 82' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 211 1919 577 1921">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 211 1919 577 1921">
+     <span class='ocr_line' id='line_1_92' title="bbox 211 1919 577 1921; baseline 0 339"><span class='ocrx_word' id='word_1_293' title='bbox 211 1919 577 1921; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 381 1949 670 2091">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 381 1949 670 2091">
+     <span class='ocr_line' id='line_1_93' title="bbox 381 1949 670 2021; baseline 0 -52"><span class='ocrx_word' id='word_1_294' title='bbox 381 1949 670 2021; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_94' title="bbox 381 2021 562 2042; baseline 0 218"><span class='ocrx_word' id='word_1_295' title='bbox 381 2021 562 2042; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_95' title="bbox 430 2042 559 2091; baseline 0 169"><span class='ocrx_word' id='word_1_296' title='bbox 430 2042 559 2091; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 383 1838 385 2003">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 383 1838 385 2003">
+     <span class='ocr_line' id='line_1_96' title="bbox 383 1838 385 2003; baseline 0 257"><span class='ocrx_word' id='word_1_297' title='bbox 383 1838 385 2003; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 3 2051 215 2095">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 3 2051 215 2095">
+     <span class='ocr_line' id='line_1_97' title="bbox 3 2051 215 2095; baseline 0 165"><span class='ocrx_word' id='word_1_298' title='bbox 3 2051 215 2095; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 558 1989 561 2122">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 558 1989 561 2122">
+     <span class='ocr_line' id='line_1_98' title="bbox 558 1989 561 2122; baseline 0 138"><span class='ocrx_word' id='word_1_299' title='bbox 558 1989 561 2122; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 539 2124 1095 2254">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 539 2124 1095 2254">
+     <span class='ocr_line' id='line_1_99' title="bbox 539 2124 1035 2150; baseline -0.002 -6"><span class='ocrx_word' id='word_1_300' title='bbox 539 2133 563 2150; x_wconf 75' lang='eng'>55</span> <span class='ocrx_word' id='word_1_301' title='bbox 609 2124 627 2143; x_wconf 95' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_302' title='bbox 639 2125 746 2144; x_wconf 81' lang='eng' dir='ltr'>neonatus</span> <span class='ocrx_word' id='word_1_303' title='bbox 756 2124 809 2144; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_304' title='bbox 821 2125 890 2143; x_wconf 90' lang='eng'>19978</span> <span class='ocrx_word' id='word_1_305' title='bbox 901 2124 1035 2149; x_wconf 85' lang='eng' dir='ltr'>(EF601312)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_100' title="bbox 555 2157 1042 2184; baseline 0.004 -8"><span class='ocrx_word' id='word_1_306' title='bbox 555 2160 579 2176; x_wconf 82' lang='eng'>93</span> <span class='ocrx_word' id='word_1_307' title='bbox 607 2159 625 2178; x_wconf 96' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_308' title='bbox 637 2160 744 2179; x_wconf 83' lang='eng' dir='ltr'>neonatus</span> <span class='ocrx_word' id='word_1_309' title='bbox 754 2159 806 2179; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_310' title='bbox 819 2157 1042 2184; x_wconf 80' lang='eng' dir='ltr'>19973T(EF601310)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_101' title="bbox 657 2192 1072 2219; baseline -0.002 -5"><span class='ocrx_word' id='word_1_311' title='bbox 657 2194 674 2213; x_wconf 92' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_312' title='bbox 686 2194 772 2219; x_wconf 80' lang='eng' dir='ltr'>gal/icus</span> <span class='ocrx_word' id='word_1_313' title='bbox 782 2194 835 2214; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_314' title='bbox 845 2192 928 2213; x_wconf 75' lang='eng' dir='ltr'>21330T</span> <span class='ocrx_word' id='word_1_315' title='bbox 938 2194 1072 2219; x_wconf 84' lang='eng' dir='ltr'>(EF601347)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_102' title="bbox 677 2229 1095 2254; baseline 0 -5"><span class='ocrx_word' id='word_1_316' title='bbox 677 2230 695 2249; x_wconf 95' lang='eng' dir='ltr'>V.</span> <span class='ocrx_word' id='word_1_317' title='bbox 707 2230 806 2249; x_wconf 86' lang='eng' dir='ltr'>cholerae</span> <span class='ocrx_word' id='word_1_318' title='bbox 816 2229 869 2249; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_319' title='bbox 879 2230 950 2249; x_wconf 88' lang='eng'>21698</span> <span class='ocrx_word' id='word_1_320' title='bbox 960 2230 1095 2254; x_wconf 85' lang='eng' dir='ltr'>(EF601300)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 5 2059 7 2236">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 5 2059 7 2236">
+     <span class='ocr_line' id='line_1_103' title="bbox 5 2059 7 2236; baseline 0 24"><span class='ocrx_word' id='word_1_321' title='bbox 5 2059 7 2236; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 5 2234 666 2236">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 5 2234 666 2236">
+     <span class='ocr_line' id='line_1_104' title="bbox 5 2234 666 2236; baseline 0 24"><span class='ocrx_word' id='word_1_322' title='bbox 5 2234 666 2236; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003442-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003442-0-001.pbm.png
new file mode 100644
index 00000000..788383d6
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003442-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003442-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003442-0-001.pbm.png.hocr
new file mode 100644
index 00000000..4c74a8cd
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003442-0-001.pbm.png.hocr
@@ -0,0 +1,212 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003442-0-001.pbm.png"; bbox 0 0 1302 2256; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 183 13 1071 670">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 183 13 1071 670">
+     <span class='ocr_line' id='line_1_1' title="bbox 262 13 878 48; baseline 0 -14"><span class='ocrx_word' id='word_1_1' title='bbox 262 29 288 48; x_wconf 67' lang='eng'>89</span> <span class='ocrx_word' id='word_1_2' title='bbox 320 13 343 34; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_3' title='bbox 355 13 525 34; x_wconf 85' lang='eng' dir='ltr'>coerulescens</span> <span class='ocrx_word' id='word_1_4' title='bbox 535 13 613 34; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_5' title='bbox 626 13 715 34; x_wconf 83' lang='eng' dir='ltr'>12758T</span> <span class='ocrx_word' id='word_1_6' title='bbox 725 13 878 40; x_wconf 87' lang='eng' dir='ltr'>(AB184122)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 336 42 848 69; baseline 0 -6"><span class='ocrx_word' id='word_1_7' title='bbox 336 42 358 63; x_wconf 94' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_8' title='bbox 370 42 507 63; x_wconf 85' lang='eng' dir='ltr'>abikoensis</span> <span class='ocrx_word' id='word_1_9' title='bbox 517 42 595 63; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_10' title='bbox 608 42 685 63; x_wconf 86' lang='eng'>12887</span> <span class='ocrx_word' id='word_1_11' title='bbox 696 42 848 69; x_wconf 85' lang='eng' dir='ltr'>(AB249967)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 255 70 820 97; baseline 0.002 -6"><span class='ocrx_word' id='word_1_12' title='bbox 255 72 277 91; x_wconf 86' lang='eng'>81</span> <span class='ocrx_word' id='word_1_13' title='bbox 314 70 336 92; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_14' title='bbox 349 70 478 92; x_wconf 87' lang='eng' dir='ltr'>ehimensis</span> <span class='ocrx_word' id='word_1_15' title='bbox 489 70 567 92; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_16' title='bbox 579 70 656 92; x_wconf 88' lang='eng'>13802</span> <span class='ocrx_word' id='word_1_17' title='bbox 667 70 820 97; x_wconf 87' lang='eng' dir='ltr'>(AB184493)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 238 99 880 129; baseline -0.002 -8"><span class='ocrx_word' id='word_1_18' title='bbox 238 110 264 129; x_wconf 74' lang='eng'>53</span> <span class='ocrx_word' id='word_1_19' title='bbox 314 99 336 121; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_20' title='bbox 348 99 554 121; x_wconf 78' lang='eng' dir='ltr'>Iuteoverﬁcil/atus</span> <span class='ocrx_word' id='word_1_21' title='bbox 564 99 642 121; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_22' title='bbox 654 99 715 121; x_wconf 90' lang='eng'>3722</span> <span class='ocrx_word' id='word_1_23' title='bbox 727 99 880 126; x_wconf 85' lang='eng' dir='ltr'>(AB184791)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 305 127 896 155; baseline 0 -6"><span class='ocrx_word' id='word_1_24' title='bbox 305 127 327 149; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_25' title='bbox 339 128 554 149; x_wconf 83' lang='eng' dir='ltr'>roseovertici/Iatus</span> <span class='ocrx_word' id='word_1_26' title='bbox 565 127 643 149; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_27' title='bbox 656 128 732 149; x_wconf 89' lang='eng'>15920</span> <span class='ocrx_word' id='word_1_28' title='bbox 744 127 896 155; x_wconf 87' lang='eng' dir='ltr'>(AB184715)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 352 156 876 183; baseline 0 -6"><span class='ocrx_word' id='word_1_29' title='bbox 352 156 375 177; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_30' title='bbox 387 156 524 177; x_wconf 82' lang='eng' dir='ltr'>Iuteireticuli</span> <span class='ocrx_word' id='word_1_31' title='bbox 533 156 611 177; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_32' title='bbox 624 156 713 177; x_wconf 83' lang='eng' dir='ltr'>13422T</span> <span class='ocrx_word' id='word_1_33' title='bbox 723 156 876 183; x_wconf 84' lang='eng' dir='ltr'>(AB249969)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 219 185 919 212; baseline 0 -6"><span class='ocrx_word' id='word_1_34' title='bbox 219 190 245 209; x_wconf 79' lang='eng' dir='ltr'>go</span> <span class='ocrx_word' id='word_1_35' title='bbox 260 193 282 211; x_wconf 76' lang='eng'>51</span> <span class='ocrx_word' id='word_1_36' title='bbox 359 185 382 206; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_37' title='bbox 395 185 552 206; x_wconf 88' lang='eng' dir='ltr'>varsoviensis</span> <span class='ocrx_word' id='word_1_38' title='bbox 563 185 638 206; x_wconf 89' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_39' title='bbox 649 185 751 206; x_wconf 85' lang='eng' dir='ltr'>B-3589T</span> <span class='ocrx_word' id='word_1_40' title='bbox 762 185 919 212; x_wconf 84' lang='eng' dir='ltr'>(DQOZ6653)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 261 213 894 240; baseline 0 -6"><span class='ocrx_word' id='word_1_41' title='bbox 261 221 287 240; x_wconf 83' lang='eng'>55</span> <span class='ocrx_word' id='word_1_42' title='bbox 318 213 341 234; x_wconf 87' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_43' title='bbox 353 213 541 240; x_wconf 86' lang='eng' dir='ltr'>sapporonensis</span> <span class='ocrx_word' id='word_1_44' title='bbox 551 213 630 234; x_wconf 85' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_45' title='bbox 642 213 731 234; x_wconf 84' lang='eng' dir='ltr'>13823T</span> <span class='ocrx_word' id='word_1_46' title='bbox 741 213 894 240; x_wconf 89' lang='eng' dir='ltr'>(AB184508)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 183 242 927 270; baseline -0.001 -6"><span class='ocrx_word' id='word_1_47' title='bbox 183 251 209 270; x_wconf 80' lang='eng'>73</span> <span class='ocrx_word' id='word_1_48' title='bbox 282 245 306 264; x_wconf 84' lang='eng'>9</span> <span class='ocrx_word' id='word_1_49' title='bbox 319 242 341 263; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_50' title='bbox 353 242 574 269; x_wconf 81' lang='eng' dir='ltr'>griseoverticil/atus</span> <span class='ocrx_word' id='word_1_51' title='bbox 584 242 663 263; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_52' title='bbox 676 242 764 263; x_wconf 88' lang='eng' dir='ltr'>13420T</span> <span class='ocrx_word' id='word_1_53' title='bbox 774 242 927 269; x_wconf 91' lang='eng' dir='ltr'>(AB184862)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 323 270 788 297; baseline 0.002 -6"><span class='ocrx_word' id='word_1_54' title='bbox 323 270 345 292; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_55' title='bbox 357 271 459 292; x_wconf 89' lang='eng' dir='ltr'>Ii/acinus</span> <span class='ocrx_word' id='word_1_56' title='bbox 470 270 528 292; x_wconf 92' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_57' title='bbox 539 270 630 292; x_wconf 87' lang='eng' dir='ltr'>20059T</span> <span class='ocrx_word' id='word_1_58' title='bbox 640 270 788 297; x_wconf 85' lang='eng' dir='ltr'>(AJ781346)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 283 299 946 326; baseline 0 -6"><span class='ocrx_word' id='word_1_59' title='bbox 283 304 309 323; x_wconf 79' lang='eng'>98</span> <span class='ocrx_word' id='word_1_60' title='bbox 383 299 405 321; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_61' title='bbox 417 299 593 321; x_wconf 88' lang='eng' dir='ltr'>hiroshimensis</span> <span class='ocrx_word' id='word_1_62' title='bbox 603 299 682 321; x_wconf 92' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_63' title='bbox 695 299 783 321; x_wconf 89' lang='eng' dir='ltr'>12785T</span> <span class='ocrx_word' id='word_1_64' title='bbox 793 299 946 326; x_wconf 89' lang='eng' dir='ltr'>(AB184144)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 330 328 883 355; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 330 328 352 349; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_66' title='bbox 364 328 530 349; x_wconf 84' lang='eng' dir='ltr'>mobaraensis</span> <span class='ocrx_word' id='word_1_67' title='bbox 540 328 618 349; x_wconf 87' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_68' title='bbox 631 328 720 349; x_wconf 78' lang='eng' dir='ltr'>13819T</span> <span class='ocrx_word' id='word_1_69' title='bbox 730 328 883 355; x_wconf 90' lang='eng' dir='ltr'>(AB184870)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 453 356 904 384; baseline -0.002 -6"><span class='ocrx_word' id='word_1_70' title='bbox 453 356 475 378; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_71' title='bbox 488 357 578 378; x_wconf 88' lang='eng' dir='ltr'><em>albulus</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 589 356 638 378; x_wconf 92' lang='eng' dir='ltr'>IMC</span> <span class='ocrx_word' id='word_1_73' title='bbox 649 356 740 378; x_wconf 82' lang='eng'>8—0802</span> <span class='ocrx_word' id='word_1_74' title='bbox 751 356 904 384; x_wconf 78' lang='eng' dir='ltr'>(ABOZ4440)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 396 385 884 413; baseline -0.002 -6"><span class='ocrx_word' id='word_1_75' title='bbox 396 385 419 407; x_wconf 87' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_76' title='bbox 431 386 585 407; x_wconf 87' lang='eng' dir='ltr'>mashuensis</span> <span class='ocrx_word' id='word_1_77' title='bbox 595 385 655 407; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_78' title='bbox 666 386 757 407; x_wconf 88' lang='eng' dir='ltr'>40221T</span> <span class='ocrx_word' id='word_1_79' title='bbox 767 385 884 413; x_wconf 83' lang='eng' dir='ltr'>(X79323)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 450 414 908 441; baseline 0 -6"><span class='ocrx_word' id='word_1_80' title='bbox 450 414 472 435; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_81' title='bbox 484 415 580 435; x_wconf 85' lang='eng' dir='ltr'>auratus</span> <span class='ocrx_word' id='word_1_82' title='bbox 590 414 666 435; x_wconf 92' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_83' title='bbox 677 414 751 435; x_wconf 82' lang='eng' dir='ltr'>8097T</span> <span class='ocrx_word' id='word_1_84' title='bbox 761 414 908 441; x_wconf 83' lang='eng' dir='ltr'>(AJ391816)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 435 442 1060 480; baseline 0 -17"><span class='ocrx_word' id='word_1_85' title='bbox 435 461 461 480; x_wconf 74' lang='eng'>99</span> <span class='ocrx_word' id='word_1_86' title='bbox 509 442 532 463; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_87' title='bbox 544 442 708 463; x_wconf 84' lang='eng' dir='ltr'>nashvi/lensis</span> <span class='ocrx_word' id='word_1_88' title='bbox 718 442 796 463; x_wconf 93' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_89' title='bbox 809 442 897 463; x_wconf 83' lang='eng' dir='ltr'>13064T</span> <span class='ocrx_word' id='word_1_90' title='bbox 908 442 1060 469; x_wconf 89' lang='eng' dir='ltr'>(AB184286)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 509 471 1021 498; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 509 471 532 492; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_92' title='bbox 544 471 695 492; x_wconf 86' lang='eng' dir='ltr'>mauvecolor</span> <span class='ocrx_word' id='word_1_93' title='bbox 703 471 762 492; x_wconf 91' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_94' title='bbox 772 471 863 492; x_wconf 91' lang='eng' dir='ltr'>20100T</span> <span class='ocrx_word' id='word_1_95' title='bbox 874 471 1021 498; x_wconf 90' lang='eng' dir='ltr'>(AJ781358)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 493 499 1014 526; baseline -0.002 -5"><span class='ocrx_word' id='word_1_96' title='bbox 493 499 515 521; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_97' title='bbox 529 500 661 521; x_wconf 87' lang='eng' dir='ltr'>Violascens</span> <span class='ocrx_word' id='word_1_98' title='bbox 672 499 750 521; x_wconf 93' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_99' title='bbox 763 500 851 521; x_wconf 88' lang='eng' dir='ltr'>12920T</span> <span class='ocrx_word' id='word_1_100' title='bbox 862 499 1014 526; x_wconf 84' lang='eng' dir='ltr'>(AB184246)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 508 528 967 555; baseline -0.002 -5"><span class='ocrx_word' id='word_1_101' title='bbox 508 528 531 550; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_102' title='bbox 543 534 653 550; x_wconf 87' lang='eng' dir='ltr'>cremeus</span> <span class='ocrx_word' id='word_1_103' title='bbox 662 528 718 550; x_wconf 89' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_104' title='bbox 729 528 804 550; x_wconf 85' lang='eng' dir='ltr'>4362T</span> <span class='ocrx_word' id='word_1_105' title='bbox 814 528 967 555; x_wconf 87' lang='eng' dir='ltr'>(AY999744)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 378 556 973 584; baseline -0.003 -4"><span class='ocrx_word' id='word_1_106' title='bbox 378 561 400 580; x_wconf 90' lang='eng'>51</span> <span class='ocrx_word' id='word_1_107' title='bbox 562 556 584 578; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_108' title='bbox 595 557 657 584; x_wconf 84' lang='eng' dir='ltr'><em>yanii</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 664 556 700 578; x_wconf 90' lang='eng' dir='ltr'>AS</span> <span class='ocrx_word' id='word_1_110' title='bbox 711 557 810 578; x_wconf 83' lang='eng' dir='ltr'>4.1146T</span> <span class='ocrx_word' id='word_1_111' title='bbox 820 556 973 584; x_wconf 86' lang='eng' dir='ltr'>(ABO15854)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 337 579 1034 613; baseline 0 -6"><span class='ocrx_word' id='word_1_112' title='bbox 337 589 363 608; x_wconf 81' lang='eng'>60</span> <span class='ocrx_word' id='word_1_113' title='bbox 457 579 483 597; x_wconf 82' lang='eng'>97</span> <span class='ocrx_word' id='word_1_114' title='bbox 503 585 526 607; x_wconf 89' lang='eng' dir='ltr'>s.</span> <span class='ocrx_word' id='word_1_115' title='bbox 538 585 683 607; x_wconf 84' lang='eng' dir='ltr'>kurssanovii</span> <span class='ocrx_word' id='word_1_116' title='bbox 692 585 770 607; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_117' title='bbox 783 585 871 607; x_wconf 81' lang='eng' dir='ltr'>13192T</span> <span class='ocrx_word' id='word_1_118' title='bbox 882 585 1034 613; x_wconf 89' lang='eng' dir='ltr'>(AB184325)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 421 612 1071 641; baseline 0 -5"><span class='ocrx_word' id='word_1_119' title='bbox 421 612 447 630; x_wconf 82' lang='eng'>99</span> <span class='ocrx_word' id='word_1_120' title='bbox 512 614 534 636; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_121' title='bbox 546 614 742 641; x_wconf 85' lang='eng' dir='ltr'>graminofaciens</span> <span class='ocrx_word' id='word_1_122' title='bbox 752 614 811 636; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_123' title='bbox 824 614 913 636; x_wconf 83' lang='eng' dir='ltr'>19892T</span> <span class='ocrx_word' id='word_1_124' title='bbox 923 614 1071 641; x_wconf 84' lang='eng' dir='ltr'>(AJ781329)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 423 643 956 670; baseline 0 -6"><span class='ocrx_word' id='word_1_125' title='bbox 423 646 450 664; x_wconf 88' lang='eng'>85</span> <span class='ocrx_word' id='word_1_126' title='bbox 484 643 507 664; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_127' title='bbox 518 643 642 669; x_wconf 87' lang='eng' dir='ltr'>peucetius</span> <span class='ocrx_word' id='word_1_128' title='bbox 652 643 708 664; x_wconf 91' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_129' title='bbox 719 643 793 664; x_wconf 82' lang='eng' dir='ltr'>9920T</span> <span class='ocrx_word' id='word_1_130' title='bbox 804 643 956 670; x_wconf 89' lang='eng' dir='ltr'>(ABO45887)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 305 488 331 506">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 305 488 331 506">
+     <span class='ocr_line' id='line_1_24' title="bbox 305 488 331 506; baseline 0 0"><span class='ocrx_word' id='word_1_131' title='bbox 305 488 331 506; x_wconf 84' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 207 671 1164 813">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 207 671 1164 813">
+     <span class='ocr_line' id='line_1_25' title="bbox 264 671 1030 703; baseline 0 -10"><span class='ocrx_word' id='word_1_132' title='bbox 264 684 290 703; x_wconf 73' lang='eng'>86</span> <span class='ocrx_word' id='word_1_133' title='bbox 484 671 507 693; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_134' title='bbox 518 672 678 693; x_wconf 79' lang='eng' dir='ltr'>xantholiticus</span> <span class='ocrx_word' id='word_1_135' title='bbox 688 671 766 693; x_wconf 92' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_136' title='bbox 779 672 867 693; x_wconf 84' lang='eng' dir='ltr'>13354T</span> <span class='ocrx_word' id='word_1_137' title='bbox 878 671 1030 699; x_wconf 85' lang='eng' dir='ltr'>(AB184349)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 386 700 789 727; baseline 0 -6"><span class='ocrx_word' id='word_1_138' title='bbox 386 700 409 721; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_139' title='bbox 416 700 525 727; x_wconf 86' lang='eng' dir='ltr'>javensis</span> <span class='ocrx_word' id='word_1_140' title='bbox 535 700 631 721; x_wconf 89' lang='eng' dir='ltr'>B22P3T</span> <span class='ocrx_word' id='word_1_141' title='bbox 641 700 789 727; x_wconf 87' lang='eng' dir='ltr'>(AJ391833)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 255 728 870 760; baseline 0 -11"><span class='ocrx_word' id='word_1_142' title='bbox 255 741 281 760; x_wconf 73' lang='eng'>86</span> <span class='ocrx_word' id='word_1_143' title='bbox 392 728 414 750; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_144' title='bbox 425 729 620 755; x_wconf 72' lang='eng' dir='ltr'>yogyakan‘ensis</span> <span class='ocrx_word' id='word_1_145' title='bbox 629 728 712 750; x_wconf 86' lang='eng' dir='ltr'>C4R3T</span> <span class='ocrx_word' id='word_1_146' title='bbox 723 728 870 755; x_wconf 86' lang='eng' dir='ltr'>(AJ391827)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 207 757 1164 794; baseline 0 -16"><span class='ocrx_word' id='word_1_147' title='bbox 207 776 233 794; x_wconf 71' lang='eng'>78</span> <span class='ocrx_word' id='word_1_148' title='bbox 316 757 338 778; x_wconf 94' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_149' title='bbox 350 757 535 784; x_wconf 82' lang='eng' dir='ltr'>hygroscopicus</span> <span class='ocrx_word' id='word_1_150' title='bbox 544 757 626 784; x_wconf 86' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_151' title='bbox 638 757 822 784; x_wconf 88' lang='eng' dir='ltr'>hygroscopicus</span> <span class='ocrx_word' id='word_1_152' title='bbox 833 757 911 778; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_153' title='bbox 924 757 1001 778; x_wconf 88' lang='eng'>14015</span> <span class='ocrx_word' id='word_1_154' title='bbox 1012 757 1164 784; x_wconf 81' lang='eng' dir='ltr'>(AB184566)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 343 786 901 813; baseline 0 -6"><span class='ocrx_word' id='word_1_155' title='bbox 343 786 365 807; x_wconf 94' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_156' title='bbox 377 786 562 813; x_wconf 84' lang='eng' dir='ltr'>hygroscopicus</span> <span class='ocrx_word' id='word_1_157' title='bbox 570 786 647 807; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_158' title='bbox 660 786 733 807; x_wconf 92' lang='eng'>14891</span> <span class='ocrx_word' id='word_1_159' title='bbox 748 786 901 813; x_wconf 90' lang='eng' dir='ltr'>(AB217603)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 57 814 1299 1984">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 57 814 1299 1984">
+     <span class='ocr_line' id='line_1_30' title="bbox 335 814 850 842; baseline 0.002 -7"><span class='ocrx_word' id='word_1_160' title='bbox 335 814 357 836; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_161' title='bbox 370 815 557 841; x_wconf 89' lang='eng' dir='ltr'>violaceusniger</span> <span class='ocrx_word' id='word_1_162' title='bbox 565 814 607 836; x_wconf 91' lang='eng' dir='ltr'>ISP</span> <span class='ocrx_word' id='word_1_163' title='bbox 619 815 693 836; x_wconf 82' lang='eng' dir='ltr'>5563T</span> <span class='ocrx_word' id='word_1_164' title='bbox 703 814 850 842; x_wconf 86' lang='eng' dir='ltr'>(AJ391823)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 354 843 899 870; baseline 0 -6"><span class='ocrx_word' id='word_1_165' title='bbox 354 843 376 864; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_166' title='bbox 388 843 570 870; x_wconf 83' lang='eng' dir='ltr'>sporocinereus</span> <span class='ocrx_word' id='word_1_167' title='bbox 580 843 639 864; x_wconf 94' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_168' title='bbox 650 843 741 864; x_wconf 74' lang='eng' dir='ltr'>20311T</span> <span class='ocrx_word' id='word_1_169' title='bbox 751 843 899 870; x_wconf 86' lang='eng' dir='ltr'>(AJ781368)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 305 871 800 898; baseline -0.004 -4"><span class='ocrx_word' id='word_1_170' title='bbox 305 876 331 894; x_wconf 87' lang='eng'>99</span> <span class='ocrx_word' id='word_1_171' title='bbox 354 871 376 893; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_172' title='bbox 389 871 467 893; x_wconf 88' lang='eng' dir='ltr'>endus</span> <span class='ocrx_word' id='word_1_173' title='bbox 477 871 553 892; x_wconf 87' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_174' title='bbox 563 871 637 893; x_wconf 85' lang='eng' dir='ltr'>2339T</span> <span class='ocrx_word' id='word_1_175' title='bbox 647 871 800 898; x_wconf 85' lang='eng' dir='ltr'>(AY999911)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 369 896 989 928; baseline 0 -6"><span class='ocrx_word' id='word_1_176' title='bbox 369 896 381 914; x_wconf 80' lang='eng'><strong>4</strong></span> <span class='ocrx_word' id='word_1_177' title='bbox 403 901 425 922; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_178' title='bbox 438 901 636 922; x_wconf 78' lang='eng' dir='ltr'>roseisc/eroticus</span> <span class='ocrx_word' id='word_1_179' title='bbox 646 901 725 922; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_180' title='bbox 737 901 826 922; x_wconf 83' lang='eng' dir='ltr'>13002T</span> <span class='ocrx_word' id='word_1_181' title='bbox 836 901 989 928; x_wconf 88' lang='eng' dir='ltr'>(AB184251)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 334 921 850 956; baseline 0 -6"><span class='ocrx_word' id='word_1_182' title='bbox 334 921 360 939; x_wconf 77' lang='eng'>99</span> <span class='ocrx_word' id='word_1_183' title='bbox 396 929 418 950; x_wconf 88' lang='eng' dir='ltr'>s.</span> <span class='ocrx_word' id='word_1_184' title='bbox 431 929 500 950; x_wconf 87' lang='eng' dir='ltr'><em>ruber</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 508 929 586 950; x_wconf 92' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_186' title='bbox 598 929 687 950; x_wconf 83' lang='eng' dir='ltr'>14600T</span> <span class='ocrx_word' id='word_1_187' title='bbox 698 929 850 956; x_wconf 91' lang='eng' dir='ltr'>(AB184604)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 250 954 915 985; baseline 0 -6"><span class='ocrx_word' id='word_1_188' title='bbox 250 954 276 973; x_wconf 76' lang='eng'>82</span> <span class='ocrx_word' id='word_1_189' title='bbox 380 958 402 979; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_190' title='bbox 414 958 561 985; x_wconf 85' lang='eng' dir='ltr'>rubiginosus</span> <span class='ocrx_word' id='word_1_191' title='bbox 572 958 650 979; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_192' title='bbox 663 958 752 979; x_wconf 79' lang='eng' dir='ltr'>12913T</span> <span class='ocrx_word' id='word_1_193' title='bbox 762 958 915 985; x_wconf 88' lang='eng' dir='ltr'>(AB184241)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 399 986 876 1013; baseline 0 -6"><span class='ocrx_word' id='word_1_194' title='bbox 399 986 422 1008; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_195' title='bbox 434 986 523 1013; x_wconf 87' lang='eng' dir='ltr'>spiralis</span> <span class='ocrx_word' id='word_1_196' title='bbox 533 986 611 1008; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_197' title='bbox 624 986 712 1008; x_wconf 92' lang='eng' dir='ltr'>14215T</span> <span class='ocrx_word' id='word_1_198' title='bbox 723 986 876 1013; x_wconf 88' lang='eng' dir='ltr'>(AB184575)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 410 1015 929 1042; baseline 0 -6"><span class='ocrx_word' id='word_1_199' title='bbox 410 1015 432 1036; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_200' title='bbox 443 1015 576 1041; x_wconf 90' lang='eng' dir='ltr'>poonensis</span> <span class='ocrx_word' id='word_1_201' title='bbox 586 1015 665 1036; x_wconf 85' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_202' title='bbox 677 1015 766 1036; x_wconf 84' lang='eng' dir='ltr'>13485T</span> <span class='ocrx_word' id='word_1_203' title='bbox 776 1015 929 1042; x_wconf 88' lang='eng' dir='ltr'>(AB184437)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 365 1045 1173 1072; baseline 0 -6"><span class='ocrx_word' id='word_1_204' title='bbox 365 1051 391 1070; x_wconf 82' lang='eng'>97</span> <span class='ocrx_word' id='word_1_205' title='bbox 559 1045 585 1063; x_wconf 80' lang='eng'>99</span> <span class='ocrx_word' id='word_1_206' title='bbox 607 1045 630 1066; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_207' title='bbox 642 1045 831 1072; x_wconf 78' lang='eng' dir='ltr'>thermovu/garis</span> <span class='ocrx_word' id='word_1_208' title='bbox 841 1045 920 1066; x_wconf 87' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_209' title='bbox 933 1045 1009 1066; x_wconf 87' lang='eng'>16609</span> <span class='ocrx_word' id='word_1_210' title='bbox 1020 1045 1173 1072; x_wconf 80' lang='eng' dir='ltr'>(ABZ49975)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 607 1074 1194 1101; baseline 0 -6"><span class='ocrx_word' id='word_1_211' title='bbox 607 1074 630 1095; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_212' title='bbox 642 1074 825 1101; x_wconf 78' lang='eng' dir='ltr'>thermogriseus</span> <span class='ocrx_word' id='word_1_213' title='bbox 835 1074 913 1095; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_214' title='bbox 926 1074 1031 1095; x_wconf 89' lang='eng' dir='ltr'>100772T</span> <span class='ocrx_word' id='word_1_215' title='bbox 1041 1074 1194 1101; x_wconf 81' lang='eng' dir='ltr'>(ABZ49980)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 201 1093 960 1129; baseline 0 -6"><span class='ocrx_word' id='word_1_216' title='bbox 201 1093 227 1112; x_wconf 78' lang='eng'>93</span> <span class='ocrx_word' id='word_1_217' title='bbox 459 1102 481 1123; x_wconf 90' lang='eng' dir='ltr'>s.</span> <span class='ocrx_word' id='word_1_218' title='bbox 493 1102 630 1123; x_wconf 87' lang='eng' dir='ltr'><em>mexicanus</em></span> <span class='ocrx_word' id='word_1_219' title='bbox 640 1102 799 1123; x_wconf 88' lang='eng' dir='ltr'>CH-M-1035T</span> <span class='ocrx_word' id='word_1_220' title='bbox 809 1102 960 1129; x_wconf 89' lang='eng' dir='ltr'>(AF441168)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 262 1131 1111 1160; baseline 0 -8"><span class='ocrx_word' id='word_1_221' title='bbox 262 1142 288 1160; x_wconf 77' lang='eng'>53</span> <span class='ocrx_word' id='word_1_222' title='bbox 464 1131 487 1152; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_223' title='bbox 500 1131 809 1158; x_wconf 84' lang='eng' dir='ltr'>thermocarboxydovorans</span> <span class='ocrx_word' id='word_1_224' title='bbox 820 1131 880 1152; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_225' title='bbox 891 1131 982 1152; x_wconf 88' lang='eng' dir='ltr'>44296T</span> <span class='ocrx_word' id='word_1_226' title='bbox 992 1131 1111 1158; x_wconf 87' lang='eng' dir='ltr'>(U94489)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 314 1159 1004 1186; baseline -0.003 -4"><span class='ocrx_word' id='word_1_227' title='bbox 314 1164 340 1182; x_wconf 91' lang='eng'>50</span> <span class='ocrx_word' id='word_1_228' title='bbox 512 1159 535 1181; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_229' title='bbox 547 1160 656 1181; x_wconf 89' lang='eng' dir='ltr'>nodosus</span> <span class='ocrx_word' id='word_1_230' title='bbox 665 1159 742 1181; x_wconf 94' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_231' title='bbox 754 1160 843 1181; x_wconf 83' lang='eng' dir='ltr'>14899T</span> <span class='ocrx_word' id='word_1_232' title='bbox 853 1159 1004 1186; x_wconf 88' lang='eng' dir='ltr'>(AF114036)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 433 1188 911 1216; baseline 0 -6"><span class='ocrx_word' id='word_1_233' title='bbox 433 1188 456 1210; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_234' title='bbox 468 1188 629 1216; x_wconf 81' lang='eng' dir='ltr'>koyangens/s</span> <span class='ocrx_word' id='word_1_235' title='bbox 637 1188 748 1210; x_wconf 90' lang='eng' dir='ltr'>VK—A60T</span> <span class='ocrx_word' id='word_1_236' title='bbox 758 1188 911 1216; x_wconf 87' lang='eng' dir='ltr'>(AY079156)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 341 1217 945 1244; baseline 0 -6"><span class='ocrx_word' id='word_1_237' title='bbox 341 1220 363 1239; x_wconf 85' lang='eng'>81</span> <span class='ocrx_word' id='word_1_238' title='bbox 464 1217 487 1238; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_239' title='bbox 499 1217 647 1238; x_wconf 83' lang='eng' dir='ltr'>intermedius</span> <span class='ocrx_word' id='word_1_240' title='bbox 658 1217 718 1238; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_241' title='bbox 728 1217 820 1238; x_wconf 89' lang='eng' dir='ltr'>40372T</span> <span class='ocrx_word' id='word_1_242' title='bbox 830 1217 945 1244; x_wconf 90' lang='eng' dir='ltr'>(Z76686)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 405 1245 926 1272; baseline 0.002 -6"><span class='ocrx_word' id='word_1_243' title='bbox 405 1245 428 1267; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_244' title='bbox 442 1246 573 1272; x_wconf 83' lang='eng' dir='ltr'>variegatus</span> <span class='ocrx_word' id='word_1_245' title='bbox 583 1245 662 1267; x_wconf 89' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_246' title='bbox 675 1245 763 1267; x_wconf 87' lang='eng' dir='ltr'>15462T</span> <span class='ocrx_word' id='word_1_247' title='bbox 773 1245 926 1272; x_wconf 87' lang='eng' dir='ltr'>(AB184688)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 466 1274 1079 1301; baseline -0.002 -5"><span class='ocrx_word' id='word_1_248' title='bbox 466 1274 488 1296; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_249' title='bbox 501 1275 717 1296; x_wconf 81' lang='eng' dir='ltr'>aureoverticil/atus</span> <span class='ocrx_word' id='word_1_250' title='bbox 727 1275 803 1295; x_wconf 93' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_251' title='bbox 814 1274 916 1296; x_wconf 86' lang='eng' dir='ltr'>B—3326T</span> <span class='ocrx_word' id='word_1_252' title='bbox 927 1274 1079 1301; x_wconf 85' lang='eng' dir='ltr'>(AY999774)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 370 1303 919 1330; baseline 0 -6"><span class='ocrx_word' id='word_1_253' title='bbox 370 1307 396 1325; x_wconf 87' lang='eng'>88</span> <span class='ocrx_word' id='word_1_254' title='bbox 449 1303 478 1324; x_wconf 85' lang='eng' dir='ltr'>‘S.</span> <span class='ocrx_word' id='word_1_255' title='bbox 490 1303 576 1324; x_wconf 89' lang='eng' dir='ltr'>nobi/is’</span> <span class='ocrx_word' id='word_1_256' title='bbox 588 1303 666 1324; x_wconf 85' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_257' title='bbox 679 1303 755 1324; x_wconf 85' lang='eng'>13386</span> <span class='ocrx_word' id='word_1_258' title='bbox 766 1303 919 1330; x_wconf 86' lang='eng' dir='ltr'>(AB184370)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 413 1331 935 1358; baseline -0.002 -5"><span class='ocrx_word' id='word_1_259' title='bbox 413 1331 436 1353; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_260' title='bbox 448 1332 582 1358; x_wconf 86' lang='eng' dir='ltr'>spectabilis</span> <span class='ocrx_word' id='word_1_261' title='bbox 593 1331 671 1353; x_wconf 87' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_262' title='bbox 684 1332 772 1353; x_wconf 87' lang='eng' dir='ltr'>13424T</span> <span class='ocrx_word' id='word_1_263' title='bbox 783 1331 935 1358; x_wconf 87' lang='eng' dir='ltr'>(AB184393)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 341 1360 915 1387; baseline 0 -6"><span class='ocrx_word' id='word_1_264' title='bbox 341 1360 364 1381; x_wconf 86' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_265' title='bbox 376 1360 586 1387; x_wconf 86' lang='eng' dir='ltr'>spinoverrucosus</span> <span class='ocrx_word' id='word_1_266' title='bbox 596 1360 656 1381; x_wconf 90' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_267' title='bbox 667 1360 757 1381; x_wconf 86' lang='eng' dir='ltr'>20321T</span> <span class='ocrx_word' id='word_1_268' title='bbox 767 1360 915 1387; x_wconf 88' lang='eng' dir='ltr'>(AJ781376)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 401 1388 893 1415; baseline -0.002 -5"><span class='ocrx_word' id='word_1_269' title='bbox 401 1388 424 1410; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_270' title='bbox 436 1389 564 1410; x_wconf 88' lang='eng' dir='ltr'>indiaensis</span> <span class='ocrx_word' id='word_1_271' title='bbox 574 1388 633 1410; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_272' title='bbox 646 1388 735 1410; x_wconf 87' lang='eng' dir='ltr'>19961T</span> <span class='ocrx_word' id='word_1_273' title='bbox 746 1388 893 1415; x_wconf 85' lang='eng' dir='ltr'>(AJ781344)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 274 1411 969 1444; baseline 0.003 -8"><span class='ocrx_word' id='word_1_274' title='bbox 274 1417 300 1436; x_wconf 88' lang='eng'>52</span> <span class='ocrx_word' id='word_1_275' title='bbox 340 1411 366 1429; x_wconf 73' lang='eng'>57</span> <span class='ocrx_word' id='word_1_276' title='bbox 448 1417 471 1438; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_277' title='bbox 483 1417 617 1438; x_wconf 86' lang='eng' dir='ltr'><em>f/avoviridis</em></span> <span class='ocrx_word' id='word_1_278' title='bbox 627 1417 705 1438; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_279' title='bbox 718 1417 806 1438; x_wconf 90' lang='eng' dir='ltr'>12772T</span> <span class='ocrx_word' id='word_1_280' title='bbox 817 1417 969 1444; x_wconf 90' lang='eng' dir='ltr'>(AB184842)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 430 1445 945 1472; baseline 0 -5"><span class='ocrx_word' id='word_1_281' title='bbox 430 1445 453 1467; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_282' title='bbox 464 1446 627 1467; x_wconf 85' lang='eng' dir='ltr'>Iomondensis</span> <span class='ocrx_word' id='word_1_283' title='bbox 637 1445 696 1467; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_284' title='bbox 707 1446 786 1467; x_wconf 88' lang='eng'>20088</span> <span class='ocrx_word' id='word_1_285' title='bbox 797 1445 945 1472; x_wconf 87' lang='eng' dir='ltr'>(AJ781352)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 57 1468 1019 1510; baseline 0 -14"><span class='ocrx_word' id='word_1_286' title='bbox 57 1488 83 1507; x_wconf 73' lang='eng'>76</span> <span class='ocrx_word' id='word_1_287' title='bbox 385 1468 430 1510; x_wconf 62' lang='eng'>5153</span> <span class='ocrx_word' id='word_1_288' title='bbox 525 1474 548 1496; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_289' title='bbox 560 1475 667 1496; x_wconf 83' lang='eng' dir='ltr'>Iateritius</span> <span class='ocrx_word' id='word_1_290' title='bbox 677 1474 755 1496; x_wconf 92' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_291' title='bbox 768 1475 856 1496; x_wconf 88' lang='eng' dir='ltr'>12788T</span> <span class='ocrx_word' id='word_1_292' title='bbox 867 1474 1019 1502; x_wconf 84' lang='eng' dir='ltr'>(AY999855)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 488 1503 1005 1530; baseline -0.002 -5"><span class='ocrx_word' id='word_1_293' title='bbox 488 1503 510 1525; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_294' title='bbox 522 1503 676 1530; x_wconf 83' lang='eng' dir='ltr'>griseoﬂavus</span> <span class='ocrx_word' id='word_1_295' title='bbox 686 1503 745 1525; x_wconf 93' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_296' title='bbox 758 1503 847 1525; x_wconf 77' lang='eng' dir='ltr'>19344T</span> <span class='ocrx_word' id='word_1_297' title='bbox 857 1503 1005 1530; x_wconf 89' lang='eng' dir='ltr'>(AJ781322)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 430 1531 946 1559; baseline 0 -6"><span class='ocrx_word' id='word_1_298' title='bbox 430 1531 452 1553; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_299' title='bbox 465 1532 585 1558; x_wconf 80' lang='eng' dir='ltr'><em>almquistii</em></span> <span class='ocrx_word' id='word_1_300' title='bbox 594 1532 670 1553; x_wconf 92' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_301' title='bbox 681 1532 783 1553; x_wconf 89' lang='eng' dir='ltr'>B-1685T</span> <span class='ocrx_word' id='word_1_302' title='bbox 794 1531 946 1559; x_wconf 86' lang='eng' dir='ltr'>(AY999782)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 403 1554 1299 1585; baseline -0.001 -5"><span class='ocrx_word' id='word_1_303' title='bbox 403 1554 430 1572; x_wconf 79' lang='eng'>49</span> <span class='ocrx_word' id='word_1_304' title='bbox 630 1558 653 1580; x_wconf 86' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_305' title='bbox 666 1558 947 1585; x_wconf 83' lang='eng' dir='ltr'>violaceochromogenes</span> <span class='ocrx_word' id='word_1_306' title='bbox 957 1558 1035 1580; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_307' title='bbox 1048 1558 1137 1580; x_wconf 82' lang='eng' dir='ltr'>13100T</span> <span class='ocrx_word' id='word_1_308' title='bbox 1147 1558 1299 1585; x_wconf 84' lang='eng' dir='ltr'>(AY999867)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 348 1584 988 1614; baseline 0 -6"><span class='ocrx_word' id='word_1_309' title='bbox 348 1584 374 1602; x_wconf 89' lang='eng'>77</span> <span class='ocrx_word' id='word_1_310' title='bbox 478 1586 500 1608; x_wconf 94' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_311' title='bbox 512 1587 603 1614; x_wconf 84' lang='eng' dir='ltr'><em>iakyrus</em></span> <span class='ocrx_word' id='word_1_312' title='bbox 613 1586 745 1608; x_wconf 91' lang='eng' dir='ltr'>NRRL-ISP</span> <span class='ocrx_word' id='word_1_313' title='bbox 756 1587 830 1608; x_wconf 89' lang='eng' dir='ltr'>5482T</span> <span class='ocrx_word' id='word_1_314' title='bbox 840 1586 988 1614; x_wconf 88' lang='eng' dir='ltr'>(AJ399489)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 478 1615 1066 1643; baseline 0 -6"><span class='ocrx_word' id='word_1_315' title='bbox 478 1615 500 1637; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_316' title='bbox 512 1616 716 1643; x_wconf 88' lang='eng' dir='ltr'>Iongispororuber</span> <span class='ocrx_word' id='word_1_317' title='bbox 724 1615 802 1637; x_wconf 88' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_318' title='bbox 814 1616 903 1637; x_wconf 85' lang='eng' dir='ltr'>13488T</span> <span class='ocrx_word' id='word_1_319' title='bbox 914 1615 1066 1643; x_wconf 89' lang='eng' dir='ltr'>(AB184440)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_59' title="bbox 471 1644 1032 1671; baseline 0 -6"><span class='ocrx_word' id='word_1_320' title='bbox 471 1644 493 1665; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_321' title='bbox 506 1644 675 1671; x_wconf 85' lang='eng' dir='ltr'>albogriseolus</span> <span class='ocrx_word' id='word_1_322' title='bbox 686 1644 761 1665; x_wconf 89' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_323' title='bbox 773 1644 875 1665; x_wconf 85' lang='eng' dir='ltr'>B-1305T</span> <span class='ocrx_word' id='word_1_324' title='bbox 885 1644 1032 1671; x_wconf 87' lang='eng' dir='ltr'>(AJ494865)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 540 1673 1037 1700; baseline 0 -6"><span class='ocrx_word' id='word_1_325' title='bbox 540 1673 563 1694; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_326' title='bbox 575 1673 724 1694; x_wconf 83' lang='eng' dir='ltr'>armeniacus</span> <span class='ocrx_word' id='word_1_327' title='bbox 732 1673 789 1694; x_wconf 87' lang='eng' dir='ltr'>JCM</span> <span class='ocrx_word' id='word_1_328' title='bbox 801 1673 875 1694; x_wconf 81' lang='eng' dir='ltr'>3070T</span> <span class='ocrx_word' id='word_1_329' title='bbox 885 1673 1037 1700; x_wconf 83' lang='eng' dir='ltr'>(ABO18092)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_61' title="bbox 394 1701 1050 1728; baseline -0.002 -5"><span class='ocrx_word' id='word_1_330' title='bbox 394 1701 417 1723; x_wconf 86' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_331' title='bbox 429 1701 603 1728; x_wconf 83' lang='eng' dir='ltr'>cacaoisubsp.</span> <span class='ocrx_word' id='word_1_332' title='bbox 615 1701 699 1723; x_wconf 84' lang='eng' dir='ltr'>cacaoi</span> <span class='ocrx_word' id='word_1_333' title='bbox 708 1701 786 1723; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_334' title='bbox 799 1701 888 1723; x_wconf 87' lang='eng' dir='ltr'>12748T</span> <span class='ocrx_word' id='word_1_335' title='bbox 898 1701 1050 1728; x_wconf 89' lang='eng' dir='ltr'>(AB184115)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 533 1729 1089 1757; baseline 0 -6"><span class='ocrx_word' id='word_1_336' title='bbox 533 1729 556 1751; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_337' title='bbox 568 1730 726 1751; x_wconf 89' lang='eng' dir='ltr'>nanshensis</span> <span class='ocrx_word' id='word_1_338' title='bbox 736 1729 824 1751; x_wconf 89' lang='eng' dir='ltr'>SCSIO</span> <span class='ocrx_word' id='word_1_339' title='bbox 834 1730 925 1751; x_wconf 74' lang='eng' dir='ltr'>01066T</span> <span class='ocrx_word' id='word_1_340' title='bbox 935 1729 1089 1757; x_wconf 88' lang='eng' dir='ltr'>(EU589334)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_63' title="bbox 449 1758 940 1785; baseline 0.002 -6"><span class='ocrx_word' id='word_1_341' title='bbox 449 1758 471 1780; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_342' title='bbox 484 1759 618 1785; x_wconf 87' lang='eng' dir='ltr'>sodiiphi/us</span> <span class='ocrx_word' id='word_1_343' title='bbox 627 1759 676 1779; x_wconf 94' lang='eng' dir='ltr'>YIM</span> <span class='ocrx_word' id='word_1_344' title='bbox 687 1758 778 1780; x_wconf 73' lang='eng' dir='ltr'>80305T</span> <span class='ocrx_word' id='word_1_345' title='bbox 788 1758 940 1785; x_wconf 86' lang='eng' dir='ltr'>(AY236339)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 335 1787 901 1814; baseline 0 -6"><span class='ocrx_word' id='word_1_346' title='bbox 335 1789 361 1808; x_wconf 86' lang='eng'>99</span> <span class='ocrx_word' id='word_1_347' title='bbox 402 1787 424 1808; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_348' title='bbox 437 1787 548 1808; x_wconf 86' lang='eng' dir='ltr'>ﬂocculus</span> <span class='ocrx_word' id='word_1_349' title='bbox 558 1787 637 1808; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_350' title='bbox 649 1787 738 1808; x_wconf 84' lang='eng' dir='ltr'>13041T</span> <span class='ocrx_word' id='word_1_351' title='bbox 749 1787 901 1814; x_wconf 89' lang='eng' dir='ltr'>(AB184272)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_65' title="bbox 196 1807 955 1843; baseline 0 -6"><span class='ocrx_word' id='word_1_352' title='bbox 196 1807 223 1826; x_wconf 71' lang='eng'>88</span> <span class='ocrx_word' id='word_1_353' title='bbox 394 1816 417 1837; x_wconf 92' lang='eng' dir='ltr'>s.</span> <span class='ocrx_word' id='word_1_354' title='bbox 429 1816 603 1843; x_wconf 83' lang='eng' dir='ltr'>rangoonensis</span> <span class='ocrx_word' id='word_1_355' title='bbox 613 1816 691 1837; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_356' title='bbox 704 1816 792 1837; x_wconf 81' lang='eng' dir='ltr'>13078T</span> <span class='ocrx_word' id='word_1_357' title='bbox 803 1816 955 1843; x_wconf 84' lang='eng' dir='ltr'>(AY999859)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_66' title="bbox 337 1844 895 1872; baseline 0.002 -7"><span class='ocrx_word' id='word_1_358' title='bbox 337 1846 363 1865; x_wconf 89' lang='eng'>65</span> <span class='ocrx_word' id='word_1_359' title='bbox 410 1844 432 1866; x_wconf 91' lang='eng' dir='ltr'>s.</span> <span class='ocrx_word' id='word_1_360' title='bbox 444 1845 543 1871; x_wconf 88' lang='eng' dir='ltr'>gibsonii</span> <span class='ocrx_word' id='word_1_361' title='bbox 552 1844 630 1866; x_wconf 91' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_362' title='bbox 643 1845 731 1866; x_wconf 91' lang='eng' dir='ltr'>15415T</span> <span class='ocrx_word' id='word_1_363' title='bbox 742 1844 895 1872; x_wconf 86' lang='eng' dir='ltr'>(AB184663)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 354 1873 1015 1900; baseline 0 -6"><span class='ocrx_word' id='word_1_364' title='bbox 354 1874 377 1893; x_wconf 92' lang='eng'>71</span> <span class='ocrx_word' id='word_1_365' title='bbox 410 1873 433 1894; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_366' title='bbox 446 1873 513 1894; x_wconf 89' lang='eng' dir='ltr'><em>albus</em></span> <span class='ocrx_word' id='word_1_367' title='bbox 523 1873 605 1900; x_wconf 88' lang='eng' dir='ltr'>subsp.</span> <span class='ocrx_word' id='word_1_368' title='bbox 617 1873 685 1894; x_wconf 89' lang='eng' dir='ltr'><em>albus</em></span> <span class='ocrx_word' id='word_1_369' title='bbox 696 1873 756 1894; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_370' title='bbox 766 1873 857 1894; x_wconf 81' lang='eng' dir='ltr'>40313T</span> <span class='ocrx_word' id='word_1_371' title='bbox 868 1873 1015 1900; x_wconf 86' lang='eng' dir='ltr'>(AJ621602)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_68' title="bbox 302 1902 837 1929; baseline 0 -6"><span class='ocrx_word' id='word_1_372' title='bbox 302 1902 325 1923; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_373' title='bbox 337 1902 481 1923; x_wconf 85' lang='eng' dir='ltr'>ﬂavofuscus</span> <span class='ocrx_word' id='word_1_374' title='bbox 491 1902 567 1923; x_wconf 93' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_375' title='bbox 578 1902 669 1923; x_wconf 88' lang='eng' dir='ltr'>B-8036</span> <span class='ocrx_word' id='word_1_376' title='bbox 680 1902 837 1929; x_wconf 89' lang='eng' dir='ltr'>(DQ026648)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_69' title="bbox 348 1929 772 1956; baseline 0.002 -6"><span class='ocrx_word' id='word_1_377' title='bbox 348 1929 370 1951; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_378' title='bbox 383 1929 483 1951; x_wconf 81' lang='eng' dir='ltr'>ferralitis</span> <span class='ocrx_word' id='word_1_379' title='bbox 492 1929 609 1956; x_wconf 85' lang='eng' dir='ltr'>SFOp68T</span> <span class='ocrx_word' id='word_1_380' title='bbox 620 1929 772 1956; x_wconf 83' lang='eng' dir='ltr'>(AY262826)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_70' title="bbox 463 1957 892 1984; baseline 0 -6"><span class='ocrx_word' id='word_1_381' title='bbox 463 1957 486 1978; x_wconf 90' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_382' title='bbox 498 1957 662 1984; x_wconf 87' lang='eng' dir='ltr'>guanduensis</span> <span class='ocrx_word' id='word_1_383' title='bbox 672 1957 729 1978; x_wconf 89' lang='eng' dir='ltr'>701T</span> <span class='ocrx_word' id='word_1_384' title='bbox 748 1957 892 1984; x_wconf 86' lang='eng' dir='ltr'>AY876942)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 136 1978 958 2093">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 136 1978 958 2093">
+     <span class='ocr_line' id='line_1_71' title="bbox 136 1978 958 2016; baseline 0 -11"><span class='ocrx_word' id='word_1_385' title='bbox 136 1997 161 2016; x_wconf 69' lang='eng'>58</span> <span class='ocrx_word' id='word_1_386' title='bbox 249 1978 275 1997; x_wconf 78' lang='eng'>66</span> <span class='ocrx_word' id='word_1_387' title='bbox 477 1984 499 2005; x_wconf 89' lang='eng' dir='ltr'>s.</span> <span class='ocrx_word' id='word_1_388' title='bbox 510 1984 688 2011; x_wconf 87' lang='eng' dir='ltr'>yeochonensis</span> <span class='ocrx_word' id='word_1_389' title='bbox 697 1984 736 2005; x_wconf 92' lang='eng' dir='ltr'>CN</span> <span class='ocrx_word' id='word_1_390' title='bbox 755 1984 797 2005; x_wconf 86' lang='eng' dir='ltr'>32T</span> <span class='ocrx_word' id='word_1_391' title='bbox 807 1984 958 2011; x_wconf 90' lang='eng' dir='ltr'>(AF101415)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_72' title="bbox 251 2011 762 2044; baseline 0 -12"><span class='ocrx_word' id='word_1_392' title='bbox 251 2026 277 2044; x_wconf 75' lang='eng'>87</span> <span class='ocrx_word' id='word_1_393' title='bbox 372 2011 395 2033; x_wconf 88' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_394' title='bbox 407 2012 501 2033; x_wconf 87' lang='eng' dir='ltr'><em>rubidus</em></span> <span class='ocrx_word' id='word_1_395' title='bbox 513 2011 600 2033; x_wconf 90' lang='eng' dir='ltr'>13c15T</span> <span class='ocrx_word' id='word_1_396' title='bbox 610 2011 762 2038; x_wconf 86' lang='eng' dir='ltr'>(AY876941)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_73' title="bbox 179 2039 881 2065; baseline 0 -5"><span class='ocrx_word' id='word_1_397' title='bbox 179 2041 205 2060; x_wconf 85' lang='eng'>69</span> <span class='ocrx_word' id='word_1_398' title='bbox 438 2039 460 2060; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_399' title='bbox 471 2039 644 2065; x_wconf 87' lang='eng' dir='ltr'>paucisporeus</span> <span class='ocrx_word' id='word_1_400' title='bbox 656 2039 728 2060; x_wconf 88' lang='eng' dir='ltr'>1413T</span> <span class='ocrx_word' id='word_1_401' title='bbox 746 2039 881 2060; x_wconf 82' lang='eng' dir='ltr'>AY876943</span> 
+     </span>
+     <span class='ocr_line' id='line_1_74' title="bbox 452 2066 882 2093; baseline 0 -6"><span class='ocrx_word' id='word_1_402' title='bbox 452 2066 474 2087; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_403' title='bbox 485 2066 645 2093; x_wconf 84' lang='eng' dir='ltr'>yang/inensis</span> <span class='ocrx_word' id='word_1_404' title='bbox 656 2066 728 2087; x_wconf 89' lang='eng' dir='ltr'>1307T</span> <span class='ocrx_word' id='word_1_405' title='bbox 747 2066 882 2087; x_wconf 89' lang='eng' dir='ltr'>AY876940</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 5 1535 7 2100">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 5 1535 7 2100">
+     <span class='ocr_line' id='line_1_75' title="bbox 5 1535 7 2100; baseline 0 156"><span class='ocrx_word' id='word_1_406' title='bbox 5 1535 7 2100; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 5 2090 1259 2197">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 40 2090 1259 2197">
+     <span class='ocr_line' id='line_1_76' title="bbox 762 2090 1259 2118; baseline 0 -6"><span class='ocrx_word' id='word_1_407' title='bbox 762 2090 784 2112; x_wconf 93' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_408' title='bbox 796 2091 960 2118; x_wconf 85' lang='eng' dir='ltr'>scabrisporus</span> <span class='ocrx_word' id='word_1_409' title='bbox 970 2091 1097 2112; x_wconf 81' lang='eng' dir='ltr'>KM—4927T</span> <span class='ocrx_word' id='word_1_410' title='bbox 1107 2090 1259 2118; x_wconf 80' lang='eng' dir='ltr'>(A3030585)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_77' title="bbox 434 2120 956 2147; baseline 0.002 -6"><span class='ocrx_word' id='word_1_411' title='bbox 434 2120 457 2142; x_wconf 89' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_412' title='bbox 470 2121 659 2142; x_wconf 83' lang='eng' dir='ltr'>thermol/neatus</span> <span class='ocrx_word' id='word_1_413' title='bbox 669 2120 729 2142; x_wconf 85' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_414' title='bbox 740 2120 831 2142; x_wconf 86' lang='eng' dir='ltr'>41451T</span> <span class='ocrx_word' id='word_1_415' title='bbox 841 2120 956 2147; x_wconf 73' lang='eng' dir='ltr'>(Z6809?)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_78' title="bbox 40 2149 1158 2181; baseline 0 -10"><span class='ocrx_word' id='word_1_416' title='bbox 40 2162 66 2181; x_wconf 84' lang='eng'>77</span> <span class='ocrx_word' id='word_1_417' title='bbox 667 2149 689 2171; x_wconf 92' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_418' title='bbox 701 2155 860 2177; x_wconf 84' lang='eng' dir='ltr'>megasporus</span> <span class='ocrx_word' id='word_1_419' title='bbox 871 2149 930 2171; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_420' title='bbox 941 2150 1032 2171; x_wconf 89' lang='eng' dir='ltr'>41476T</span> <span class='ocrx_word' id='word_1_421' title='bbox 1042 2149 1158 2177; x_wconf 84' lang='eng' dir='ltr'>(Z68100)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_79' title="bbox 286 2178 311 2197; baseline 0 0"><span class='ocrx_word' id='word_1_422' title='bbox 286 2178 311 2197; x_wconf 87' lang='eng'>99</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 140 2178 996 2255">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 140 2178 996 2255">
+     <span class='ocr_line' id='line_1_80' title="bbox 497 2178 996 2206; baseline 0 -6"><span class='ocrx_word' id='word_1_423' title='bbox 497 2178 520 2200; x_wconf 91' lang='eng' dir='ltr'>S.</span> <span class='ocrx_word' id='word_1_424' title='bbox 532 2184 698 2205; x_wconf 86' lang='eng' dir='ltr'>macrosporus</span> <span class='ocrx_word' id='word_1_425' title='bbox 709 2178 769 2200; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_426' title='bbox 779 2179 871 2200; x_wconf 91' lang='eng' dir='ltr'>41449T</span> <span class='ocrx_word' id='word_1_427' title='bbox 881 2178 996 2206; x_wconf 85' lang='eng'>(268099)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_81' title="bbox 212 2212 257 2230; baseline 0 0"><span class='ocrx_word' id='word_1_428' title='bbox 212 2212 257 2230; x_wconf 91' lang='eng'>0.01</span> 
+     </span>
+     <span class='ocr_line' id='line_1_82' title="bbox 140 2230 333 2255; baseline 0 0"><span class='ocrx_word' id='word_1_429' title='bbox 140 2230 333 2255; x_wconf 87' lang='eng' dir='ltr'>I—l</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003459-0-002.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003459-0-002.pbm.png
new file mode 100644
index 00000000..9dc0417e
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003459-0-002.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003459-0-002.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003459-0-002.pbm.png.hocr
new file mode 100644
index 00000000..57ca6736
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003459-0-002.pbm.png.hocr
@@ -0,0 +1,270 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003459-0-002.pbm.png"; bbox 0 0 1302 1074; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 1 937 3 1057">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 1 937 3 1057">
+     <span class='ocr_line' id='line_1_1' title="bbox 1 937 3 1057; baseline 0 17"><span class='ocrx_word' id='word_1_1' title='bbox 1 937 3 1057; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 123 694 172 709">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 123 694 172 709">
+     <span class='ocr_line' id='line_1_2' title="bbox 123 694 172 709; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 123 694 172 709; x_wconf 84' lang='eng'>0.005</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 282 836 302 851">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 282 836 302 851">
+     <span class='ocr_line' id='line_1_3' title="bbox 282 836 302 851; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 282 836 302 851; x_wconf 84' lang='eng'><em>78</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 544 1 1300 102">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 544 1 1300 102">
+     <span class='ocr_line' id='line_1_4' title="bbox 700 1 1298 27; baseline 0 -5"><span class='ocrx_word' id='word_1_4' title='bbox 700 8 721 23; x_wconf 74' lang='eng'>99</span> <span class='ocrx_word' id='word_1_5' title='bbox 808 2 833 22; x_wconf 57' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 845 2 977 22; x_wconf 82' lang='eng' dir='ltr'><em>Chubuense</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 983 2 1053 22; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 1063 1 1148 22; x_wconf 87' lang='eng' dir='ltr'><em>27278T</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 1157 2 1298 27; x_wconf 86' lang='eng' dir='ltr'><em>(AF480597)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 562 10 1300 87; baseline 0 -28"><span class='ocrx_word' id='word_1_10' title='bbox 562 10 834 87; x_wconf 62' lang='eng'>51|:|:</span> <span class='ocrx_word' id='word_1_11' title='bbox 843 39 869 59; x_wconf 90' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 881 39 1092 65; x_wconf 80' lang='eng' dir='ltr'><em>chlorophenolicum</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1102 38 1183 59; x_wconf 76' lang='eng' dir='ltr'><em>PCP—IT</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 1192 39 1300 65; x_wconf 84' lang='eng' dir='ltr'><em>(X79094)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 544 69 1239 102; baseline 0 -6"><span class='ocrx_word' id='word_1_15' title='bbox 544 69 563 84; x_wconf 67' lang='eng'><em>61</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 775 77 801 96; x_wconf 89' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 811 77 918 102; x_wconf 80' lang='eng' dir='ltr'><em>poriferae</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 925 77 995 96; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1006 76 1090 96; x_wconf 79' lang='eng' dir='ltr'><em>35087T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1099 77 1239 102; x_wconf 86' lang='eng' dir='ltr'><em>(AF480589)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 604 113 1262 311">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 604 113 1262 311">
+     <span class='ocr_line' id='line_1_7' title="bbox 781 113 1262 139; baseline 0 -5"><span class='ocrx_word' id='word_1_21' title='bbox 781 114 807 134; x_wconf 91' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 817 114 1010 139; x_wconf 81' lang='eng' dir='ltr'><em>psychrotolerans</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 1018 114 1070 134; x_wconf 86' lang='eng' dir='ltr'><em>WA1</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 1077 113 1115 134; x_wconf 77' lang='eng' dir='ltr'><em>O1T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1124 114 1262 139; x_wconf 86' lang='eng' dir='ltr'><em>(AJ534886)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 604 151 1120 176; baseline 0 -5"><span class='ocrx_word' id='word_1_26' title='bbox 604 159 647 161; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_27' title='bbox 657 151 682 171; x_wconf 92' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 694 151 812 171; x_wconf 83' lang='eng' dir='ltr'><em>rhodesiae</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 822 151 879 171; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 888 151 973 171; x_wconf 78' lang='eng' dir='ltr'><em>44223T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 983 151 1120 176; x_wconf 83' lang='eng' dir='ltr'><em>(AJ429047)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 680 188 1120 214; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 680 188 705 208; x_wconf 92' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 718 188 831 208; x_wconf 83' lang='eng' dir='ltr'><em>aichiense</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 837 188 908 208; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 918 188 1002 208; x_wconf 78' lang='eng' dir='ltr'><em>27280T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1012 188 1120 214; x_wconf 82' lang='eng' dir='ltr'><em>(X55598)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 641 225 1087 311; baseline 0 -65"><span class='ocrx_word' id='word_1_37' title='bbox 641 233 690 311; x_wconf 35' lang='eng' dir='ltr'><em>L?</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 699 226 724 246; x_wconf 93' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 736 226 836 246; x_wconf 84' lang='eng' dir='ltr'><em>bonickei</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 843 225 938 246; x_wconf 79' lang='eng' dir='ltr'><em>W5998T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 947 226 1087 251; x_wconf 83' lang='eng' dir='ltr'><em>(AYO12573)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 571 59 573 124">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 571 59 573 124">
+     <span class='ocr_line' id='line_1_11' title="bbox 571 59 573 124; baseline 0 950"><span class='ocrx_word' id='word_1_42' title='bbox 571 59 573 124; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 424 89 602 526">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 424 89 602 526">
+     <span class='ocr_line' id='line_1_12' title="bbox 424 89 602 399; baseline 0 0"><span class='ocrx_word' id='word_1_43' title='bbox 424 89 602 399; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 424 399 580 473; baseline 0 0"><span class='ocrx_word' id='word_1_44' title='bbox 424 399 580 473; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 448 473 580 526; baseline 0 548"><span class='ocrx_word' id='word_1_45' title='bbox 448 473 580 526; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 602 159 604 196">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 602 159 604 196">
+     <span class='ocr_line' id='line_1_15' title="bbox 602 159 604 196; baseline 0 878"><span class='ocrx_word' id='word_1_46' title='bbox 602 159 604 196; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 602 196 670 199">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 602 196 670 199">
+     <span class='ocr_line' id='line_1_16' title="bbox 602 196 670 199; baseline 0 875"><span class='ocrx_word' id='word_1_47' title='bbox 602 196 670 199; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 582 261 1296 513">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 582 261 1296 513">
+     <span class='ocr_line' id='line_1_17' title="bbox 646 261 1186 289; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 646 261 667 276; x_wconf 72' lang='eng'><em>76</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 699 264 724 283; x_wconf 56' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 736 264 933 283; x_wconf 85' lang='eng' dir='ltr'><em>neworleansense</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 941 262 1036 283; x_wconf 84' lang='eng' dir='ltr'><em>W6705T</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 1046 264 1186 289; x_wconf 89' lang='eng' dir='ltr'><em>(AYO12575)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 691 300 1149 326; baseline 0 -6"><span class='ocrx_word' id='word_1_53' title='bbox 691 301 716 320; x_wconf 93' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 727 301 839 326; x_wconf 90' lang='eng' dir='ltr'><em>porcinum</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 848 300 891 321; x_wconf 89' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 902 300 1000 321; x_wconf 76' lang='eng' dir='ltr'><em>105392T</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 1009 301 1149 326; x_wconf 81' lang='eng' dir='ltr'><em>(AY457077)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 582 337 1296 385; baseline 0 -27"><span class='ocrx_word' id='word_1_58' title='bbox 582 353 603 367; x_wconf 71' lang='eng'><em>77</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 722 346 802 385; x_wconf 66' lang='eng' dir='ltr'><em>L—</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 812 338 838 358; x_wconf 93' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 848 338 986 363; x_wconf 82' lang='eng' dir='ltr'><em>peregrinum</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 995 338 1038 358; x_wconf 95' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 1049 337 1146 358; x_wconf 80' lang='eng' dir='ltr'><em>105382T</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1156 338 1296 363; x_wconf 85' lang='eng' dir='ltr'><em>(AY457069)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 693 374 1221 400; baseline 0 -5"><span class='ocrx_word' id='word_1_65' title='bbox 693 374 715 389; x_wconf 81' lang='eng'>95</span> <span class='ocrx_word' id='word_1_66' title='bbox 741 375 766 395; x_wconf 94' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 778 375 885 400; x_wconf 81' lang='eng' dir='ltr'><em>septicum</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 892 375 962 395; x_wconf 89' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 973 374 1072 395; x_wconf 83' lang='eng' dir='ltr'><em>700731T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1081 375 1221 400; x_wconf 86' lang='eng' dir='ltr'><em>(AY457070)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 610 412 1190 438; baseline 0.002 -6"><span class='ocrx_word' id='word_1_71' title='bbox 610 420 644 422; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_72' title='bbox 654 413 679 432; x_wconf 94' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 691 413 880 438; x_wconf 78' lang='eng' dir='ltr'><em>conceptionense</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 890 412 933 433; x_wconf 85' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 944 412 1041 433; x_wconf 73' lang='eng' dir='ltr'><em>108544T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1051 413 1190 438; x_wconf 86' lang='eng' dir='ltr'><em>(AY859684)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 666 449 1118 475; baseline 0 -5"><span class='ocrx_word' id='word_1_77' title='bbox 666 450 691 470; x_wconf 93' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 703 450 808 470; x_wconf 83' lang='eng' dir='ltr'><em>fortuitum</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 817 450 860 470; x_wconf 90' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 871 449 968 470; x_wconf 83' lang='eng' dir='ltr'><em>104534T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 978 450 1118 475; x_wconf 86' lang='eng' dir='ltr'><em>(AY457066)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 585 486 1102 513; baseline 0 -6"><span class='ocrx_word' id='word_1_82' title='bbox 585 487 610 507; x_wconf 93' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 622 487 777 513; x_wconf 82' lang='eng' dir='ltr'><em>farcinogenes</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 787 487 859 507; x_wconf 92' lang='eng' dir='ltr'><em>NCTC</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 871 486 953 507; x_wconf 76' lang='eng' dir='ltr'><em>10955T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 962 487 1102 512; x_wconf 89' lang='eng' dir='ltr'><em>(AY457084)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 641 283 643 367">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 641 283 643 367">
+     <span class='ocr_line' id='line_1_24' title="bbox 641 283 643 367; baseline 0 707"><span class='ocrx_word' id='word_1_87' title='bbox 641 283 643 367; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 560 372 610 374">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 560 372 610 374">
+     <span class='ocr_line' id='line_1_25' title="bbox 560 372 610 374; baseline 0 700"><span class='ocrx_word' id='word_1_88' title='bbox 560 372 610 374; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 608 325 610 422">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 608 325 610 422">
+     <span class='ocr_line' id='line_1_26' title="bbox 608 325 610 422; baseline 0 652"><span class='ocrx_word' id='word_1_89' title='bbox 608 325 610 422; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 560 372 562 460">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 560 372 562 460">
+     <span class='ocr_line' id='line_1_27' title="bbox 560 372 562 460; baseline 0 614"><span class='ocrx_word' id='word_1_90' title='bbox 560 372 562 460; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 562 458 656 460">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 562 458 656 460">
+     <span class='ocr_line' id='line_1_28' title="bbox 562 458 656 460; baseline 0 614"><span class='ocrx_word' id='word_1_91' title='bbox 562 458 656 460; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 384 540 428 542">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 384 540 428 542">
+     <span class='ocr_line' id='line_1_29' title="bbox 384 540 428 542; baseline 0 532"><span class='ocrx_word' id='word_1_92' title='bbox 384 540 428 542; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 369 649 386 651">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 369 649 386 651">
+     <span class='ocr_line' id='line_1_30' title="bbox 369 649 386 651; baseline 0 423"><span class='ocrx_word' id='word_1_93' title='bbox 369 649 386 651; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 384 540 386 756">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 384 540 386 756">
+     <span class='ocr_line' id='line_1_31' title="bbox 384 540 386 756; baseline 0 318"><span class='ocrx_word' id='word_1_94' title='bbox 384 540 386 756; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 308 749 370 751">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 308 749 370 751">
+     <span class='ocr_line' id='line_1_32' title="bbox 308 749 370 751; baseline 0 323"><span class='ocrx_word' id='word_1_95' title='bbox 308 749 370 751; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 369 649 370 852">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 369 649 370 852">
+     <span class='ocr_line' id='line_1_33' title="bbox 369 649 370 852; baseline 0 222"><span class='ocrx_word' id='word_1_96' title='bbox 369 649 370 852; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 585 524 1086 623">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 585 524 1086 623">
+     <span class='ocr_line' id='line_1_34' title="bbox 585 524 1022 550; baseline 0 -5"><span class='ocrx_word' id='word_1_97' title='bbox 585 525 610 544; x_wconf 94' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 622 525 777 545; x_wconf 83' lang='eng' dir='ltr'><em>houstonense</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 787 524 873 545; x_wconf 73' lang='eng' dir='ltr'><em>Ho1asT</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 882 525 1022 550; x_wconf 89' lang='eng' dir='ltr'><em>(AYO12579)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 585 561 1086 588; baseline 0 -6"><span class='ocrx_word' id='word_1_101' title='bbox 585 562 610 582; x_wconf 96' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 622 562 775 588; x_wconf 83' lang='eng' dir='ltr'><em>senegalense</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 785 562 827 582; x_wconf 88' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 839 561 936 582; x_wconf 73' lang='eng' dir='ltr'><em>104941T</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 945 562 1086 587; x_wconf 86' lang='eng' dir='ltr'><em>(AY457081)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 655 597 1010 623; baseline 0 -5"><span class='ocrx_word' id='word_1_106' title='bbox 655 598 729 618; x_wconf 89' lang='eng' dir='ltr'>Strain</span> <span class='ocrx_word' id='word_1_107' title='bbox 740 597 856 618; x_wconf 80' lang='eng' dir='ltr'><em>FI-06250T</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 865 598 1010 623; x_wconf 86' lang='eng' dir='ltr'><em>(EU605695)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 448 526 640 613">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 448 526 640 613">
+     <span class='ocr_line' id='line_1_37' title="bbox 448 526 580 563; baseline 0 511"><span class='ocrx_word' id='word_1_109' title='bbox 448 526 580 563; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 448 563 640 613; baseline 0 0"><span class='ocrx_word' id='word_1_110' title='bbox 448 563 640 613; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 426 408 428 672">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 426 408 428 672">
+     <span class='ocr_line' id='line_1_39' title="bbox 426 408 428 672; baseline 0 402"><span class='ocrx_word' id='word_1_111' title='bbox 426 408 428 672; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 387 636 1290 759">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 588 636 1290 737">
+     <span class='ocr_line' id='line_1_40' title="bbox 853 636 1290 662; baseline -0.002 -5"><span class='ocrx_word' id='word_1_112' title='bbox 853 637 878 656; x_wconf 94' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 890 637 1037 657; x_wconf 83' lang='eng' dir='ltr'><em>bn&#39;sbanense</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1045 636 1140 657; x_wconf 81' lang='eng' dir='ltr'><em>W6743T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1150 637 1290 662; x_wconf 88' lang='eng' dir='ltr'><em>(AYO12577)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 638 673 1164 699; baseline 0 -5"><span class='ocrx_word' id='word_1_116' title='bbox 638 674 664 694; x_wconf 83' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 675 674 843 699; x_wconf 87' lang='eng' dir='ltr'><em>mucogenicum</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 849 674 920 694; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 930 673 1014 694; x_wconf 83' lang='eng' dir='ltr'><em>49650T</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 1024 674 1164 699; x_wconf 89' lang='eng' dir='ltr'><em>(AY457074)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 588 710 1116 737; baseline 0.008 -10"><span class='ocrx_word' id='word_1_121' title='bbox 588 713 619 728; x_wconf 83' lang='eng'>100</span> <span class='ocrx_word' id='word_1_122' title='bbox 638 712 664 731; x_wconf 92' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 674 712 805 737; x_wconf 82' lang='eng' dir='ltr'><em>phocaicum</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 815 711 857 731; x_wconf 87' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 869 710 966 731; x_wconf 82' lang='eng' dir='ltr'><em>108542T</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 975 712 1116 737; x_wconf 84' lang='eng' dir='ltr'><em>(AY859682)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 689 748 1131 774">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 689 748 1131 774">
+     <span class='ocr_line' id='line_1_43' title="bbox 689 748 1131 774; baseline 0 -5"><span class='ocrx_word' id='word_1_127' title='bbox 689 749 715 769; x_wconf 91' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 726 749 814 774; x_wconf 82' lang='eng' dir='ltr'><em>gadium</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 824 749 866 769; x_wconf 88' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 878 748 975 769; x_wconf 74' lang='eng' dir='ltr'><em>105388T</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 984 749 1131 774; x_wconf 85' lang='eng' dir='ltr'><em>(DQ473310)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 420 785 1155 849">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 420 785 1155 849">
+     <span class='ocr_line' id='line_1_44' title="bbox 420 785 1155 833; baseline 0 -27"><span class='ocrx_word' id='word_1_132' title='bbox 420 793 671 833; x_wconf 67' lang='eng'><em>_71|:</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 681 786 707 806; x_wconf 89' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 719 786 844 806; x_wconf 87' lang='eng' dir='ltr'><em>barrassiae</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 854 786 897 806; x_wconf 93' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 908 785 1005 806; x_wconf 76' lang='eng' dir='ltr'><em>108545T</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 1015 786 1155 811; x_wconf 86' lang='eng' dir='ltr'><em>(AY859685)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 666 823 1110 849; baseline 0 -6"><span class='ocrx_word' id='word_1_138' title='bbox 666 823 691 843; x_wconf 93' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 703 823 851 849; x_wconf 87' lang='eng' dir='ltr'><em>goodiiATCC</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 862 823 961 843; x_wconf 74' lang='eng' dir='ltr'><em>700504T</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 970 823 1110 849; x_wconf 88' lang='eng' dir='ltr'><em>(AY457079)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 369 850 420 852">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 369 850 420 852">
+     <span class='ocr_line' id='line_1_46' title="bbox 369 850 420 852; baseline 0 222"><span class='ocrx_word' id='word_1_142' title='bbox 369 850 420 852; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 196 856 310 858">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 196 856 310 858">
+     <span class='ocr_line' id='line_1_47' title="bbox 196 856 310 858; baseline 0 216"><span class='ocrx_word' id='word_1_143' title='bbox 196 856 310 858; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 196 856 198 1020">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 196 856 198 1020">
+     <span class='ocr_line' id='line_1_48' title="bbox 196 856 198 1020; baseline 0 54"><span class='ocrx_word' id='word_1_144' title='bbox 196 856 198 1020; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 308 749 310 964">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 308 749 310 964">
+     <span class='ocr_line' id='line_1_49' title="bbox 308 749 310 964; baseline 0 110"><span class='ocrx_word' id='word_1_145' title='bbox 308 749 310 964; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 418 813 420 889">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 418 813 420 889">
+     <span class='ocr_line' id='line_1_50' title="bbox 418 813 420 889; baseline 0 185"><span class='ocrx_word' id='word_1_146' title='bbox 418 813 420 889; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 420 860 1079 924">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 420 860 1079 924">
+     <span class='ocr_line' id='line_1_51' title="bbox 420 860 1079 908; baseline 0 -28"><span class='ocrx_word' id='word_1_147' title='bbox 420 868 573 908; x_wconf 57' lang='eng' dir='ltr'><em>_i——</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 583 861 609 880; x_wconf 92' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 621 861 769 886; x_wconf 81' lang='eng' dir='ltr'><em>mageritense</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 778 861 821 880; x_wconf 93' lang='eng' dir='ltr'><em>CIP</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 832 860 930 880; x_wconf 75' lang='eng' dir='ltr'><em>104973T</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 939 861 1079 886; x_wconf 89' lang='eng' dir='ltr'><em>(AY457076)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 439 897 1027 924; baseline 0 -6"><span class='ocrx_word' id='word_1_153' title='bbox 439 902 460 917; x_wconf 77' lang='eng'><em>68</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 546 898 572 918; x_wconf 94' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 584 898 768 924; x_wconf 83' lang='eng' dir='ltr'><em>wolinskyiATCC</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 778 897 877 918; x_wconf 88' lang='eng' dir='ltr'><em>700010T</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 887 898 1027 923; x_wconf 84' lang='eng' dir='ltr'><em>(AY457083)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 481 935 1189 998">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 481 935 1189 998">
+     <span class='ocr_line' id='line_1_53' title="bbox 481 935 901 960; baseline 0.002 -5"><span class='ocrx_word' id='word_1_158' title='bbox 481 936 506 955; x_wconf 93' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 518 935 581 956; x_wconf 87' lang='eng' dir='ltr'><em>faIIaX</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 586 935 657 956; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 667 935 751 956; x_wconf 71' lang='eng' dir='ltr'><em>35219T</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 761 936 901 960; x_wconf 84' lang='eng' dir='ltr'>(AF480600)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 739 972 1189 998; baseline 0.002 -6"><span class='ocrx_word' id='word_1_163' title='bbox 739 973 765 992; x_wconf 92' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 776 973 867 993; x_wconf 88' lang='eng' dir='ltr'><em>brumae</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 873 972 944 993; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 955 972 1039 993; x_wconf 84' lang='eng' dir='ltr'><em>51384T</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 1048 973 1189 998; x_wconf 84' lang='eng' dir='ltr'><em>(AF480576)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 196 1018 758 1020">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 196 1018 758 1020">
+     <span class='ocr_line' id='line_1_55' title="bbox 196 1018 758 1020; baseline 0 54"><span class='ocrx_word' id='word_1_168' title='bbox 196 1018 758 1020; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 417 1009 1171 1072">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 417 1009 1171 1072">
+     <span class='ocr_line' id='line_1_56' title="bbox 767 1009 1171 1035; baseline 0 -5"><span class='ocrx_word' id='word_1_169' title='bbox 767 1010 792 1030; x_wconf 96' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 805 1010 882 1030; x_wconf 83' lang='eng' dir='ltr'><em>trivia/e</em></span> <span class='ocrx_word' id='word_1_171' title='bbox 888 1010 958 1030; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 968 1009 1053 1030; x_wconf 80' lang='eng' dir='ltr'><em>23292T</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 1062 1010 1171 1035; x_wconf 83' lang='eng' dir='ltr'><em>(X88924)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 417 1047 842 1072; baseline 0 -5"><span class='ocrx_word' id='word_1_174' title='bbox 417 1048 442 1067; x_wconf 96' lang='eng' dir='ltr'><em>M.</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 455 1048 598 1067; x_wconf 79' lang='eng' dir='ltr'><em>tuberculosis</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 608 1048 690 1067; x_wconf 84' lang='eng' dir='ltr'><em>H37Ra</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 700 1047 842 1072; x_wconf 80' lang='eng' dir='ltr'><em>(CPOOOG11)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003509-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003509-0-001.pbm.png
new file mode 100644
index 00000000..56889bc2
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003509-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003509-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003509-0-001.pbm.png.hocr
new file mode 100644
index 00000000..17ae9a96
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003509-0-001.pbm.png.hocr
@@ -0,0 +1,408 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003509-0-001.pbm.png"; bbox 0 0 1775 1016; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 7 62 103 64">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 7 62 103 64">
+     <span class='ocr_line' id='line_1_1' title="bbox 7 62 103 64; baseline 0 952"><span class='ocrx_word' id='word_1_1' title='bbox 7 62 103 64; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 686 8 1640 163">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 769 8 1640 113">
+     <span class='ocr_line' id='line_1_2' title="bbox 769 8 1640 39; baseline 0 -6"><span class='ocrx_word' id='word_1_2' title='bbox 769 13 797 34; x_wconf 86' lang='eng'><em>96</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 807 23 861 25; x_wconf 30' lang='eng'>*</span> <span class='ocrx_word' id='word_1_4' title='bbox 872 10 1123 33; x_wconf 84' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 1130 10 1273 39; x_wconf 87' lang='eng' dir='ltr'><em>beijerinckii</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1281 10 1363 33; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1376 8 1469 33; x_wconf 88' lang='eng' dir='ltr'><em>19372T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 1480 10 1640 39; x_wconf 85' lang='eng' dir='ltr'><em>(AB021386)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 817 46 1425 77; baseline 0 -6"><span class='ocrx_word' id='word_1_9' title='bbox 817 48 1202 77; x_wconf 85' lang='eng' dir='ltr'><em>Chromohalobacterjaponicus</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 1211 46 1257 71; x_wconf 90' lang='eng' dir='ltr'><em>43T</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1265 48 1425 77; x_wconf 90' lang='eng' dir='ltr'><em>(AB105159)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 838 77 1616 113; baseline 0 -6"><span class='ocrx_word' id='word_1_12' title='bbox 838 77 866 97; x_wconf 74' lang='eng'>52</span> <span class='ocrx_word' id='word_1_13' title='bbox 886 92 955 94; x_wconf 61' lang='eng'><strong>‘</strong></span> <span class='ocrx_word' id='word_1_14' title='bbox 967 84 1218 107; x_wconf 85' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1225 85 1370 107; x_wconf 85' lang='eng' dir='ltr'><em>sarecensis</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 1381 82 1445 107; x_wconf 95' lang='eng' dir='ltr'><em>LV4T</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1456 84 1616 113; x_wconf 83' lang='eng' dir='ltr'><em>(AY373448)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 767 39 807 41">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 767 39 807 41">
+     <span class='ocr_line' id='line_1_5' title="bbox 767 39 807 41; baseline 0 975"><span class='ocrx_word' id='word_1_18' title='bbox 767 39 807 41; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 805 23 807 59">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 805 23 807 59">
+     <span class='ocr_line' id='line_1_6' title="bbox 805 23 807 59; baseline 0 957"><span class='ocrx_word' id='word_1_19' title='bbox 805 23 807 59; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 24 32 77 55">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 24 32 77 55">
+     <span class='ocr_line' id='line_1_7' title="bbox 24 32 77 55; baseline -0.019 0"><span class='ocrx_word' id='word_1_20' title='bbox 24 32 77 55; x_wconf 91' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 767 39 770 110">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 767 39 770 110">
+     <span class='ocr_line' id='line_1_8' title="bbox 767 39 770 110; baseline 0 906"><span class='ocrx_word' id='word_1_21' title='bbox 767 39 770 110; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 767 108 886 110">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 767 108 886 110">
+     <span class='ocr_line' id='line_1_9' title="bbox 767 108 886 110; baseline 0 906"><span class='ocrx_word' id='word_1_22' title='bbox 767 108 886 110; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 884 92 886 128">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 884 92 886 128">
+     <span class='ocr_line' id='line_1_10' title="bbox 884 92 886 128; baseline 0 888"><span class='ocrx_word' id='word_1_23' title='bbox 884 92 886 128; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 356 116 1772 876">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 356 116 1772 876">
+     <span class='ocr_line' id='line_1_11' title="bbox 1019 116 1772 148; baseline -0.001 -6"><span class='ocrx_word' id='word_1_24' title='bbox 1019 119 1269 142; x_wconf 85' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1276 119 1480 148; x_wconf 89' lang='eng' dir='ltr'><em>nigrandesensis</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1490 116 1607 142; x_wconf 88' lang='eng' dir='ltr'><em>LTS-4NT</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 1617 119 1772 148; x_wconf 89' lang='eng' dir='ltr'><em>(AJ277205)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 780 151 1553 183; baseline 0 -7"><span class='ocrx_word' id='word_1_28' title='bbox 780 153 1030 176; x_wconf 79' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1038 154 1190 176; x_wconf 87' lang='eng' dir='ltr'><em>canadensis</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1198 153 1281 176; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1291 151 1388 176; x_wconf 78' lang='eng' dir='ltr'><em>43984T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1398 153 1553 183; x_wconf 86' lang='eng' dir='ltr'><em>(AJ295143)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 686 186 1531 217; baseline 0 -6"><span class='ocrx_word' id='word_1_33' title='bbox 686 196 775 198; x_wconf 79' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_34' title='bbox 784 188 1035 211; x_wconf 88' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1042 189 1202 211; x_wconf 82' lang='eng' dir='ltr'><em>marismortui</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1209 188 1292 211; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1305 186 1398 211; x_wconf 90' lang='eng' dir='ltr'><em>17056T</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1409 188 1531 217; x_wconf 88' lang='eng' dir='ltr'><em>(X87219)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 738 219 1525 267; baseline 0 -22"><span class='ocrx_word' id='word_1_39' title='bbox 738 230 750 267; x_wconf 60' lang='eng'>[</span> <span class='ocrx_word' id='word_1_40' title='bbox 761 222 1012 245; x_wconf 86' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 1019 222 1162 245; x_wconf 86' lang='eng' dir='ltr'><em>israelensis</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1171 222 1253 245; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1263 219 1360 245; x_wconf 81' lang='eng' dir='ltr'><em>43985T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1371 222 1525 251; x_wconf 91' lang='eng' dir='ltr'><em>(AJ295144)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 758 256 1489 288; baseline 0 -6"><span class='ocrx_word' id='word_1_45' title='bbox 758 259 1009 282; x_wconf 86' lang='eng' dir='ltr'><em>Chromohalobacter</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1016 259 1159 288; x_wconf 87' lang='eng' dir='ltr'><em>salexigens</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1170 259 1233 282; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 1245 256 1324 282; x_wconf 91' lang='eng' dir='ltr'><em>3043T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1335 259 1489 288; x_wconf 89' lang='eng' dir='ltr'><em>(AJ295146)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 853 292 1507 323; baseline 0 -6"><span class='ocrx_word' id='word_1_50' title='bbox 853 301 874 302; x_wconf 44' lang='eng'><em>*</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 884 294 1037 317; x_wconf 88' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 1047 294 1176 317; x_wconf 87' lang='eng' dir='ltr'><em>euriha/ina</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1186 294 1268 317; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 1278 292 1375 317; x_wconf 88' lang='eng' dir='ltr'><em>49336T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 1385 294 1507 323; x_wconf 89' lang='eng' dir='ltr'><em>(X87218)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 853 325 1517 357; baseline 0 -7"><span class='ocrx_word' id='word_1_56' title='bbox 853 328 1062 350; x_wconf 22' lang='eng' dir='ltr'><em>*Halomonas</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 1071 328 1185 356; x_wconf 75' lang='eng' dir='ltr'><em>elongate</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1195 327 1277 350; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 1288 325 1384 350; x_wconf 81' lang='eng' dir='ltr'><em>33173T</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 1395 327 1517 357; x_wconf 89' lang='eng' dir='ltr'><em>(X67023)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 702 357 1435 388; baseline 0 -6"><span class='ocrx_word' id='word_1_61' title='bbox 702 370 839 371; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_62' title='bbox 848 359 1001 382; x_wconf 88' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 1010 359 1130 388; x_wconf 84' lang='eng' dir='ltr'><em>ha/ophila</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1142 359 1206 382; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 1217 357 1297 382; x_wconf 91' lang='eng' dir='ltr'><em>4770T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 1307 359 1435 388; x_wconf 90' lang='eng' dir='ltr'><em>(M93353)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 628 394 1188 425; baseline 0 -6"><span class='ocrx_word' id='word_1_67' title='bbox 628 396 782 419; x_wconf 88' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 789 396 892 425; x_wconf 84' lang='eng' dir='ltr'><em>paciﬁca</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 904 396 967 419; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 978 394 1059 419; x_wconf 91' lang='eng' dir='ltr'><em>4742T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 1069 396 1188 425; x_wconf 85' lang='eng' dir='ltr'><em>(L42616)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 471 430 1071 462; baseline 0.002 -7"><span class='ocrx_word' id='word_1_72' title='bbox 471 439 527 441; x_wconf 89' lang='eng'>—</span> <span class='ocrx_word' id='word_1_73' title='bbox 534 433 687 456; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 697 434 818 456; x_wconf 86' lang='eng' dir='ltr'><em>ventosae</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 827 430 900 455; x_wconf 87' lang='eng' dir='ltr'><em>A|12T</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 911 433 1071 462; x_wconf 87' lang='eng' dir='ltr'><em>(AY268080)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 496 458 1458 497; baseline 0 -7"><span class='ocrx_word' id='word_1_77' title='bbox 496 458 524 479; x_wconf 74' lang='eng'><em>98</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 542 473 743 475; x_wconf 34' lang='eng'><strong>¥</strong></span> <span class='ocrx_word' id='word_1_79' title='bbox 749 468 902 491; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 912 468 1131 491; x_wconf 84' lang='eng' dir='ltr'><em>halodenitriﬁcans</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 1139 468 1221 491; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 1234 465 1329 491; x_wconf 84' lang='eng' dir='ltr'><em>13511T</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 1339 468 1458 497; x_wconf 91' lang='eng' dir='ltr'><em>(L04942)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 419 492 1162 529; baseline 0 -7"><span class='ocrx_word' id='word_1_84' title='bbox 419 492 447 512; x_wconf 84' lang='eng'>55</span> <span class='ocrx_word' id='word_1_85' title='bbox 542 500 714 523; x_wconf 84' lang='eng' dir='ltr'><em>-Halomonas</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 723 500 871 523; x_wconf 85' lang='eng' dir='ltr'><em>alimentaria</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 881 497 993 523; x_wconf 79' lang='eng' dir='ltr'><em>YKJ-16T</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 1004 500 1162 529; x_wconf 88' lang='eng' dir='ltr'><em>(AF211860)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 471 535 1203 566; baseline 0 -7"><span class='ocrx_word' id='word_1_89' title='bbox 471 543 649 544; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_90' title='bbox 658 537 811 560; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 821 537 908 565; x_wconf 89' lang='eng' dir='ltr'><em>cupida</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 919 537 983 560; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 994 535 1074 560; x_wconf 92' lang='eng' dir='ltr'><em>4740T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1085 537 1203 566; x_wconf 86' lang='eng' dir='ltr'><em>(L42615)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 623 567 1187 598; baseline 0 -6"><span class='ocrx_word' id='word_1_95' title='bbox 623 569 777 592; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 786 569 920 598; x_wconf 86' lang='eng' dir='ltr'><em>kenyensis</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 929 567 1020 592; x_wconf 91' lang='eng' dir='ltr'><em>AIR-2T</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1028 569 1187 598; x_wconf 87' lang='eng' dir='ltr'><em>(AY962237)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 619 603 1307 634; baseline 0 -6"><span class='ocrx_word' id='word_1_99' title='bbox 619 605 773 628; x_wconf 85' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 783 605 924 633; x_wconf 86' lang='eng' dir='ltr'><em>campisa/is</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 932 605 1014 628; x_wconf 93' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 1025 603 1138 628; x_wconf 90' lang='eng' dir='ltr'><em>700597T</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 1149 605 1307 634; x_wconf 86' lang='eng' dir='ltr'><em>(AF054286)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 440 637 1166 668; baseline 0 -6"><span class='ocrx_word' id='word_1_104' title='bbox 440 647 563 649; x_wconf 89' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_105' title='bbox 571 640 724 662; x_wconf 85' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 734 640 919 668; x_wconf 86' lang='eng' dir='ltr'><em>campaniensis</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 929 637 1001 662; x_wconf 84' lang='eng' dir='ltr'><em>SAGT</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1012 639 1166 668; x_wconf 89' lang='eng' dir='ltr'><em>(AJ515365)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 479 667 1298 701; baseline 0 -6"><span class='ocrx_word' id='word_1_109' title='bbox 479 667 507 688; x_wconf 89' lang='eng'>57</span> <span class='ocrx_word' id='word_1_110' title='bbox 525 681 679 683; x_wconf 79' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_111' title='bbox 692 673 845 695; x_wconf 86' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 854 673 952 695; x_wconf 87' lang='eng' dir='ltr'><em>muralis</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 963 672 1026 695; x_wconf 93' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1037 670 1133 695; x_wconf 85' lang='eng' dir='ltr'><em>20969T</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1143 672 1298 701; x_wconf 89' lang='eng' dir='ltr'><em>(AJ320530)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 431 708 1028 740; baseline 0.002 -7"><span class='ocrx_word' id='word_1_116' title='bbox 431 708 459 728; x_wconf 87' lang='eng'>95</span> <span class='ocrx_word' id='word_1_117' title='bbox 525 716 780 718; x_wconf 86' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_118' title='bbox 787 709 857 734; x_wconf 89' lang='eng' dir='ltr'><em>SP8T</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 867 711 1028 740; x_wconf 87' lang='eng' dir='ltr'><em>(EU218533)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 480 742 1209 773; baseline 0.001 -7"><span class='ocrx_word' id='word_1_120' title='bbox 480 750 627 753; x_wconf 69' lang='eng'><em>——</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 637 744 791 767; x_wconf 85' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 799 744 994 772; x_wconf 84' lang='eng' dir='ltr'><em>pantelleriensis</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 1002 742 1076 766; x_wconf 95' lang='eng' dir='ltr'><em>AAPT</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 1087 744 1209 773; x_wconf 90' lang='eng' dir='ltr'><em>(X93493)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 438 771 1409 806; baseline 0 -6"><span class='ocrx_word' id='word_1_125' title='bbox 438 771 466 792; x_wconf 75' lang='eng'><em>87</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 488 777 974 800; x_wconf 57' lang='eng' dir='ltr'><em>—Halomonas</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 983 777 1120 800; x_wconf 88' lang='eng' dir='ltr'><em>kribbensis</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 1130 774 1234 800; x_wconf 89' lang='eng' dir='ltr'><em>BH843T</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 1244 777 1409 806; x_wconf 87' lang='eng' dir='ltr'><em>(DQ280368)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 356 809 1326 840; baseline 0 -6"><span class='ocrx_word' id='word_1_130' title='bbox 356 809 384 830; x_wconf 85' lang='eng'><em>93</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 488 820 724 822; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_132' title='bbox 731 812 884 834; x_wconf 85' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 894 812 1062 834; x_wconf 84' lang='eng' dir='ltr'><em>anticariensis</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 1073 809 1156 834; x_wconf 89' lang='eng' dir='ltr'><em>FP35T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 1166 811 1326 840; x_wconf 87' lang='eng' dir='ltr'><em>(AY489405)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 572 844 1086 876; baseline 0 -7"><span class='ocrx_word' id='word_1_136' title='bbox 572 847 725 869; x_wconf 89' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 735 847 875 870; x_wconf 84' lang='eng' dir='ltr'><em>desiderata</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 887 844 953 869; x_wconf 91' lang='eng' dir='ltr'><em>FB2T</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 963 847 1086 876; x_wconf 90' lang='eng' dir='ltr'><em>(X92417)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 684 143 686 197">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 684 143 686 197">
+     <span class='ocr_line' id='line_1_33' title="bbox 684 143 686 197; baseline 0 819"><span class='ocrx_word' id='word_1_140' title='bbox 684 143 686 197; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 602 178 686 180">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 602 178 686 180">
+     <span class='ocr_line' id='line_1_34' title="bbox 602 178 686 180; baseline 0 836"><span class='ocrx_word' id='word_1_141' title='bbox 602 178 686 180; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 373 212 604 215">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 373 212 604 215">
+     <span class='ocr_line' id='line_1_35' title="bbox 373 212 604 215; baseline 0 801"><span class='ocrx_word' id='word_1_142' title='bbox 373 212 604 215; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 602 178 604 249">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 602 178 604 249">
+     <span class='ocr_line' id='line_1_36' title="bbox 602 178 604 249; baseline 0 767"><span class='ocrx_word' id='word_1_143' title='bbox 602 178 604 249; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 346 282 375 284">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 346 282 375 284">
+     <span class='ocr_line' id='line_1_37' title="bbox 346 282 375 284; baseline 0 732"><span class='ocrx_word' id='word_1_144' title='bbox 346 282 375 284; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 701 316 853 319">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 701 316 853 319">
+     <span class='ocr_line' id='line_1_38' title="bbox 701 316 853 319; baseline 0 697"><span class='ocrx_word' id='word_1_145' title='bbox 701 316 853 319; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 852 301 853 336">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 852 301 853 336">
+     <span class='ocr_line' id='line_1_39' title="bbox 852 301 853 336; baseline 0 680"><span class='ocrx_word' id='word_1_146' title='bbox 852 301 853 336; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 700 316 702 371">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 700 316 702 371">
+     <span class='ocr_line' id='line_1_40' title="bbox 700 316 702 371; baseline 0 645"><span class='ocrx_word' id='word_1_147' title='bbox 700 316 702 371; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 537 351 702 353">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 537 351 702 353">
+     <span class='ocr_line' id='line_1_41' title="bbox 537 351 702 353; baseline 0 663"><span class='ocrx_word' id='word_1_148' title='bbox 537 351 702 353; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 470 386 539 387">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 470 386 539 387">
+     <span class='ocr_line' id='line_1_42' title="bbox 470 386 539 387; baseline 0 629"><span class='ocrx_word' id='word_1_149' title='bbox 470 386 539 387; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 539 404 622 406">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 539 404 622 406">
+     <span class='ocr_line' id='line_1_43' title="bbox 539 404 622 406; baseline 0 610"><span class='ocrx_word' id='word_1_150' title='bbox 539 404 622 406; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 452 421 471 422">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 452 421 471 422">
+     <span class='ocr_line' id='line_1_44' title="bbox 452 421 471 422; baseline 0 594"><span class='ocrx_word' id='word_1_151' title='bbox 452 421 471 422; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 411 455 454 457">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 411 455 454 457">
+     <span class='ocr_line' id='line_1_45' title="bbox 411 455 454 457; baseline 0 559"><span class='ocrx_word' id='word_1_152' title='bbox 411 455 454 457; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 537 351 545 510">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 537 351 545 510">
+     <span class='ocr_line' id='line_1_46' title="bbox 537 351 545 510; baseline 0 506"><span class='ocrx_word' id='word_1_153' title='bbox 537 351 545 510; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 470 490 542 492">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 470 490 542 492">
+     <span class='ocr_line' id='line_1_47' title="bbox 470 490 542 492; baseline 0 524"><span class='ocrx_word' id='word_1_154' title='bbox 470 490 542 492; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 452 421 454 526">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 452 421 454 526">
+     <span class='ocr_line' id='line_1_48' title="bbox 452 421 454 526; baseline 0 490"><span class='ocrx_word' id='word_1_155' title='bbox 452 421 454 526; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 452 524 471 526">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 452 524 471 526">
+     <span class='ocr_line' id='line_1_49' title="bbox 452 524 471 526; baseline 0 490"><span class='ocrx_word' id='word_1_156' title='bbox 452 524 471 526; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 373 213 375 560">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 373 213 375 560">
+     <span class='ocr_line' id='line_1_50' title="bbox 373 213 375 560; baseline 0 456"><span class='ocrx_word' id='word_1_157' title='bbox 373 213 375 560; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 470 386 471 544">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 470 386 471 544">
+     <span class='ocr_line' id='line_1_51' title="bbox 470 386 471 544; baseline 0 472"><span class='ocrx_word' id='word_1_158' title='bbox 470 386 471 544; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 373 559 412 561">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 373 559 412 561">
+     <span class='ocr_line' id='line_1_52' title="bbox 373 559 412 561; baseline 0 455"><span class='ocrx_word' id='word_1_159' title='bbox 373 559 412 561; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 456 567 485 587">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 456 567 485 587">
+     <span class='ocr_line' id='line_1_53' title="bbox 456 567 485 587; baseline 0 0"><span class='ocrx_word' id='word_1_160' title='bbox 456 567 485 587; x_wconf 85' lang='eng'><em>89</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 500 578 612 579">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 500 578 612 579">
+     <span class='ocr_line' id='line_1_54' title="bbox 500 578 612 579; baseline 0 437"><span class='ocrx_word' id='word_1_161' title='bbox 500 578 612 579; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 439 594 500 596">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 439 594 500 596">
+     <span class='ocr_line' id='line_1_55' title="bbox 439 594 500 596; baseline 0 420"><span class='ocrx_word' id='word_1_162' title='bbox 439 594 500 596; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 499 578 500 613">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 499 578 500 613">
+     <span class='ocr_line' id='line_1_56' title="bbox 499 578 500 613; baseline 0 403"><span class='ocrx_word' id='word_1_163' title='bbox 499 578 500 613; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_34' title="bbox 378 596 406 617">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 378 596 406 617">
+     <span class='ocr_line' id='line_1_57' title="bbox 378 596 406 617; baseline 0 0"><span class='ocrx_word' id='word_1_164' title='bbox 378 596 406 617; x_wconf 92' lang='eng'>77</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_35' title="bbox 500 612 610 614">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 500 612 610 614">
+     <span class='ocr_line' id='line_1_58' title="bbox 500 612 610 614; baseline 0 402"><span class='ocrx_word' id='word_1_165' title='bbox 500 612 610 614; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_36' title="bbox 439 594 440 648">
+    <p class='ocr_par' dir='ltr' id='par_1_36' title="bbox 439 594 440 648">
+     <span class='ocr_line' id='line_1_59' title="bbox 439 594 440 648; baseline 0 368"><span class='ocrx_word' id='word_1_166' title='bbox 439 594 440 648; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_37' title="bbox 411 629 440 630">
+    <p class='ocr_par' dir='ltr' id='par_1_37' title="bbox 411 629 440 630">
+     <span class='ocr_line' id='line_1_60' title="bbox 411 629 440 630; baseline 0 386"><span class='ocrx_word' id='word_1_167' title='bbox 411 629 440 630; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_38' title="bbox 208 663 347 665">
+    <p class='ocr_par' dir='ltr' id='par_1_38' title="bbox 208 663 347 665">
+     <span class='ocr_line' id='line_1_61' title="bbox 208 663 347 665; baseline 0 351"><span class='ocrx_word' id='word_1_168' title='bbox 208 663 347 665; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_39' title="bbox 478 697 525 700">
+    <p class='ocr_par' dir='ltr' id='par_1_39' title="bbox 478 697 525 700">
+     <span class='ocr_line' id='line_1_62' title="bbox 478 697 525 700; baseline 0 316"><span class='ocrx_word' id='word_1_169' title='bbox 478 697 525 700; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_40' title="bbox 523 681 525 718">
+    <p class='ocr_par' dir='ltr' id='par_1_40' title="bbox 523 681 525 718">
+     <span class='ocr_line' id='line_1_63' title="bbox 523 681 525 718; baseline 0 298"><span class='ocrx_word' id='word_1_170' title='bbox 523 681 525 718; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_41' title="bbox 413 733 480 734">
+    <p class='ocr_par' dir='ltr' id='par_1_41' title="bbox 413 733 480 734">
+     <span class='ocr_line' id='line_1_64' title="bbox 413 733 480 734; baseline 0 282"><span class='ocrx_word' id='word_1_171' title='bbox 413 733 480 734; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_42' title="bbox 478 698 480 752">
+    <p class='ocr_par' dir='ltr' id='par_1_42' title="bbox 478 698 480 752">
+     <span class='ocr_line' id='line_1_65' title="bbox 478 698 480 752; baseline 0 264"><span class='ocrx_word' id='word_1_172' title='bbox 478 698 480 752; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_43' title="bbox 411 455 415 803">
+    <p class='ocr_par' dir='ltr' id='par_1_43' title="bbox 411 455 415 803">
+     <span class='ocr_line' id='line_1_66' title="bbox 411 455 415 803; baseline 0 213"><span class='ocrx_word' id='word_1_173' title='bbox 411 455 415 803; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_44' title="bbox 413 802 488 803">
+    <p class='ocr_par' dir='ltr' id='par_1_44' title="bbox 413 802 488 803">
+     <span class='ocr_line' id='line_1_67' title="bbox 413 802 488 803; baseline 0 213"><span class='ocrx_word' id='word_1_174' title='bbox 413 802 488 803; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_45' title="bbox 346 282 347 838">
+    <p class='ocr_par' dir='ltr' id='par_1_45' title="bbox 346 282 347 838">
+     <span class='ocr_line' id='line_1_68' title="bbox 346 282 347 838; baseline 0 178"><span class='ocrx_word' id='word_1_175' title='bbox 346 282 347 838; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_46' title="bbox 487 786 488 822">
+    <p class='ocr_par' dir='ltr' id='par_1_46' title="bbox 487 786 488 822">
+     <span class='ocr_line' id='line_1_69' title="bbox 487 786 488 822; baseline 0 194"><span class='ocrx_word' id='word_1_176' title='bbox 487 786 488 822; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_47' title="bbox 346 837 404 838">
+    <p class='ocr_par' dir='ltr' id='par_1_47' title="bbox 346 837 404 838">
+     <span class='ocr_line' id='line_1_70' title="bbox 346 837 404 838; baseline 0 178"><span class='ocrx_word' id='word_1_177' title='bbox 346 837 404 838; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_48' title="bbox 403 767 404 856">
+    <p class='ocr_par' dir='ltr' id='par_1_48' title="bbox 403 767 404 856">
+     <span class='ocr_line' id='line_1_71' title="bbox 403 767 404 856; baseline 0 160"><span class='ocrx_word' id='word_1_178' title='bbox 403 767 404 856; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_49' title="bbox 6 870 209 873">
+    <p class='ocr_par' dir='ltr' id='par_1_49' title="bbox 6 870 209 873">
+     <span class='ocr_line' id='line_1_72' title="bbox 6 870 209 873; baseline 0 143"><span class='ocrx_word' id='word_1_179' title='bbox 6 870 209 873; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_50' title="bbox 6 871 7 995">
+    <p class='ocr_par' dir='ltr' id='par_1_50' title="bbox 6 871 7 995">
+     <span class='ocr_line' id='line_1_73' title="bbox 6 871 7 995; baseline 0 21"><span class='ocrx_word' id='word_1_180' title='bbox 6 871 7 995; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_51' title="bbox 383 880 1150 948">
+    <p class='ocr_par' dir='ltr' id='par_1_51' title="bbox 383 880 1150 948">
+     <span class='ocr_line' id='line_1_74' title="bbox 383 880 1002 912; baseline -0.002 -6"><span class='ocrx_word' id='word_1_181' title='bbox 383 889 429 891; x_wconf 85' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_182' title='bbox 438 883 592 906; x_wconf 87' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_183' title='bbox 601 882 731 906; x_wconf 86' lang='eng' dir='ltr'><em>marisflavi</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 739 880 834 906; x_wconf 90' lang='eng' dir='ltr'><em>SW32T</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 844 882 937 912; x_wconf 90' lang='eng' dir='ltr'><em>(AF251</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 946 882 1002 912; x_wconf 90' lang='eng'><em>143)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_75' title="bbox 383 916 1150 948; baseline -0.001 -6"><span class='ocrx_word' id='word_1_187' title='bbox 383 925 578 927; x_wconf 32' lang='eng'>*</span> <span class='ocrx_word' id='word_1_188' title='bbox 585 919 738 942; x_wconf 88' lang='eng' dir='ltr'><em>Halomonas</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 748 919 875 942; x_wconf 87' lang='eng' dir='ltr'><em>indalinina</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 885 916 985 942; x_wconf 90' lang='eng' dir='ltr'><em>CG2.1T</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 995 919 1150 948; x_wconf 87' lang='eng' dir='ltr'><em>(AJ427627)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_52' title="bbox 215 951 996 1016">
+    <p class='ocr_par' dir='ltr' id='par_1_52' title="bbox 215 951 996 1016">
+     <span class='ocr_line' id='line_1_76' title="bbox 356 951 996 982; baseline 0 -6"><span class='ocrx_word' id='word_1_192' title='bbox 356 953 560 976; x_wconf 86' lang='eng' dir='ltr'><em>—Ha/omonas</em></span> <span class='ocrx_word' id='word_1_193' title='bbox 569 953 713 976; x_wconf 87' lang='eng' dir='ltr'><em>av/cenniae</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 724 951 823 976; x_wconf 89' lang='eng' dir='ltr'><em>MW2aT</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 831 953 996 982; x_wconf 81' lang='eng' dir='ltr'><em>(D0888315)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_77' title="bbox 215 984 787 1016; baseline 0 -7"><span class='ocrx_word' id='word_1_196' title='bbox 215 987 234 1009; x_wconf 94' lang='eng' dir='ltr'><em>Z</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 233 987 378 1016; x_wconf 78' lang='eng' dir='ltr'><em>ymobacter</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 384 987 483 1015; x_wconf 85' lang='eng' dir='ltr'><em>palmae</em></span> <span class='ocrx_word' id='word_1_199' title='bbox 495 987 545 1009; x_wconf 94' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 558 984 652 1009; x_wconf 82' lang='eng' dir='ltr'><em>14233T</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 663 986 787 1016; x_wconf 89' lang='eng' dir='ltr'><em>(D14555)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_53' title="bbox 354 906 383 908">
+    <p class='ocr_par' dir='ltr' id='par_1_53' title="bbox 354 906 383 908">
+     <span class='ocr_line' id='line_1_78' title="bbox 354 906 383 908; baseline 0 108"><span class='ocrx_word' id='word_1_202' title='bbox 354 906 383 908; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_54' title="bbox 382 889 383 926">
+    <p class='ocr_par' dir='ltr' id='par_1_54' title="bbox 382 889 383 926">
+     <span class='ocr_line' id='line_1_79' title="bbox 382 889 383 926; baseline 0 90"><span class='ocrx_word' id='word_1_203' title='bbox 382 889 383 926; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_55' title="bbox 208 663 209 942">
+    <p class='ocr_par' dir='ltr' id='par_1_55' title="bbox 208 663 209 942">
+     <span class='ocr_line' id='line_1_80' title="bbox 208 663 209 942; baseline 0 74"><span class='ocrx_word' id='word_1_204' title='bbox 208 663 209 942; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_56' title="bbox 208 940 356 943">
+    <p class='ocr_par' dir='ltr' id='par_1_56' title="bbox 208 940 356 943">
+     <span class='ocr_line' id='line_1_81' title="bbox 208 940 356 943; baseline 0 73"><span class='ocrx_word' id='word_1_205' title='bbox 208 940 356 943; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_57' title="bbox 354 906 356 961">
+    <p class='ocr_par' dir='ltr' id='par_1_57' title="bbox 354 906 356 961">
+     <span class='ocr_line' id='line_1_82' title="bbox 354 906 356 961; baseline 0 55"><span class='ocrx_word' id='word_1_206' title='bbox 354 906 356 961; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003525-0-001.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003525-0-001.pbm.png
new file mode 100644
index 00000000..eb883dab
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003525-0-001.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003525-0-001.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003525-0-001.pbm.png.hocr
new file mode 100644
index 00000000..be0d14b3
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003525-0-001.pbm.png.hocr
@@ -0,0 +1,140 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003525-0-001.pbm.png"; bbox 0 0 1716 1112; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 227 170 270 186">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 227 170 270 186">
+     <span class='ocr_line' id='line_1_1' title="bbox 227 170 270 186; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 227 170 270 186; x_wconf 89' lang='eng'><em>0.10</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 598 187 634 203">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 598 187 634 203">
+     <span class='ocr_line' id='line_1_2' title="bbox 598 187 634 203; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 598 187 634 203; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 532 291 568 307">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 532 291 568 307">
+     <span class='ocr_line' id='line_1_3' title="bbox 532 291 568 307; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 532 291 568 307; x_wconf 90' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 544 863 580 879">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 544 863 580 879">
+     <span class='ocr_line' id='line_1_4' title="bbox 544 863 580 879; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 544 863 580 879; x_wconf 91' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 664 2 1470 390">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 664 2 1470 390">
+     <span class='ocr_line' id='line_1_5' title="bbox 747 2 1408 31; baseline 0 -4"><span class='ocrx_word' id='word_1_5' title='bbox 747 8 768 23; x_wconf 86' lang='eng'><em>91</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 813 4 960 27; x_wconf 77' lang='eng' dir='ltr'><em>‘Geobacter</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 968 5 1161 27; x_wconf 84' lang='eng' dir='ltr'><em>humireducens’</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 1172 5 1231 27; x_wconf 86' lang='eng' dir='ltr'><em>JW3</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 1243 2 1408 31; x_wconf 85' lang='eng' dir='ltr'>(AY187306)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 700 40 1335 69; baseline 0 -4"><span class='ocrx_word' id='word_1_10' title='bbox 700 43 725 59; x_wconf 72' lang='eng'>54</span> <span class='ocrx_word' id='word_1_11' title='bbox 836 42 975 65; x_wconf 81' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 983 43 1119 65; x_wconf 86' lang='eng' dir='ltr'><em>bremensis</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1130 41 1195 65; x_wconf 75' lang='eng' dir='ltr'><em>Dfr1T</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 1205 40 1301 69; x_wconf 88' lang='eng' dir='ltr'>(U9691</span> <span class='ocrx_word' id='word_1_15' title='bbox 1311 40 1335 69; x_wconf 91' lang='eng'><em>7)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 783 76 1406 106; baseline 0 -5"><span class='ocrx_word' id='word_1_16' title='bbox 783 78 929 101; x_wconf 88' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 939 79 1139 106; x_wconf 81' lang='eng' dir='ltr'><em>toluenoxydans</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 1149 77 1231 101; x_wconf 89' lang='eng' dir='ltr'><em>TMJ1T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1241 76 1406 106; x_wconf 90' lang='eng' dir='ltr'>(EU711072)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 732 111 1298 143; baseline 0 -7"><span class='ocrx_word' id='word_1_20' title='bbox 732 113 758 129; x_wconf 71' lang='eng'><em>85</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 822 114 961 136; x_wconf 84' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 970 114 1088 143; x_wconf 74' lang='eng' dir='ltr'><em>chapel/6i</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 1099 115 1106 136; x_wconf 96' lang='eng'>1</span> <span class='ocrx_word' id='word_1_24' title='bbox 1116 112 1159 136; x_wconf 88' lang='eng' dir='ltr'><em>72T</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1169 111 1298 141; x_wconf 86' lang='eng' dir='ltr'>(U41561)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 664 147 1398 178; baseline -0.001 -6"><span class='ocrx_word' id='word_1_26' title='bbox 664 149 685 165; x_wconf 74' lang='eng'><em>61</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 821 149 964 172; x_wconf 84' lang='eng' dir='ltr'><em>Pelobacter</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 971 149 1125 178; x_wconf 82' lang='eng' dir='ltr'><em>propionicus</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1136 149 1177 172; x_wconf 86' lang='eng' dir='ltr'><em>Ott</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1188 149 1223 172; x_wconf 90' lang='eng' dir='ltr'>Bd</span> <span class='ocrx_word' id='word_1_31' title='bbox 1237 148 1261 171; x_wconf 91' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1271 147 1398 176; x_wconf 84' lang='eng' dir='ltr'>(X70954)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 814 183 1312 214; baseline 0 -7"><span class='ocrx_word' id='word_1_33' title='bbox 814 185 953 207; x_wconf 80' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 960 185 1096 214; x_wconf 84' lang='eng' dir='ltr'><em>pelophilus</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1107 184 1172 207; x_wconf 77' lang='eng' dir='ltr'><em>Dfr2T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1182 183 1312 212; x_wconf 87' lang='eng' dir='ltr'>(U96918)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 717 218 1327 249; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 717 223 754 239; x_wconf 84' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 776 220 914 243; x_wconf 82' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 922 221 1027 249; x_wconf 81' lang='eng' dir='ltr'><em>grbiciae</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 1036 219 1154 243; x_wconf 77' lang='eng' dir='ltr'><em>TACP-5T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 1164 218 1275 247; x_wconf 85' lang='eng' dir='ltr'>(AF3351</span> <span class='ocrx_word' id='word_1_42' title='bbox 1284 218 1327 247; x_wconf 86' lang='eng'><em>83)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 664 254 1382 283; baseline -0.001 -4"><span class='ocrx_word' id='word_1_43' title='bbox 664 256 689 272; x_wconf 81' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 781 256 920 279; x_wconf 83' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 928 256 1136 279; x_wconf 80' lang='eng' dir='ltr'><em>metallireducens</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1146 255 1248 279; x_wconf 63' lang='eng' dir='ltr'><em>(ES-15T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1258 254 1382 283; x_wconf 89' lang='eng' dir='ltr'>(LO7834)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 762 289 1325 319; baseline -0.002 -4"><span class='ocrx_word' id='word_1_48' title='bbox 762 292 901 315; x_wconf 85' lang='eng' dir='ltr'><em>Geobacter</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 909 292 1104 315; x_wconf 83' lang='eng' dir='ltr'><em>sulfurreducens</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1116 290 1186 315; x_wconf 91' lang='eng' dir='ltr'><em>PCAT</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 1196 289 1223 319; x_wconf 90' lang='eng' dir='ltr'><em>(U</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 1230 293 1237 314; x_wconf 96' lang='eng'>1</span> <span class='ocrx_word' id='word_1_53' title='bbox 1245 290 1325 319; x_wconf 87' lang='eng'><em>3928)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 712 325 1470 356; baseline 0 -6"><span class='ocrx_word' id='word_1_54' title='bbox 712 327 748 343; x_wconf 67' lang='eng'><em>‘00</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 862 328 1078 350; x_wconf 81' lang='eng' dir='ltr'><em>Desu/furornonas</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 1087 328 1211 356; x_wconf 79' lang='eng' dir='ltr'><em>palm/tatis</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 1221 326 1331 350; x_wconf 87' lang='eng' dir='ltr'><em>SDBY1T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1341 325 1419 354; x_wconf 85' lang='eng' dir='ltr'>(U281</span> <span class='ocrx_word' id='word_1_59' title='bbox 1428 325 1470 354; x_wconf 86' lang='eng'>72)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 688 361 1455 390; baseline -0.001 -4"><span class='ocrx_word' id='word_1_60' title='bbox 688 362 725 378; x_wconf 76' lang='eng'><em>‘00</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 865 363 1008 386; x_wconf 80' lang='eng' dir='ltr'><em>Pe/obacter</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 1017 363 1175 386; x_wconf 79' lang='eng' dir='ltr'><em>carbinolicus</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 1185 363 1234 386; x_wconf 85' lang='eng' dir='ltr'><em>Gra</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 1245 363 1280 386; x_wconf 93' lang='eng' dir='ltr'>Bd</span> <span class='ocrx_word' id='word_1_65' title='bbox 1294 362 1318 385; x_wconf 92' lang='eng' dir='ltr'><em>1T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 1328 361 1455 390; x_wconf 87' lang='eng' dir='ltr'>(X79413)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 849 396 1525 461">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 849 396 1525 461">
+     <span class='ocr_line' id='line_1_16' title="bbox 851 396 1525 426; baseline 0 -5"><span class='ocrx_word' id='word_1_67' title='bbox 851 399 1067 421; x_wconf 81' lang='eng' dir='ltr'><em>Desu/furomonas</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1077 399 1233 421; x_wconf 73' lang='eng' dir='ltr'><em>acetoxidans</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1244 399 1308 422; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1320 398 1382 421; x_wconf 89' lang='eng' dir='ltr'><em>684T</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 1392 396 1525 426; x_wconf 85' lang='eng' dir='ltr'><em>(M26634)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 849 429 1446 461; baseline 0.002 -8"><span class='ocrx_word' id='word_1_72' title='bbox 849 436 873 452; x_wconf 91' lang='eng'><em>74</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 914 432 1160 461; x_wconf 82' lang='eng' dir='ltr'><em>Desulfosporosinus</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 1170 439 1206 461; x_wconf 84' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 1218 432 1273 455; x_wconf 89' lang='eng' dir='ltr'><em>S10</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1284 429 1446 459; x_wconf 85' lang='eng' dir='ltr'>(AFO76527)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 791 465 1557 570">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 791 465 1557 570">
+     <span class='ocr_line' id='line_1_18' title="bbox 846 465 1427 497; baseline 0.003 -9"><span class='ocrx_word' id='word_1_77' title='bbox 846 472 870 488; x_wconf 81' lang='eng'><em>97</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 917 468 1163 496; x_wconf 79' lang='eng' dir='ltr'><em>Desu/fosporosinus</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1173 475 1209 497; x_wconf 91' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1220 468 1248 490; x_wconf 93' lang='eng' dir='ltr'>T1</span> <span class='ocrx_word' id='word_1_81' title='bbox 1265 465 1427 495; x_wconf 88' lang='eng' dir='ltr'>(AFO76525)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 815 503 1557 534; baseline 0 -6"><span class='ocrx_word' id='word_1_82' title='bbox 815 507 840 523; x_wconf 79' lang='eng'>96</span> <span class='ocrx_word' id='word_1_83' title='bbox 917 506 1163 534; x_wconf 79' lang='eng' dir='ltr'><em>Desu/fosporosinus</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 1173 506 1255 534; x_wconf 84' lang='eng' dir='ltr'><em>hippei</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 1264 505 1327 528; x_wconf 92' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1339 504 1419 528; x_wconf 82' lang='eng' dir='ltr'><em>8344T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 1429 503 1468 532; x_wconf 92' lang='eng' dir='ltr'>(Y1</span> <span class='ocrx_word' id='word_1_88' title='bbox 1479 503 1557 532; x_wconf 88' lang='eng'>1571)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 791 539 1526 570; baseline -0.001 -6"><span class='ocrx_word' id='word_1_89' title='bbox 791 543 816 559; x_wconf 84' lang='eng'><em>94</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 923 541 1168 570; x_wconf 85' lang='eng' dir='ltr'><em>Desu/fosporosinus</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 1179 541 1247 564; x_wconf 86' lang='eng' dir='ltr'><em>lacus</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 1257 541 1324 564; x_wconf 89' lang='eng' dir='ltr'>STP1</span> <span class='ocrx_word' id='word_1_93' title='bbox 1333 540 1359 563; x_wconf 85' lang='eng' dir='ltr'><em>2T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 1368 539 1526 568; x_wconf 74' lang='eng' dir='ltr'>(A1582757)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 865 574 1508 637">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 865 574 1508 637">
+     <span class='ocr_line' id='line_1_21' title="bbox 870 574 1508 606; baseline 0 -7"><span class='ocrx_word' id='word_1_95' title='bbox 870 577 1116 606; x_wconf 85' lang='eng' dir='ltr'><em>Desulfosporosinus</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 1127 577 1221 599; x_wconf 77' lang='eng' dir='ltr'><em>orient/&#39;5</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 1233 576 1297 599; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1310 575 1371 599; x_wconf 80' lang='eng' dir='ltr'><em>765T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1381 575 1420 604; x_wconf 91' lang='eng' dir='ltr'>(Y1</span> <span class='ocrx_word' id='word_1_100' title='bbox 1430 574 1508 604; x_wconf 86' lang='eng'>1570)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 865 608 1504 637; baseline 0.002 -6"><span class='ocrx_word' id='word_1_101' title='bbox 865 615 889 631; x_wconf 82' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 997 611 1174 633; x_wconf 83' lang='eng' dir='ltr'><em>Deha/obacter</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 1183 611 1303 633; x_wconf 81' lang='eng' dir='ltr'><em>restrictus</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 1312 611 1367 632; x_wconf 95' lang='eng' dir='ltr'><em>TEA</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1377 608 1452 637; x_wconf 92' lang='eng' dir='ltr'>(Y101</span> <span class='ocrx_word' id='word_1_106' title='bbox 1461 608 1504 637; x_wconf 88' lang='eng'><em>64)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 686 643 1715 924">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 686 643 1715 924">
+     <span class='ocr_line' id='line_1_23' title="bbox 739 643 1657 675; baseline 0.002 -9"><span class='ocrx_word' id='word_1_107' title='bbox 739 650 763 666; x_wconf 84' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1041 646 1274 675; x_wconf 80' lang='eng' dir='ltr'><em>Syntrophobotu/us</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 1283 646 1414 675; x_wconf 77' lang='eng' dir='ltr'><em>glycol/Gus</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 1424 646 1518 675; x_wconf 90' lang='eng' dir='ltr'><em>SIGIym</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 1530 643 1657 673; x_wconf 88' lang='eng' dir='ltr'>(X99706)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 889 679 1577 708; baseline 0.003 -6"><span class='ocrx_word' id='word_1_112' title='bbox 889 686 914 702; x_wconf 84' lang='eng'>92</span> <span class='ocrx_word' id='word_1_113' title='bbox 953 681 1200 704; x_wconf 82' lang='eng' dir='ltr'><em>Desu/ﬁtobacterium</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 1211 682 1337 704; x_wconf 81' lang='eng' dir='ltr'><em>hafniense</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 1348 681 1431 704; x_wconf 87' lang='eng' dir='ltr'>PCP-1</span> <span class='ocrx_word' id='word_1_116' title='bbox 1448 679 1577 708; x_wconf 89' lang='eng' dir='ltr'>(U40078)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 861 717 1576 746; baseline 0 -4"><span class='ocrx_word' id='word_1_117' title='bbox 861 722 880 738; x_wconf 83' lang='eng'><em>71</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 939 720 1186 742; x_wconf 81' lang='eng' dir='ltr'><em>Desu/ﬁtobacterium</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 1197 720 1324 742; x_wconf 76' lang='eng' dir='ltr'><em>hafniense</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 1335 718 1438 742; x_wconf 84' lang='eng' dir='ltr'><em>DOB-2T</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 1448 717 1576 746; x_wconf 89' lang='eng' dir='ltr'>(X94975)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 838 753 1606 784; baseline 0 -7"><span class='ocrx_word' id='word_1_122' title='bbox 838 757 862 773; x_wconf 81' lang='eng'><em>63</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 912 755 1159 778; x_wconf 80' lang='eng' dir='ltr'><em>Desu/fitobacterium</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 1170 755 1372 784; x_wconf 79' lang='eng' dir='ltr'><em>chlororespirans</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 1382 754 1467 778; x_wconf 80' lang='eng' dir='ltr'><em>0023T</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 1477 753 1606 782; x_wconf 87' lang='eng' dir='ltr'><em>(U68528)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 802 788 1667 820; baseline 0 -7"><span class='ocrx_word' id='word_1_127' title='bbox 802 793 826 809; x_wconf 89' lang='eng'><em>50</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 914 791 1161 813; x_wconf 81' lang='eng' dir='ltr'><em>Desu/ﬁtobacterium</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 1173 791 1357 820; x_wconf 85' lang='eng' dir='ltr'><em>deha/ogenans</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 1366 789 1533 813; x_wconf 91' lang='eng' dir='ltr'><em>JW/IU-DC1T</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 1543 788 1667 818; x_wconf 86' lang='eng' dir='ltr'>(L28946)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 789 824 1715 853; baseline -0.001 -4"><span class='ocrx_word' id='word_1_132' title='bbox 789 829 813 845; x_wconf 82' lang='eng'>76</span> <span class='ocrx_word' id='word_1_133' title='bbox 936 826 1183 849; x_wconf 82' lang='eng' dir='ltr'><em>Desulfitobacterium</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 1194 827 1402 849; x_wconf 84' lang='eng' dir='ltr'><em>meta/lireducens</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 1412 825 1542 848; x_wconf 80' lang='eng' dir='ltr'><em>853—15AT</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 1552 824 1715 853; x_wconf 83' lang='eng' dir='ltr'>(AF297871)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 927 860 1697 889; baseline -0.001 -4"><span class='ocrx_word' id='word_1_137' title='bbox 927 862 1191 885; x_wconf 87' lang='eng' dir='ltr'><em>Desulfitobacterium</em></span> <span class='ocrx_word' id='word_1_138' title='bbox 1202 862 1426 885; x_wconf 87' lang='eng' dir='ltr'><em>aromaticivorans</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 1437 861 1521 885; x_wconf 87' lang='eng' dir='ltr'><em>UKTLT</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 1532 860 1697 889; x_wconf 92' lang='eng' dir='ltr'>(EU711071)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 686 895 1673 924; baseline 0 -4"><span class='ocrx_word' id='word_1_141' title='bbox 686 900 711 916; x_wconf 81' lang='eng'>68</span> <span class='ocrx_word' id='word_1_142' title='bbox 967 898 1213 920; x_wconf 82' lang='eng' dir='ltr'><em>Desulfotomaculum</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 1224 898 1371 920; x_wconf 85' lang='eng' dir='ltr'><em>kuznetsovii</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 1380 897 1444 921; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 1456 899 1484 920; x_wconf 86' lang='eng'><em>61</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 1494 896 1536 920; x_wconf 84' lang='eng' dir='ltr'><em>15T</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 1546 895 1585 924; x_wconf 94' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 1596 899 1603 920; x_wconf 96' lang='eng'>1</span> <span class='ocrx_word' id='word_1_149' title='bbox 1612 895 1673 924; x_wconf 85' lang='eng'>569)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 631 928 1467 960">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 631 928 1467 960">
+     <span class='ocr_line' id='line_1_31' title="bbox 631 928 1467 960; baseline 0.001 -8"><span class='ocrx_word' id='word_1_150' title='bbox 631 936 656 952; x_wconf 83' lang='eng'><em>97</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 923 931 1169 954; x_wconf 84' lang='eng' dir='ltr'><em>Desu/fotomacu/um</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 1179 938 1215 960; x_wconf 85' lang='eng' dir='ltr'><em>sp.</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 1228 931 1298 954; x_wconf 85' lang='eng' dir='ltr'><em>0x39</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 1310 928 1467 958; x_wconf 86' lang='eng' dir='ltr'>(AJ577273)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 455 1006 492 1022">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 455 1006 492 1022">
+     <span class='ocr_line' id='line_1_32' title="bbox 455 1006 492 1022; baseline 0 0"><span class='ocrx_word' id='word_1_155' title='bbox 455 1006 492 1022; x_wconf 88' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 648 967 1669 1034">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 648 967 1669 1034">
+     <span class='ocr_line' id='line_1_33' title="bbox 969 967 1669 996; baseline -0.001 -4"><span class='ocrx_word' id='word_1_156' title='bbox 969 969 1216 992; x_wconf 79' lang='eng' dir='ltr'><em>Desul/otomaculum</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 1226 969 1382 992; x_wconf 81' lang='eng' dir='ltr'><em>acetoxidans</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 1394 969 1457 992; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 1470 968 1531 991; x_wconf 90' lang='eng' dir='ltr'><em>771T</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 1542 967 1581 996; x_wconf 94' lang='eng' dir='ltr'>(Y1</span> <span class='ocrx_word' id='word_1_161' title='bbox 1591 967 1669 996; x_wconf 88' lang='eng'><em>1566)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 648 1002 1278 1034; baseline 0 -7"><span class='ocrx_word' id='word_1_162' title='bbox 648 1005 879 1034; x_wconf 84' lang='eng' dir='ltr'><em>Hydrogenobacter</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 888 1005 1057 1033; x_wconf 82' lang='eng' dir='ltr'><em>thermophi/us</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 1066 1003 1141 1027; x_wconf 88' lang='eng' dir='ltr'><em>TK-6T</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 1151 1002 1278 1032; x_wconf 86' lang='eng'>(230214)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 553 1038 1150 1105">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 553 1038 1150 1105">
+     <span class='ocr_line' id='line_1_35' title="bbox 614 1038 1150 1067; baseline 0 -5"><span class='ocrx_word' id='word_1_166' title='bbox 614 1040 782 1063; x_wconf 84' lang='eng' dir='ltr'><em>Thermocrinis</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 793 1040 862 1063; x_wconf 89' lang='eng' dir='ltr'><em>ruber</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 870 1040 917 1063; x_wconf 92' lang='eng' dir='ltr'><em>OC</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 930 1039 982 1062; x_wconf 81' lang='eng' dir='ltr'><em>1/4T</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 993 1038 1150 1067; x_wconf 86' lang='eng' dir='ltr'><em>(AJ005640)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 553 1073 1035 1105; baseline 0 -7"><span class='ocrx_word' id='word_1_171' title='bbox 553 1076 654 1105; x_wconf 76' lang='eng' dir='ltr'><em>Aquifex</em></span> <span class='ocrx_word' id='word_1_172' title='bbox 660 1076 797 1105; x_wconf 84' lang='eng' dir='ltr'><em>pyrophilus</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 808 1075 892 1098; x_wconf 74' lang='eng' dir='ltr'><em>Ko|5aT</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 902 1073 1035 1103; x_wconf 87' lang='eng' dir='ltr'><em>(M83548)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003541-0-000.pbm.png b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003541-0-000.pbm.png
new file mode 100644
index 00000000..c9aab033
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003541-0-000.pbm.png differ
diff --git a/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003541-0-000.pbm.png.hocr b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003541-0-000.pbm.png.hocr
new file mode 100644
index 00000000..93e7da84
--- /dev/null
+++ b/examples/hocr-tesseract-ijsem-140/sourceimages/ijs.0.003541-0-000.pbm.png.hocr
@@ -0,0 +1,243 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003541-0-000.pbm.png"; bbox 0 0 1716 1138; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 38 9 80 29">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 38 9 80 29">
+     <span class='ocr_line' id='line_1_1' title="bbox 38 9 80 29; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 38 9 80 29; x_wconf 85' lang='eng'>1%</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 351 60 1022 146">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 351 60 1022 146">
+     <span class='ocr_line' id='line_1_2' title="bbox 495 60 879 88; baseline 0 -6"><span class='ocrx_word' id='word_1_2' title='bbox 495 63 518 82; x_wconf 98' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_3' title='bbox 530 60 729 82; x_wconf 76' lang='eng' dir='ltr'>towneriAB1110T</span> <span class='ocrx_word' id='word_1_4' title='bbox 740 62 879 88; x_wconf 88' lang='eng' dir='ltr'>(AF509823)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 360 92 1022 117; baseline 0 -5"><span class='ocrx_word' id='word_1_5' title='bbox 360 92 527 112; x_wconf 85' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_6' title='bbox 534 92 634 117; x_wconf 89' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_7' title='bbox 643 92 733 117; x_wconf 86' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_8' title='bbox 744 92 806 112; x_wconf 92' lang='eng' dir='ltr'>15TU</span> <span class='ocrx_word' id='word_1_9' title='bbox 817 92 836 111; x_wconf 93' lang='eng' dir='ltr'>M</span> <span class='ocrx_word' id='word_1_10' title='bbox 848 92 904 112; x_wconf 89' lang='eng' dir='ltr'>151a</span> <span class='ocrx_word' id='word_1_11' title='bbox 914 92 1022 117; x_wconf 88' lang='eng'>(293448)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 351 119 843 146; baseline 0 -5"><span class='ocrx_word' id='word_1_12' title='bbox 351 121 374 141; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_13' title='bbox 385 121 552 141; x_wconf 84' lang='eng' dir='ltr'>radioresistens</span> <span class='ocrx_word' id='word_1_14' title='bbox 560 121 632 141; x_wconf 93' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_15' title='bbox 641 119 726 141; x_wconf 91' lang='eng' dir='ltr'>43998T</span> <span class='ocrx_word' id='word_1_16' title='bbox 736 121 843 146; x_wconf 88' lang='eng'>(293445)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 287 148 771 202">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 287 148 771 201">
+     <span class='ocr_line' id='line_1_5' title="bbox 310 148 725 176; baseline 0 -6"><span class='ocrx_word' id='word_1_17' title='bbox 310 150 335 170; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_18' title='bbox 347 150 485 170; x_wconf 85' lang='eng' dir='ltr'>venetianus</span> <span class='ocrx_word' id='word_1_19' title='bbox 495 148 588 170; x_wconf 91' lang='eng' dir='ltr'>RAG-1T</span> <span class='ocrx_word' id='word_1_20' title='bbox 595 150 725 176; x_wconf 87' lang='eng' dir='ltr'>(AJ295007</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 287 173 771 201; baseline 0.002 -6"><span class='ocrx_word' id='word_1_21' title='bbox 287 173 333 195; x_wconf 82' lang='eng' dir='ltr'>61A.</span> <span class='ocrx_word' id='word_1_22' title='bbox 345 176 484 196; x_wconf 86' lang='eng' dir='ltr'>venetianus</span> <span class='ocrx_word' id='word_1_23' title='bbox 494 176 545 196; x_wconf 95' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_24' title='bbox 555 176 613 196; x_wconf 87' lang='eng'>4379</span> <span class='ocrx_word' id='word_1_25' title='bbox 623 176 717 201; x_wconf 88' lang='eng' dir='ltr'>(AM909</span> <span class='ocrx_word' id='word_1_26' title='bbox 734 176 771 201; x_wconf 92' lang='eng'>51)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 286 195 765 288">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 286 195 765 287">
+     <span class='ocr_line' id='line_1_7' title="bbox 287 195 765 233; baseline 0 -9"><span class='ocrx_word' id='word_1_27' title='bbox 287 195 332 233; x_wconf 52' lang='eng' dir='ltr'><em>21A.</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 344 204 482 224; x_wconf 82' lang='eng' dir='ltr'>venetianus</span> <span class='ocrx_word' id='word_1_29' title='bbox 492 204 544 224; x_wconf 95' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_30' title='bbox 554 204 612 224; x_wconf 90' lang='eng'><strong>8758</strong></span> <span class='ocrx_word' id='word_1_31' title='bbox 622 204 765 229; x_wconf 86' lang='eng' dir='ltr'>(EU258609)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 286 232 765 260; baseline 0 -8"><span class='ocrx_word' id='word_1_32' title='bbox 286 232 332 260; x_wconf 38' lang='eng' dir='ltr'>1054i.</span> <span class='ocrx_word' id='word_1_33' title='bbox 344 232 482 252; x_wconf 87' lang='eng' dir='ltr'>venetianus</span> <span class='ocrx_word' id='word_1_34' title='bbox 492 232 544 252; x_wconf 93' lang='eng' dir='ltr'><strong>LUH</strong></span> <span class='ocrx_word' id='word_1_35' title='bbox 554 232 612 252; x_wconf 88' lang='eng'>7437</span> <span class='ocrx_word' id='word_1_36' title='bbox 622 232 765 257; x_wconf 88' lang='eng' dir='ltr'>(EU258610)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 306 261 765 287; baseline 0.002 -6"><span class='ocrx_word' id='word_1_37' title='bbox 306 262 332 281; x_wconf 90' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_38' title='bbox 343 262 482 282; x_wconf 86' lang='eng' dir='ltr'>venetianus</span> <span class='ocrx_word' id='word_1_39' title='bbox 492 262 544 282; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_40' title='bbox 554 262 611 282; x_wconf 88' lang='eng'>5627</span> <span class='ocrx_word' id='word_1_41' title='bbox 622 261 765 287; x_wconf 82' lang='eng' dir='ltr'>(EU258608)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 317 294 1118 702">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 425 294 830 322">
+     <span class='ocr_line' id='line_1_10' title="bbox 425 294 830 322; baseline 0.002 -6"><span class='ocrx_word' id='word_1_42' title='bbox 425 296 448 316; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_43' title='bbox 460 296 545 322; x_wconf 85' lang='eng' dir='ltr'>ursingii</span> <span class='ocrx_word' id='word_1_44' title='bbox 554 296 604 317; x_wconf 96' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_45' title='bbox 615 294 684 317; x_wconf 82' lang='eng' dir='ltr'>3792T</span> <span class='ocrx_word' id='word_1_46' title='bbox 693 296 830 322; x_wconf 87' lang='eng' dir='ltr'>(AJ275038)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 380 325 689 353">
+     <span class='ocr_line' id='line_1_11' title="bbox 380 325 689 353; baseline 0 -6"><span class='ocrx_word' id='word_1_47' title='bbox 380 328 403 347; x_wconf 93' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_48' title='bbox 415 328 484 353; x_wconf 86' lang='eng' dir='ltr'><em>baylyi</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 492 325 534 347; x_wconf 79' lang='eng' dir='ltr'>BzT</span> <span class='ocrx_word' id='word_1_50' title='bbox 544 327 689 353; x_wconf 91' lang='eng' dir='ltr'>(AM410709)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 337 357 1117 470">
+     <span class='ocr_line' id='line_1_12' title="bbox 400 357 784 383; baseline 0 -6"><span class='ocrx_word' id='word_1_51' title='bbox 400 358 423 377; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_52' title='bbox 435 357 581 377; x_wconf 84' lang='eng' dir='ltr'>IwoffiiATCC</span> <span class='ocrx_word' id='word_1_53' title='bbox 593 358 664 377; x_wconf 87' lang='eng'>17925</span> <span class='ocrx_word' id='word_1_54' title='bbox 674 357 784 383; x_wconf 88' lang='eng' dir='ltr'>(U10871)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 353 386 1030 412; baseline 0 -5"><span class='ocrx_word' id='word_1_55' title='bbox 353 387 521 407; x_wconf 84' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_56' title='bbox 527 387 628 412; x_wconf 90' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_57' title='bbox 637 387 726 412; x_wconf 86' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_58' title='bbox 736 387 749 407; x_wconf 82' lang='eng'>8</span> <span class='ocrx_word' id='word_1_59' title='bbox 757 386 830 407; x_wconf 85' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_60' title='bbox 841 387 912 407; x_wconf 92' lang='eng'>17979</span> <span class='ocrx_word' id='word_1_61' title='bbox 922 387 1030 412; x_wconf 89' lang='eng'>(293439)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 358 416 1105 441; baseline 0 -5"><span class='ocrx_word' id='word_1_62' title='bbox 358 416 525 436; x_wconf 85' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_63' title='bbox 532 416 632 441; x_wconf 87' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_64' title='bbox 641 416 730 441; x_wconf 85' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_65' title='bbox 740 416 801 436; x_wconf 89' lang='eng' dir='ltr'>close</span> <span class='ocrx_word' id='word_1_66' title='bbox 810 417 831 436; x_wconf 86' lang='eng' dir='ltr'>to</span> <span class='ocrx_word' id='word_1_67' title='bbox 843 416 904 436; x_wconf 91' lang='eng' dir='ltr'>13TU</span> <span class='ocrx_word' id='word_1_68' title='bbox 916 416 987 436; x_wconf 89' lang='eng'>10090</span> <span class='ocrx_word' id='word_1_69' title='bbox 998 416 1105 441; x_wconf 84' lang='eng'>(293449)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 337 445 1117 470; baseline 0 -5"><span class='ocrx_word' id='word_1_70' title='bbox 337 445 505 465; x_wconf 77' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_71' title='bbox 511 445 612 470; x_wconf 87' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_72' title='bbox 621 445 710 470; x_wconf 89' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_73' title='bbox 720 445 819 465; x_wconf 86' lang='eng' dir='ltr'>between</span> <span class='ocrx_word' id='word_1_74' title='bbox 831 445 839 465; x_wconf 97' lang='eng'>1</span> <span class='ocrx_word' id='word_1_75' title='bbox 852 445 894 465; x_wconf 88' lang='eng' dir='ltr'>and</span> <span class='ocrx_word' id='word_1_76' title='bbox 905 445 917 465; x_wconf 86' lang='eng'>3</span> <span class='ocrx_word' id='word_1_77' title='bbox 929 445 1000 465; x_wconf 90' lang='eng'>10095</span> <span class='ocrx_word' id='word_1_78' title='bbox 1011 445 1117 470; x_wconf 89' lang='eng'>(293450)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 317 472 1090 644">
+     <span class='ocr_line' id='line_1_16' title="bbox 358 472 829 500; baseline 0 -6"><span class='ocrx_word' id='word_1_79' title='bbox 358 475 381 494; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_80' title='bbox 392 475 553 494; x_wconf 81' lang='eng' dir='ltr'>calcoaceticus</span> <span class='ocrx_word' id='word_1_81' title='bbox 563 474 619 494; x_wconf 94' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_82' title='bbox 629 472 714 494; x_wconf 87' lang='eng' dir='ltr'>30006T</span> <span class='ocrx_word' id='word_1_83' title='bbox 721 474 829 500; x_wconf 88' lang='eng' dir='ltr'>(X81661)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 341 500 1018 526; baseline 0 -5"><span class='ocrx_word' id='word_1_84' title='bbox 341 501 509 521; x_wconf 81' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_85' title='bbox 515 501 616 526; x_wconf 86' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_86' title='bbox 625 501 714 526; x_wconf 86' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_87' title='bbox 724 501 737 521; x_wconf 87' lang='eng'>3</span> <span class='ocrx_word' id='word_1_88' title='bbox 745 500 818 521; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_89' title='bbox 829 501 900 521; x_wconf 95' lang='eng'>17922</span> <span class='ocrx_word' id='word_1_90' title='bbox 910 501 1018 526; x_wconf 83' lang='eng'>(293436)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 398 530 1090 556; baseline 0 -6"><span class='ocrx_word' id='word_1_91' title='bbox 398 531 566 550; x_wconf 81' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_92' title='bbox 572 531 673 556; x_wconf 81' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_93' title='bbox 682 531 771 556; x_wconf 86' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_94' title='bbox 783 531 809 550; x_wconf 92' lang='eng'>10</span> <span class='ocrx_word' id='word_1_95' title='bbox 817 530 890 550; x_wconf 85' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_96' title='bbox 901 531 972 550; x_wconf 86' lang='eng'>17924</span> <span class='ocrx_word' id='word_1_97' title='bbox 983 530 1090 556; x_wconf 88' lang='eng'>(293443)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 392 560 1084 585; baseline -0.001 -5"><span class='ocrx_word' id='word_1_98' title='bbox 392 560 559 580; x_wconf 82' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_99' title='bbox 565 560 666 585; x_wconf 88' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_100' title='bbox 675 560 764 585; x_wconf 91' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_101' title='bbox 776 560 798 579; x_wconf 89' lang='eng'>11</span> <span class='ocrx_word' id='word_1_102' title='bbox 811 560 883 580; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_103' title='bbox 894 560 961 579; x_wconf 92' lang='eng'>11171</span> <span class='ocrx_word' id='word_1_104' title='bbox 975 560 1084 585; x_wconf 87' lang='eng' dir='ltr'>(X81659)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 317 587 797 621; baseline 0 -12"><span class='ocrx_word' id='word_1_105' title='bbox 317 608 326 621; x_wconf 64' lang='eng'>9</span> <span class='ocrx_word' id='word_1_106' title='bbox 349 589 372 609; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_107' title='bbox 383 589 587 609; x_wconf 86' lang='eng' dir='ltr'>baumanniiATCC</span> <span class='ocrx_word' id='word_1_108' title='bbox 598 587 681 609; x_wconf 83' lang='eng' dir='ltr'>19606T</span> <span class='ocrx_word' id='word_1_109' title='bbox 690 589 797 615; x_wconf 85' lang='eng'>(293435)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 322 619 1049 644; baseline 0 -5"><span class='ocrx_word' id='word_1_110' title='bbox 322 619 489 639; x_wconf 85' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_111' title='bbox 496 619 596 644; x_wconf 89' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_112' title='bbox 605 619 694 644; x_wconf 79' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_113' title='bbox 706 619 767 639; x_wconf 89' lang='eng' dir='ltr'>13TU</span> <span class='ocrx_word' id='word_1_114' title='bbox 777 619 849 639; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_115' title='bbox 861 619 932 639; x_wconf 89' lang='eng'>17903</span> <span class='ocrx_word' id='word_1_116' title='bbox 942 619 1049 644; x_wconf 86' lang='eng'>(293446)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 338 646 872 701">
+     <span class='ocr_line' id='line_1_22' title="bbox 524 646 872 673; baseline 0.003 -6"><span class='ocrx_word' id='word_1_117' title='bbox 524 648 547 667; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_118' title='bbox 559 648 643 673; x_wconf 87' lang='eng' dir='ltr'>gerneri</span> <span class='ocrx_word' id='word_1_119' title='bbox 650 646 723 668; x_wconf 79' lang='eng' dir='ltr'>9A01T</span> <span class='ocrx_word' id='word_1_120' title='bbox 732 648 872 673; x_wconf 87' lang='eng' dir='ltr'>(AF509829)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 338 673 709 701; baseline 0.003 -6"><span class='ocrx_word' id='word_1_121' title='bbox 338 676 360 695; x_wconf 95' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_122' title='bbox 368 676 499 701; x_wconf 85' lang='eng' dir='ltr'>juniiATCC</span> <span class='ocrx_word' id='word_1_123' title='bbox 510 673 593 696; x_wconf 91' lang='eng' dir='ltr'>17908T</span> <span class='ocrx_word' id='word_1_124' title='bbox 603 676 709 701; x_wconf 89' lang='eng'>(293438)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 244 704 1036 786">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 428 704 1036 786">
+     <span class='ocr_line' id='line_1_24' title="bbox 428 704 823 732; baseline 0 -6"><span class='ocrx_word' id='word_1_125' title='bbox 428 706 450 726; x_wconf 63' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_126' title='bbox 461 711 542 731; x_wconf 87' lang='eng' dir='ltr'><em>parvus</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 552 706 612 726; x_wconf 94' lang='eng' dir='ltr'>NIPH</span> <span class='ocrx_word' id='word_1_128' title='bbox 623 704 677 726; x_wconf 81' lang='eng' dir='ltr'>384T</span> <span class='ocrx_word' id='word_1_129' title='bbox 687 706 823 732; x_wconf 86' lang='eng' dir='ltr'>(AJ293691)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 628 731 1036 759; baseline 0 -6"><span class='ocrx_word' id='word_1_130' title='bbox 628 733 651 753; x_wconf 97' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_131' title='bbox 663 733 803 758; x_wconf 84' lang='eng' dir='ltr'>tjernbergiae</span> <span class='ocrx_word' id='word_1_132' title='bbox 813 731 886 753; x_wconf 78' lang='eng' dir='ltr'>7N16T</span> <span class='ocrx_word' id='word_1_133' title='bbox 896 733 1036 759; x_wconf 88' lang='eng' dir='ltr'>(AF509825)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 545 759 889 786; baseline 0 -5"><span class='ocrx_word' id='word_1_134' title='bbox 545 761 568 781; x_wconf 94' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_135' title='bbox 579 759 740 781; x_wconf 78' lang='eng' dir='ltr'>tandoii4N13T</span> <span class='ocrx_word' id='word_1_136' title='bbox 750 761 889 786; x_wconf 89' lang='eng' dir='ltr'>(AF509830)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 0 69 491 1079">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 0 69 491 1079">
+     <span class='ocr_line' id='line_1_27' title="bbox 98 69 491 102; baseline 0 -22"><span class='ocrx_word' id='word_1_137' title='bbox 98 69 491 102; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 0 102 359 134; baseline 0 0"><span class='ocrx_word' id='word_1_138' title='bbox 0 102 359 134; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 0 134 310 159; baseline 0 979"><span class='ocrx_word' id='word_1_139' title='bbox 0 134 310 159; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 0 159 286 190; baseline 0 948"><span class='ocrx_word' id='word_1_140' title='bbox 0 159 286 190; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 3 190 283 215; baseline 0 923"><span class='ocrx_word' id='word_1_141' title='bbox 3 190 283 215; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 3 215 283 252; baseline 0 886"><span class='ocrx_word' id='word_1_142' title='bbox 3 215 283 252; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 0 252 286 274; baseline 0 864"><span class='ocrx_word' id='word_1_143' title='bbox 0 252 286 274; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 0 274 287 300; baseline 0 838"><span class='ocrx_word' id='word_1_144' title='bbox 0 274 287 300; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 0 300 287 336; baseline 0 802"><span class='ocrx_word' id='word_1_145' title='bbox 0 300 287 336; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 0 336 380 367; baseline 0 771"><span class='ocrx_word' id='word_1_146' title='bbox 0 336 380 367; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 0 367 350 396; baseline 0 742"><span class='ocrx_word' id='word_1_147' title='bbox 0 367 350 396; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 0 396 350 425; baseline 0 713"><span class='ocrx_word' id='word_1_148' title='bbox 0 396 350 425; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 0 425 334 453; baseline 0 685"><span class='ocrx_word' id='word_1_149' title='bbox 0 425 334 453; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 0 453 337 482; baseline 0 656"><span class='ocrx_word' id='word_1_150' title='bbox 0 453 337 482; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 0 482 336 514; baseline 0 624"><span class='ocrx_word' id='word_1_151' title='bbox 0 482 336 514; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 0 514 341 539; baseline 0 599"><span class='ocrx_word' id='word_1_152' title='bbox 0 514 341 539; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 0 539 388 573; baseline 0 -2"><span class='ocrx_word' id='word_1_153' title='bbox 0 539 388 573; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_44' title="bbox 0 573 321 597; baseline 0 0"><span class='ocrx_word' id='word_1_154' title='bbox 0 573 321 597; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_45' title="bbox 0 597 317 629; baseline 0 509"><span class='ocrx_word' id='word_1_155' title='bbox 0 597 317 629; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 0 629 317 677; baseline 0 0"><span class='ocrx_word' id='word_1_156' title='bbox 0 629 317 677; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 0 677 244 798; baseline 0 0"><span class='ocrx_word' id='word_1_157' title='bbox 0 677 244 798; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 0 798 417 834; baseline 0 0"><span class='ocrx_word' id='word_1_158' title='bbox 0 798 417 834; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_49' title="bbox 0 834 386 858; baseline 0 280"><span class='ocrx_word' id='word_1_159' title='bbox 0 834 386 858; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 0 858 389 939; baseline 0 0"><span class='ocrx_word' id='word_1_160' title='bbox 0 858 389 939; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 0 939 287 1059; baseline 0 -21"><span class='ocrx_word' id='word_1_161' title='bbox 0 939 287 1059; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 0 1059 82 1079; baseline 0 59"><span class='ocrx_word' id='word_1_162' title='bbox 0 1059 82 1079; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 226 303 228 334">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 226 303 228 334">
+     <span class='ocr_line' id='line_1_53' title="bbox 226 303 228 334; baseline 0 804"><span class='ocrx_word' id='word_1_163' title='bbox 226 303 228 334; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 82 820 1122 1079">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 389 821 1001 932">
+     <span class='ocr_line' id='line_1_54' title="bbox 421 821 1001 846; baseline 0 -5"><span class='ocrx_word' id='word_1_164' title='bbox 421 821 588 841; x_wconf 84' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_165' title='bbox 595 821 695 846; x_wconf 88' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_166' title='bbox 704 821 794 846; x_wconf 88' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_167' title='bbox 805 821 831 841; x_wconf 93' lang='eng'>17</span> <span class='ocrx_word' id='word_1_168' title='bbox 841 821 883 841; x_wconf 86' lang='eng'>942</span> <span class='ocrx_word' id='word_1_169' title='bbox 894 821 1001 846; x_wconf 87' lang='eng'>(293454)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 389 847 1001 873; baseline 0 -6"><span class='ocrx_word' id='word_1_170' title='bbox 389 847 557 867; x_wconf 81' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_171' title='bbox 563 847 664 873; x_wconf 87' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_172' title='bbox 673 847 762 872; x_wconf 89' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_173' title='bbox 774 847 830 867; x_wconf 90' lang='eng' dir='ltr'>14BJ</span> <span class='ocrx_word' id='word_1_174' title='bbox 841 847 883 867; x_wconf 87' lang='eng'>382</span> <span class='ocrx_word' id='word_1_175' title='bbox 894 847 1001 873; x_wconf 89' lang='eng'>(293453)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 457 877 890 905; baseline 0 -6"><span class='ocrx_word' id='word_1_176' title='bbox 457 880 480 899; x_wconf 69' lang='eng' dir='ltr'><em>A,</em></span> <span class='ocrx_word' id='word_1_177' title='bbox 492 880 605 899; x_wconf 85' lang='eng' dir='ltr'>schind/eri</span> <span class='ocrx_word' id='word_1_178' title='bbox 614 880 664 899; x_wconf 97' lang='eng' dir='ltr'>LUH</span> <span class='ocrx_word' id='word_1_179' title='bbox 675 877 744 899; x_wconf 80' lang='eng' dir='ltr'>5832T</span> <span class='ocrx_word' id='word_1_180' title='bbox 754 879 890 905; x_wconf 87' lang='eng' dir='ltr'>(AJ278311)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 520 905 877 932; baseline 0 -5"><span class='ocrx_word' id='word_1_181' title='bbox 520 907 543 927; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_182' title='bbox 554 907 648 927; x_wconf 78' lang='eng' dir='ltr'>bouvetii</span> <span class='ocrx_word' id='word_1_183' title='bbox 654 905 727 927; x_wconf 88' lang='eng' dir='ltr'>4B02T</span> <span class='ocrx_word' id='word_1_184' title='bbox 737 907 877 932; x_wconf 88' lang='eng' dir='ltr'>(AF509827)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 381 934 811 961">
+     <span class='ocr_line' id='line_1_58' title="bbox 381 934 811 961; baseline 0 -5"><span class='ocrx_word' id='word_1_185' title='bbox 381 936 403 956; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_186' title='bbox 411 936 521 961; x_wconf 85' lang='eng' dir='ltr'>johnsonii</span> <span class='ocrx_word' id='word_1_187' title='bbox 528 936 600 956; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_188' title='bbox 611 934 694 956; x_wconf 85' lang='eng' dir='ltr'>17909T</span> <span class='ocrx_word' id='word_1_189' title='bbox 704 936 811 961; x_wconf 89' lang='eng'>(293440)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 287 963 1096 1029">
+     <span class='ocr_line' id='line_1_59' title="bbox 390 963 871 991; baseline 0 -6"><span class='ocrx_word' id='word_1_190' title='bbox 390 966 412 985; x_wconf 92' lang='eng' dir='ltr'>A.</span> <span class='ocrx_word' id='word_1_191' title='bbox 424 966 580 991; x_wconf 81' lang='eng' dir='ltr'>haemo/yticus</span> <span class='ocrx_word' id='word_1_192' title='bbox 588 965 660 985; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_193' title='bbox 672 963 754 985; x_wconf 80' lang='eng' dir='ltr'>17906T</span> <span class='ocrx_word' id='word_1_194' title='bbox 764 965 871 991; x_wconf 88' lang='eng'>(293437)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 287 969 1096 1029; baseline 0 -15"><span class='ocrx_word' id='word_1_195' title='bbox 287 969 397 1029; x_wconf 39' lang='eng'>4%</span> <span class='ocrx_word' id='word_1_196' title='bbox 405 995 573 1014; x_wconf 80' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_197' title='bbox 579 995 680 1020; x_wconf 87' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_198' title='bbox 688 995 778 1019; x_wconf 81' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_199' title='bbox 789 995 815 1014; x_wconf 89' lang='eng'>16</span> <span class='ocrx_word' id='word_1_200' title='bbox 824 994 896 1014; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_201' title='bbox 908 995 979 1014; x_wconf 90' lang='eng'>17988</span> <span class='ocrx_word' id='word_1_202' title='bbox 989 994 1096 1020; x_wconf 88' lang='eng'>(293451)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 82 1024 1122 1078">
+     <span class='ocr_line' id='line_1_61' title="bbox 392 1024 988 1049; baseline 0 -5"><span class='ocrx_word' id='word_1_203' title='bbox 392 1024 559 1044; x_wconf 77' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_204' title='bbox 565 1024 666 1049; x_wconf 90' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_205' title='bbox 675 1024 764 1049; x_wconf 87' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_206' title='bbox 776 1024 832 1044; x_wconf 88' lang='eng' dir='ltr'>15BJ</span> <span class='ocrx_word' id='word_1_207' title='bbox 843 1024 871 1044; x_wconf 96' lang='eng'>79</span> <span class='ocrx_word' id='word_1_208' title='bbox 881 1024 988 1049; x_wconf 88' lang='eng'>(293452)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 82 1051 1122 1078; baseline 0 -5"><span class='ocrx_word' id='word_1_209' title='bbox 82 1054 449 1056; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_210' title='bbox 457 1053 610 1078; x_wconf 81' lang='eng' dir='ltr'>Alkanindiges</span> <span class='ocrx_word' id='word_1_211' title='bbox 619 1053 754 1073; x_wconf 88' lang='eng' dir='ltr'>i/Iinoisensis</span> <span class='ocrx_word' id='word_1_212' title='bbox 763 1053 805 1073; x_wconf 88' lang='eng' dir='ltr'>GTI</span> <span class='ocrx_word' id='word_1_213' title='bbox 816 1053 890 1073; x_wconf 93' lang='eng' dir='ltr'>MVAB</span> <span class='ocrx_word' id='word_1_214' title='bbox 901 1051 972 1073; x_wconf 91' lang='eng' dir='ltr'>Hex1T</span> <span class='ocrx_word' id='word_1_215' title='bbox 982 1053 1122 1078; x_wconf 88' lang='eng' dir='ltr'>(AF513979)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 82 1076 1118 1116">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 82 1076 1118 1115">
+     <span class='ocr_line' id='line_1_63' title="bbox 85 1076 113 1089; baseline 0 0"><span class='ocrx_word' id='word_1_216' title='bbox 85 1076 113 1089; x_wconf 86' lang='eng'>100</span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 82 1083 1118 1115; baseline 0 0"><span class='ocrx_word' id='word_1_217' title='bbox 82 1083 1118 1115; x_wconf 46' lang='eng' dir='ltr'><strong>J</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 898 1109 1122 1129">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 898 1109 1122 1129">
+     <span class='ocr_line' id='line_1_65' title="bbox 898 1109 1122 1129; baseline 0 0"><span class='ocrx_word' id='word_1_218' title='bbox 898 1109 1012 1129; x_wconf 86' lang='eng' dir='ltr'>Moraxe/la</span> <span class='ocrx_word' id='word_1_219' title='bbox 1022 1109 1122 1129; x_wconf 83' lang='eng' dir='ltr'>lacunata</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 242 730 244 869">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 242 730 244 869">
+     <span class='ocr_line' id='line_1_66' title="bbox 242 730 244 869; baseline 0 269"><span class='ocrx_word' id='word_1_220' title='bbox 242 730 244 869; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 285 926 287 991">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 285 926 287 991">
+     <span class='ocr_line' id='line_1_67' title="bbox 285 926 287 991; baseline 0 147"><span class='ocrx_word' id='word_1_221' title='bbox 285 926 287 991; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 80 1054 82 1100">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 80 1054 82 1100">
+     <span class='ocr_line' id='line_1_68' title="bbox 80 1054 82 1100; baseline 0 38"><span class='ocrx_word' id='word_1_222' title='bbox 80 1054 82 1100; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 421 791 1217 818">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 421 792 1217 817">
+     <span class='ocr_line' id='line_1_69' title="bbox 421 792 1217 817; baseline -0.001 -5"><span class='ocrx_word' id='word_1_223' title='bbox 421 792 588 812; x_wconf 85' lang='eng' dir='ltr'>Acinetobacter</span> <span class='ocrx_word' id='word_1_224' title='bbox 595 792 695 817; x_wconf 89' lang='eng' dir='ltr'>genomic</span> <span class='ocrx_word' id='word_1_225' title='bbox 704 792 794 817; x_wconf 85' lang='eng' dir='ltr'>species</span> <span class='ocrx_word' id='word_1_226' title='bbox 805 792 935 812; x_wconf 89' lang='eng' dir='ltr'>13BJ/14TU</span> <span class='ocrx_word' id='word_1_227' title='bbox 945 792 1018 812; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_228' title='bbox 1029 792 1100 812; x_wconf 90' lang='eng'>17905</span> <span class='ocrx_word' id='word_1_229' title='bbox 1110 792 1217 817; x_wconf 92' lang='eng'>(293447)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 1129 1076 1714 1134">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 1129 1076 1714 1134">
+     <span class='ocr_line' id='line_1_70' title="bbox 1129 1076 1714 1104; baseline 0 -6"><span class='ocrx_word' id='word_1_230' title='bbox 1129 1079 1302 1104; x_wconf 82' lang='eng' dir='ltr'>Psychrobacter</span> <span class='ocrx_word' id='word_1_231' title='bbox 1308 1079 1420 1098; x_wconf 85' lang='eng' dir='ltr'>immobilis</span> <span class='ocrx_word' id='word_1_232' title='bbox 1428 1078 1500 1098; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_233' title='bbox 1509 1079 1549 1098; x_wconf 90' lang='eng'>431</span> <span class='ocrx_word' id='word_1_234' title='bbox 1557 1076 1594 1098; x_wconf 79' lang='eng' dir='ltr'>1ST</span> <span class='ocrx_word' id='word_1_235' title='bbox 1604 1078 1714 1104; x_wconf 85' lang='eng' dir='ltr'>(U39399)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_71' title="bbox 1131 1107 1446 1134; baseline 0 -5"><span class='ocrx_word' id='word_1_236' title='bbox 1131 1109 1203 1129; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_237' title='bbox 1214 1107 1297 1129; x_wconf 84' lang='eng' dir='ltr'>17967T</span> <span class='ocrx_word' id='word_1_238' title='bbox 1307 1109 1446 1134; x_wconf 85' lang='eng' dir='ltr'>(AF005160)</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/hocr-tesseract-ijsem-140/tree-checking.xls b/examples/hocr-tesseract-ijsem-140/tree-checking.xls
new file mode 100644
index 00000000..04ec9606
Binary files /dev/null and b/examples/hocr-tesseract-ijsem-140/tree-checking.xls differ
diff --git a/examples/ijs.0.003566-0-000.pbm.png b/examples/ijs.0.003566-0-000.pbm.png
new file mode 100644
index 00000000..79550c10
Binary files /dev/null and b/examples/ijs.0.003566-0-000.pbm.png differ
diff --git a/examples/ijs.0.003566-0-000.pbm.png.hocr b/examples/ijs.0.003566-0-000.pbm.png.hocr
new file mode 100644
index 00000000..6e71cb8a
--- /dev/null
+++ b/examples/ijs.0.003566-0-000.pbm.png.hocr
@@ -0,0 +1,128 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003566-0-000.pbm.png"; bbox 0 0 1065 592; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 3 36 1064 550">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 3 36 1064 550">
+     <span class='ocr_line' id='line_1_1' title="bbox 172 36 872 63; baseline -0.003 -2"><span class='ocrx_word' id='word_1_1' title='bbox 172 47 194 61; x_wconf 78' lang='eng'>95</span> <span class='ocrx_word' id='word_1_2' title='bbox 244 38 420 59; x_wconf 79' lang='eng' dir='ltr'>Coral/ococcus</span> <span class='ocrx_word' id='word_1_3' title='bbox 430 39 562 59; x_wconf 82' lang='eng' dir='ltr'>coral/oides</span> <span class='ocrx_word' id='word_1_4' title='bbox 572 38 631 59; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_5' title='bbox 643 37 716 59; x_wconf 87' lang='eng' dir='ltr'>2259T</span> <span class='ocrx_word' id='word_1_6' title='bbox 726 36 790 63; x_wconf 85' lang='eng' dir='ltr'>(AJ81</span> <span class='ocrx_word' id='word_1_7' title='bbox 800 36 872 63; x_wconf 87' lang='eng'>1588)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 108 71 866 97; baseline -0.001 -3"><span class='ocrx_word' id='word_1_8' title='bbox 108 83 129 97; x_wconf 75' lang='eng'>59</span> <span class='ocrx_word' id='word_1_9' title='bbox 230 73 406 94; x_wconf 85' lang='eng' dir='ltr'>Cora/lococcus</span> <span class='ocrx_word' id='word_1_10' title='bbox 416 73 548 94; x_wconf 80' lang='eng' dir='ltr'>coral/aides</span> <span class='ocrx_word' id='word_1_11' title='bbox 559 73 617 94; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_12' title='bbox 629 74 709 94; x_wconf 93' lang='eng'>51547</span> <span class='ocrx_word' id='word_1_13' title='bbox 720 71 784 97; x_wconf 91' lang='eng' dir='ltr'>(AJ81</span> <span class='ocrx_word' id='word_1_14' title='bbox 794 71 866 97; x_wconf 85' lang='eng'>1592)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 161 105 873 132; baseline -0.003 -2"><span class='ocrx_word' id='word_1_15' title='bbox 161 116 222 130; x_wconf 85' lang='eng'>96—</span> <span class='ocrx_word' id='word_1_16' title='bbox 237 107 413 128; x_wconf 81' lang='eng' dir='ltr'>Cora/Iococcus</span> <span class='ocrx_word' id='word_1_17' title='bbox 423 108 555 128; x_wconf 76' lang='eng' dir='ltr'>coral/aides</span> <span class='ocrx_word' id='word_1_18' title='bbox 566 108 624 128; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_19' title='bbox 636 108 716 128; x_wconf 88' lang='eng'>52500</span> <span class='ocrx_word' id='word_1_20' title='bbox 727 105 791 132; x_wconf 89' lang='eng' dir='ltr'>(AJ81</span> <span class='ocrx_word' id='word_1_21' title='bbox 801 105 873 132; x_wconf 85' lang='eng'>1612)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 80 140 875 167; baseline 0 -4"><span class='ocrx_word' id='word_1_22' title='bbox 80 140 101 154; x_wconf 63' lang='eng'>84</span> <span class='ocrx_word' id='word_1_23' title='bbox 190 152 222 154; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_24' title='bbox 239 142 415 163; x_wconf 84' lang='eng' dir='ltr'>Cora/lococcus</span> <span class='ocrx_word' id='word_1_25' title='bbox 425 142 557 163; x_wconf 79' lang='eng' dir='ltr'>coral/aides</span> <span class='ocrx_word' id='word_1_26' title='bbox 568 142 626 163; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_27' title='bbox 638 143 718 163; x_wconf 89' lang='eng'>51620</span> <span class='ocrx_word' id='word_1_28' title='bbox 729 140 793 167; x_wconf 91' lang='eng' dir='ltr'>(AJ81</span> <span class='ocrx_word' id='word_1_29' title='bbox 804 140 875 167; x_wconf 87' lang='eng'>1608)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 144 175 780 202; baseline -0.002 -4"><span class='ocrx_word' id='word_1_30' title='bbox 144 177 320 198; x_wconf 83' lang='eng' dir='ltr'>Coral/ococcus</span> <span class='ocrx_word' id='word_1_31' title='bbox 330 177 462 198; x_wconf 81' lang='eng' dir='ltr'>coral/aides</span> <span class='ocrx_word' id='word_1_32' title='bbox 472 177 531 198; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_33' title='bbox 543 178 624 198; x_wconf 90' lang='eng'>51408</span> <span class='ocrx_word' id='word_1_34' title='bbox 634 175 698 202; x_wconf 86' lang='eng' dir='ltr'>(AJ81</span> <span class='ocrx_word' id='word_1_35' title='bbox 708 175 780 202; x_wconf 89' lang='eng'>1615)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 24 209 792 240; baseline 0 -8"><span class='ocrx_word' id='word_1_36' title='bbox 24 226 46 240; x_wconf 69' lang='eng'>99</span> <span class='ocrx_word' id='word_1_37' title='bbox 95 210 117 224; x_wconf 69' lang='eng'>54</span> <span class='ocrx_word' id='word_1_38' title='bbox 156 211 332 232; x_wconf 81' lang='eng' dir='ltr'>Cora/lococcus</span> <span class='ocrx_word' id='word_1_39' title='bbox 342 212 474 232; x_wconf 82' lang='eng' dir='ltr'>coral/oides</span> <span class='ocrx_word' id='word_1_40' title='bbox 484 211 543 232; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_41' title='bbox 555 212 635 232; x_wconf 86' lang='eng'>51433</span> <span class='ocrx_word' id='word_1_42' title='bbox 646 209 710 236; x_wconf 90' lang='eng' dir='ltr'>(AJ81</span> <span class='ocrx_word' id='word_1_43' title='bbox 720 209 792 236; x_wconf 87' lang='eng'>1616)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 3 244 865 273; baseline -0.005 -3"><span class='ocrx_word' id='word_1_44' title='bbox 3 247 51 249; x_wconf 86' lang='eng'>—</span> <span class='ocrx_word' id='word_1_45' title='bbox 163 255 185 269; x_wconf 74' lang='eng' dir='ltr'>as</span> <span class='ocrx_word' id='word_1_46' title='bbox 262 246 414 273; x_wconf 79' lang='eng' dir='ltr'>Myxococcus</span> <span class='ocrx_word' id='word_1_47' title='bbox 424 246 532 273; x_wconf 78' lang='eng' dir='ltr'>stipitatus</span> <span class='ocrx_word' id='word_1_48' title='bbox 543 246 602 267; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_49' title='bbox 615 247 694 267; x_wconf 88' lang='eng'>14675</span> <span class='ocrx_word' id='word_1_50' title='bbox 704 244 817 271; x_wconf 83' lang='eng' dir='ltr'>(DO7681</span> <span class='ocrx_word' id='word_1_51' title='bbox 827 244 865 271; x_wconf 90' lang='eng'>18)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 192 279 797 308; baseline 0 -6"><span class='ocrx_word' id='word_1_52' title='bbox 192 290 204 292; x_wconf 94' lang='eng'><em>-</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 211 281 363 308; x_wconf 73' lang='eng' dir='ltr'>Myxococcus</span> <span class='ocrx_word' id='word_1_54' title='bbox 373 281 443 302; x_wconf 78' lang='eng' dir='ltr'>Iu/vus</span> <span class='ocrx_word' id='word_1_55' title='bbox 452 281 526 302; x_wconf 91' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_56' title='bbox 537 279 797 306; x_wconf 70' lang='eng' dir='ltr'>25199T(DQ768117)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 114 313 936 343; baseline 0 -7"><span class='ocrx_word' id='word_1_57' title='bbox 114 325 136 339; x_wconf 77' lang='eng'>95</span> <span class='ocrx_word' id='word_1_58' title='bbox 328 316 480 343; x_wconf 73' lang='eng' dir='ltr'>Myxococcus</span> <span class='ocrx_word' id='word_1_59' title='bbox 488 316 583 336; x_wconf 79' lang='eng' dir='ltr'>xanthus</span> <span class='ocrx_word' id='word_1_60' title='bbox 592 316 665 336; x_wconf 87' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_61' title='bbox 676 314 766 336; x_wconf 82' lang='eng' dir='ltr'>25232T</span> <span class='ocrx_word' id='word_1_62' title='bbox 776 313 888 340; x_wconf 86' lang='eng' dir='ltr'>(DO7681</span> <span class='ocrx_word' id='word_1_63' title='bbox 898 313 936 340; x_wconf 86' lang='eng'>16)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 275 348 936 377; baseline 0 -6"><span class='ocrx_word' id='word_1_64' title='bbox 275 350 297 364; x_wconf 81' lang='eng'>97</span> <span class='ocrx_word' id='word_1_65' title='bbox 322 350 474 377; x_wconf 76' lang='eng' dir='ltr'>Myxococcus</span> <span class='ocrx_word' id='word_1_66' title='bbox 484 350 611 371; x_wconf 81' lang='eng' dir='ltr'>flavescens</span> <span class='ocrx_word' id='word_1_67' title='bbox 622 350 681 371; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_68' title='bbox 692 349 766 371; x_wconf 78' lang='eng' dir='ltr'>4946T</span> <span class='ocrx_word' id='word_1_69' title='bbox 776 348 936 375; x_wconf 84' lang='eng' dir='ltr'>(DO768130)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 210 380 968 412; baseline -0.001 -6"><span class='ocrx_word' id='word_1_70' title='bbox 210 380 243 394; x_wconf 63' lang='eng'>10°</span> <span class='ocrx_word' id='word_1_71' title='bbox 320 385 472 412; x_wconf 76' lang='eng' dir='ltr'>Myxococcus</span> <span class='ocrx_word' id='word_1_72' title='bbox 483 385 597 406; x_wconf 85' lang='eng' dir='ltr'>virescens</span> <span class='ocrx_word' id='word_1_73' title='bbox 607 385 686 406; x_wconf 90' lang='eng' dir='ltr'>NBRC</span> <span class='ocrx_word' id='word_1_74' title='bbox 698 384 803 406; x_wconf 76' lang='eng' dir='ltr'>100334T</span> <span class='ocrx_word' id='word_1_75' title='bbox 813 383 968 409; x_wconf 89' lang='eng' dir='ltr'>(AB218225)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 267 417 954 446; baseline 0 -6"><span class='ocrx_word' id='word_1_76' title='bbox 267 417 457 444; x_wconf 86' lang='eng' dir='ltr'>[Coral/ococcus]</span> <span class='ocrx_word' id='word_1_77' title='bbox 469 426 626 446; x_wconf 83' lang='eng' dir='ltr'>macrosporus</span> <span class='ocrx_word' id='word_1_78' title='bbox 637 419 696 440; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_79' title='bbox 709 418 798 440; x_wconf 73' lang='eng' dir='ltr'>14697T</span> <span class='ocrx_word' id='word_1_80' title='bbox 808 417 872 444; x_wconf 89' lang='eng' dir='ltr'>(AJ81</span> <span class='ocrx_word' id='word_1_81' title='bbox 882 417 954 444; x_wconf 84' lang='eng'>1623)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 103 452 897 481; baseline 0 -6"><span class='ocrx_word' id='word_1_82' title='bbox 103 464 124 478; x_wconf 82' lang='eng'>97</span> <span class='ocrx_word' id='word_1_83' title='bbox 133 464 327 466; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_84' title='bbox 345 454 493 481; x_wconf 82' lang='eng' dir='ltr'>Cystobacter</span> <span class='ocrx_word' id='word_1_85' title='bbox 501 454 580 475; x_wconf 83' lang='eng' dir='ltr'>fuscus</span> <span class='ocrx_word' id='word_1_86' title='bbox 589 454 663 475; x_wconf 89' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_87' title='bbox 673 453 764 475; x_wconf 80' lang='eng' dir='ltr'>25194T</span> <span class='ocrx_word' id='word_1_88' title='bbox 773 452 897 479; x_wconf 87' lang='eng' dir='ltr'>(M94276)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 3 486 899 516; baseline 0.001 -8"><span class='ocrx_word' id='word_1_89' title='bbox 3 488 51 508; x_wconf 77' lang='eng'>1_00</span> <span class='ocrx_word' id='word_1_90' title='bbox 132 498 282 501; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_91' title='bbox 292 489 439 515; x_wconf 81' lang='eng' dir='ltr'>Archangium</span> <span class='ocrx_word' id='word_1_92' title='bbox 448 489 546 516; x_wconf 85' lang='eng' dir='ltr'>gephyra</span> <span class='ocrx_word' id='word_1_93' title='bbox 555 489 628 509; x_wconf 88' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_94' title='bbox 639 487 729 509; x_wconf 90' lang='eng' dir='ltr'>25201T</span> <span class='ocrx_word' id='word_1_95' title='bbox 738 486 899 514; x_wconf 87' lang='eng' dir='ltr'>(DQ768106)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 54 521 1064 550; baseline 0 -6"><span class='ocrx_word' id='word_1_96' title='bbox 54 533 430 535; x_wconf 94' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_97' title='bbox 442 523 576 550; x_wconf 69' lang='eng' dir='ltr'>Stigmata/la</span> <span class='ocrx_word' id='word_1_98' title='bbox 586 523 710 544; x_wconf 83' lang='eng' dir='ltr'>aurantiaca</span> <span class='ocrx_word' id='word_1_99' title='bbox 719 523 793 544; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_100' title='bbox 804 522 894 544; x_wconf 85' lang='eng' dir='ltr'>25190T</span> <span class='ocrx_word' id='word_1_101' title='bbox 904 521 1064 548; x_wconf 85' lang='eng' dir='ltr'>(DO768127)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 136 1 861 85">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 136 1 861 85">
+     <span class='ocr_line' id='line_1_16' title="bbox 136 1 861 85; baseline 0 -60"><span class='ocrx_word' id='word_1_102' title='bbox 136 12 244 85; x_wconf 40' lang='eng'>474‘?</span> <span class='ocrx_word' id='word_1_103' title='bbox 255 4 431 25; x_wconf 80' lang='eng' dir='ltr'>Coral/ococcus</span> <span class='ocrx_word' id='word_1_104' title='bbox 442 4 534 31; x_wconf 72' lang='eng' dir='ltr'>exiguus</span> <span class='ocrx_word' id='word_1_105' title='bbox 545 4 604 25; x_wconf 91' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_106' title='bbox 617 2 706 25; x_wconf 75' lang='eng' dir='ltr'>14696T</span> <span class='ocrx_word' id='word_1_107' title='bbox 715 1 779 28; x_wconf 75' lang='eng' dir='ltr'>(A181</span> <span class='ocrx_word' id='word_1_108' title='bbox 789 1 861 28; x_wconf 89' lang='eng'>1598)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 134 66 136 137">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 134 66 136 137">
+     <span class='ocr_line' id='line_1_17' title="bbox 134 66 136 137; baseline 0 455"><span class='ocrx_word' id='word_1_109' title='bbox 134 66 136 137; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 134 135 190 137">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 134 135 190 137">
+     <span class='ocr_line' id='line_1_18' title="bbox 134 135 190 137; baseline 0 455"><span class='ocrx_word' id='word_1_110' title='bbox 134 135 190 137; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 192 256 256 258">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 192 256 256 258">
+     <span class='ocr_line' id='line_1_19' title="bbox 192 256 256 258; baseline 0 334"><span class='ocrx_word' id='word_1_111' title='bbox 192 256 256 258; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 188 117 192 292">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 188 117 192 292">
+     <span class='ocr_line' id='line_1_20' title="bbox 188 117 192 292; baseline 0 300"><span class='ocrx_word' id='word_1_112' title='bbox 188 117 192 292; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 138 273 192 275">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 138 273 192 275">
+     <span class='ocr_line' id='line_1_21' title="bbox 138 273 192 275; baseline 0 317"><span class='ocrx_word' id='word_1_113' title='bbox 138 273 192 275; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 52 348 140 350">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 52 348 140 350">
+     <span class='ocr_line' id='line_1_22' title="bbox 52 348 140 350; baseline 0 242"><span class='ocrx_word' id='word_1_114' title='bbox 52 348 140 350; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 138 273 140 402">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 138 273 140 402">
+     <span class='ocr_line' id='line_1_23' title="bbox 138 273 140 402; baseline 0 190"><span class='ocrx_word' id='word_1_115' title='bbox 138 273 140 402; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 52 481 133 483">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 52 481 133 483">
+     <span class='ocr_line' id='line_1_24' title="bbox 52 481 133 483; baseline 0 109"><span class='ocrx_word' id='word_1_116' title='bbox 52 481 133 483; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 1 247 3 508">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 1 247 3 508">
+     <span class='ocr_line' id='line_1_25' title="bbox 1 247 3 508; baseline 0 84"><span class='ocrx_word' id='word_1_117' title='bbox 1 247 3 508; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 131 464 133 500">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 131 464 133 500">
+     <span class='ocr_line' id='line_1_26' title="bbox 131 464 133 500; baseline 0 92"><span class='ocrx_word' id='word_1_118' title='bbox 131 464 133 500; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 52 157 54 535">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 52 157 54 535">
+     <span class='ocr_line' id='line_1_27' title="bbox 52 157 54 535; baseline 0 57"><span class='ocrx_word' id='word_1_119' title='bbox 52 157 54 535; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 158 561 197 578">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 158 561 197 578">
+     <span class='ocr_line' id='line_1_28' title="bbox 158 561 197 578; baseline 0 0"><span class='ocrx_word' id='word_1_120' title='bbox 158 561 169 578; x_wconf 81' lang='eng'>2</span> <span class='ocrx_word' id='word_1_121' title='bbox 177 561 197 578; x_wconf 76' lang='eng' dir='ltr'>0/o</span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003616-0-000.pbm.png b/examples/ijs.0.003616-0-000.pbm.png
new file mode 100644
index 00000000..08effd5e
Binary files /dev/null and b/examples/ijs.0.003616-0-000.pbm.png differ
diff --git a/examples/ijs.0.003616-0-000.pbm.png.hocr b/examples/ijs.0.003616-0-000.pbm.png.hocr
new file mode 100644
index 00000000..2646197e
--- /dev/null
+++ b/examples/ijs.0.003616-0-000.pbm.png.hocr
@@ -0,0 +1,94 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003616-0-000.pbm.png"; bbox 0 0 1183 773; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 214 1 1182 772">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 214 1 1182 565">
+     <span class='ocr_line' id='line_1_1' title="bbox 214 1 1032 30; baseline -0.001 -5"><span class='ocrx_word' id='word_1_1' title='bbox 214 5 267 25; x_wconf 77' lang='eng'><em>100*</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 436 1 603 25; x_wconf 85' lang='eng' dir='ltr'><em>Carnimonas</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 613 1 753 30; x_wconf 85' lang='eng' dir='ltr'><em>nigrificans</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 764 1 1032 30; x_wconf 84' lang='eng' dir='ltr'><em>CTCBS1T(Y13299)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 411 42 1053 71; baseline -0.002 -5"><span class='ocrx_word' id='word_1_5' title='bbox 411 43 638 66; x_wconf 84' lang='eng' dir='ltr'><em>Modicisa/ibacter</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 646 43 791 66; x_wconf 83' lang='eng' dir='ltr'><em>tunisiensis</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 803 43 875 65; x_wconf 95' lang='eng' dir='ltr'><em>LIT2T</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 883 42 1053 71; x_wconf 81' lang='eng' dir='ltr'><em>(DQS41495)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 417 84 1036 112; baseline 0.002 -6"><span class='ocrx_word' id='word_1_9' title='bbox 417 84 627 112; x_wconf 86' lang='eng' dir='ltr'><em>Marinospiril/um</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 637 84 802 112; x_wconf 88' lang='eng' dir='ltr'><em>megaterium</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 814 84 863 106; x_wconf 91' lang='eng' dir='ltr'><em>H7T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 871 84 1036 112; x_wconf 81' lang='eng' dir='ltr'><em>(A8006770)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 384 125 995 154; baseline 0 -6"><span class='ocrx_word' id='word_1_13' title='bbox 384 125 594 154; x_wconf 86' lang='eng' dir='ltr'><em>Marinospirillum</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 604 125 766 154; x_wconf 87' lang='eng' dir='ltr'><em>alka/iphilum</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 776 125 824 148; x_wconf 90' lang='eng' dir='ltr'><em>Z4T</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 832 125 963 154; x_wconf 89' lang='eng' dir='ltr'><em>(AF27571</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 971 125 995 154; x_wconf 90' lang='eng'>3)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 373 166 1022 195; baseline 0 -6"><span class='ocrx_word' id='word_1_18' title='bbox 373 166 596 195; x_wconf 86' lang='eng' dir='ltr'><em>Oceanospiri/Ium</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 606 166 679 189; x_wconf 90' lang='eng' dir='ltr'><em>linum</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 689 166 772 189; x_wconf 92' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 786 166 883 189; x_wconf 85' lang='eng' dir='ltr'><em>11336T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 891 166 1022 195; x_wconf 88' lang='eng' dir='ltr'><em>(M22365)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 369 207 1091 236; baseline 0 -6"><span class='ocrx_word' id='word_1_23' title='bbox 369 207 592 236; x_wconf 86' lang='eng' dir='ltr'><em>Oceanospirillum</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 602 207 750 236; x_wconf 83' lang='eng' dir='ltr'><em>beijerinckii</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 760 207 807 231; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 822 207 918 231; x_wconf 90' lang='eng' dir='ltr'><em>15445T</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 927 207 1091 236; x_wconf 87' lang='eng' dir='ltr'><em>(AB006760)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 334 248 994 277; baseline 0.002 -6"><span class='ocrx_word' id='word_1_28' title='bbox 334 248 562 272; x_wconf 83' lang='eng' dir='ltr'><em>Marinimicrobium</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 573 248 740 277; x_wconf 85' lang='eng' dir='ltr'><em>agarilyticum</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 751 248 822 272; x_wconf 88' lang='eng' dir='ltr'><em>M18T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 830 248 994 277; x_wconf 88' lang='eng' dir='ltr'><em>(AY839870)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 371 289 973 319; baseline 0 -6"><span class='ocrx_word' id='word_1_32' title='bbox 371 289 553 313; x_wconf 89' lang='eng' dir='ltr'><em>Microbulbifer</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 560 289 706 319; x_wconf 85' lang='eng' dir='ltr'><em>salipa/udis</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 717 289 802 313; x_wconf 91' lang='eng' dir='ltr'><em>SM-1T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 810 289 973 319; x_wconf 87' lang='eng' dir='ltr'><em>(AF479688)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 362 330 1063 360; baseline 0 -6"><span class='ocrx_word' id='word_1_36' title='bbox 362 330 543 354; x_wconf 88' lang='eng' dir='ltr'><em>Microbulbifer</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 551 331 687 360; x_wconf 83' lang='eng' dir='ltr'><em>elongatus</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 696 330 780 354; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 794 331 1063 360; x_wconf 82' lang='eng' dir='ltr'><em>10144T(ABOZ1368)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 351 372 1101 402; baseline 0 -7"><span class='ocrx_word' id='word_1_40' title='bbox 351 372 622 402; x_wconf 85' lang='eng' dir='ltr'><em>Saccharospirillum</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 633 372 786 402; x_wconf 87' lang='eng' dir='ltr'><em>salsuginis</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 795 372 930 395; x_wconf 92' lang='eng' dir='ltr'><em>YlM-Y25T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 937 372 1101 401; x_wconf 87' lang='eng' dir='ltr'><em>(EF177670)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 345 413 1025 442; baseline 0 -6"><span class='ocrx_word' id='word_1_44' title='bbox 345 413 590 442; x_wconf 85' lang='eng' dir='ltr'><em>SaccharospiriI/um</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 601 413 734 442; x_wconf 87' lang='eng' dir='ltr'><em>impatiens</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 746 413 857 436; x_wconf 91' lang='eng' dir='ltr'><em>EL—105T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 865 413 1025 442; x_wconf 87' lang='eng' dir='ltr'><em>(AJ315983)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 387 454 999 484; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 387 455 517 478; x_wconf 85' lang='eng' dir='ltr'><em>Reinekea</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 529 455 678 478; x_wconf 89' lang='eng' dir='ltr'><em>blandensis</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 690 455 822 478; x_wconf 90' lang='eng' dir='ltr'><em>MED297T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 830 454 999 484; x_wconf 88' lang='eng' dir='ltr'><em>(DQ403810)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 401 495 1182 525; baseline 0 -7"><span class='ocrx_word' id='word_1_52' title='bbox 401 496 532 519; x_wconf 86' lang='eng' dir='ltr'><em>Reinekea</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 543 496 827 519; x_wconf 86' lang='eng' dir='ltr'><em>marinisedimentorum</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 838 495 904 519; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 919 496 1182 525; x_wconf 83' lang='eng' dir='ltr'><em>15388T(AJ561121)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 375 536 954 565; baseline 0.002 -6"><span class='ocrx_word' id='word_1_56' title='bbox 375 537 502 565; x_wconf 84' lang='eng' dir='ltr'><em>Kangiel/a</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 513 537 647 560; x_wconf 86' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 658 536 954 565; x_wconf 76' lang='eng' dir='ltr'><em>SW—125T(AY52056O)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 332 577 976 648">
+     <span class='ocr_line' id='line_1_15' title="bbox 376 577 976 607; baseline 0 -6"><span class='ocrx_word' id='word_1_59' title='bbox 376 578 504 607; x_wconf 81' lang='eng' dir='ltr'><em>Kangie/la</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 515 578 668 607; x_wconf 84' lang='eng' dir='ltr'><em>aquimarina</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 680 577 804 601; x_wconf 81' lang='eng' dir='ltr'><em>SW—154T</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 812 578 976 607; x_wconf 88' lang='eng' dir='ltr'><em>(AY520561)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 332 620 845 648; baseline 0.002 -6"><span class='ocrx_word' id='word_1_63' title='bbox 332 620 495 643; x_wconf 86' lang='eng' dir='ltr'><em>Alcanivorax</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 501 620 620 648; x_wconf 85' lang='eng' dir='ltr'><em>jadensis</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 630 620 678 643; x_wconf 89' lang='eng' dir='ltr'><em>T9T</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 685 620 778 648; x_wconf 90' lang='eng' dir='ltr'><em>(AJ001</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 787 620 845 648; x_wconf 88' lang='eng'><em>150)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 338 660 1130 772">
+     <span class='ocr_line' id='line_1_17' title="bbox 370 660 1130 689; baseline -0.001 -5"><span class='ocrx_word' id='word_1_68' title='bbox 370 660 565 684; x_wconf 88' lang='eng' dir='ltr'><em>Sedimenticola</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 576 661 814 684; x_wconf 87' lang='eng' dir='ltr'><em>selenatireducens</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 823 660 906 684; x_wconf 93' lang='eng' dir='ltr'>AK4O</span> <span class='ocrx_word' id='word_1_71' title='bbox 911 661 928 683; x_wconf 91' lang='eng' dir='ltr'>H</span> <span class='ocrx_word' id='word_1_72' title='bbox 934 661 943 683; x_wconf 98' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 949 662 960 676; x_wconf 85' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_74' title='bbox 968 661 996 689; x_wconf 92' lang='eng' dir='ltr'>(A</span> <span class='ocrx_word' id='word_1_75' title='bbox 1000 661 1067 684; x_wconf 88' lang='eng' dir='ltr'><em>F432</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1073 661 1081 683; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1087 661 1130 689; x_wconf 92' lang='eng'><em>45)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 338 702 1024 731; baseline 0 -6"><span class='ocrx_word' id='word_1_78' title='bbox 338 702 535 725; x_wconf 87' lang='eng' dir='ltr'><em>Arhodomonas</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 546 702 683 731; x_wconf 88' lang='eng' dir='ltr'><em>aquaeo/ei</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 691 702 775 725; x_wconf 91' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 786 702 885 725; x_wconf 76' lang='eng' dir='ltr'><em>49307T</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 893 702 1024 731; x_wconf 88' lang='eng' dir='ltr'><em>(M26631)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 437 743 1044 772; baseline 0 -6"><span class='ocrx_word' id='word_1_83' title='bbox 437 743 602 766; x_wconf 86' lang='eng' dir='ltr'><em>Terasakiella</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 612 743 700 772; x_wconf 87' lang='eng' dir='ltr'><em>pusi/Ia</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 713 743 761 766; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 774 743 1044 772; x_wconf 85' lang='eng' dir='ltr'><em>13613T(ABOO6768)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 7 429 761">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 0 7 429 761">
+     <span class='ocr_line' id='line_1_20' title="bbox 165 7 429 28; baseline 0 745"><span class='ocrx_word' id='word_1_87' title='bbox 165 7 429 28; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 165 28 414 126; baseline 0 -15"><span class='ocrx_word' id='word_1_88' title='bbox 165 28 414 126; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 144 126 379 168; baseline 0 -16"><span class='ocrx_word' id='word_1_89' title='bbox 144 126 379 168; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 144 168 366 250; baseline 0 -16"><span class='ocrx_word' id='word_1_90' title='bbox 144 168 366 250; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 114 250 366 334; baseline 0 -19"><span class='ocrx_word' id='word_1_91' title='bbox 114 250 366 334; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 129 334 356 375; baseline 0 0"><span class='ocrx_word' id='word_1_92' title='bbox 129 334 356 375; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 96 375 343 417; baseline 0 356"><span class='ocrx_word' id='word_1_93' title='bbox 96 375 343 417; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 96 417 345 456; baseline 0 317"><span class='ocrx_word' id='word_1_94' title='bbox 96 417 345 456; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 76 456 395 540; baseline 0 0"><span class='ocrx_word' id='word_1_95' title='bbox 76 456 395 540; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 0 540 369 622; baseline 0 0"><span class='ocrx_word' id='word_1_96' title='bbox 0 540 369 622; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 0 622 332 662; baseline 0 111"><span class='ocrx_word' id='word_1_97' title='bbox 0 622 332 662; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 0 662 365 703; baseline 0 0"><span class='ocrx_word' id='word_1_98' title='bbox 0 662 365 703; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 0 703 429 761; baseline 0 0"><span class='ocrx_word' id='word_1_99' title='bbox 0 703 429 761; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003624-0-000.pbm.png b/examples/ijs.0.003624-0-000.pbm.png
new file mode 100644
index 00000000..57dcd335
Binary files /dev/null and b/examples/ijs.0.003624-0-000.pbm.png differ
diff --git a/examples/ijs.0.003624-0-000.pbm.png.hocr b/examples/ijs.0.003624-0-000.pbm.png.hocr
new file mode 100644
index 00000000..8da187d4
--- /dev/null
+++ b/examples/ijs.0.003624-0-000.pbm.png.hocr
@@ -0,0 +1,219 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003624-0-000.pbm.png"; bbox 0 0 1304 1130; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 285 2 1196 606">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 465 2 1168 34">
+     <span class='ocr_line' id='line_1_1' title="bbox 465 2 1168 34; baseline 0 -7"><span class='ocrx_word' id='word_1_1' title='bbox 465 10 508 28; x_wconf 89' lang='eng'>100</span> <span class='ocrx_word' id='word_1_2' title='bbox 558 5 709 34; x_wconf 86' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 720 5 857 34; x_wconf 85' lang='eng' dir='ltr'><em>chiguensis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 867 5 946 27; x_wconf 93' lang='eng' dir='ltr'>NTU—1</span> <span class='ocrx_word' id='word_1_5' title='bbox 954 6 981 27; x_wconf 94' lang='eng'><em>01</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 989 2 999 17; x_wconf 95' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 1009 3 1099 31; x_wconf 94' lang='eng' dir='ltr'>(EF101</span> <span class='ocrx_word' id='word_1_8' title='bbox 1110 3 1168 31; x_wconf 89' lang='eng'>168)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 535 52 1168 84">
+     <span class='ocr_line' id='line_1_2' title="bbox 535 52 1168 84; baseline -0.002 -6"><span class='ocrx_word' id='word_1_9' title='bbox 535 56 687 84; x_wconf 85' lang='eng' dir='ltr'><em>Virgibaci/lus</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 697 56 860 78; x_wconf 85' lang='eng' dir='ltr'><em>dokdonensis</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 870 55 963 78; x_wconf 88' lang='eng' dir='ltr'><em>DSW-1</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 971 52 998 77; x_wconf 95' lang='eng' dir='ltr'>0T</span> <span class='ocrx_word' id='word_1_13' title='bbox 1005 53 1168 82; x_wconf 88' lang='eng' dir='ltr'>(AY822043)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 542 98 1196 129">
+     <span class='ocr_line' id='line_1_3' title="bbox 542 98 1196 129; baseline -0.002 -6"><span class='ocrx_word' id='word_1_14' title='bbox 542 101 693 129; x_wconf 83' lang='eng' dir='ltr'><em>Virgibaci/Ius</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 702 101 894 129; x_wconf 79' lang='eng' dir='ltr'><em>pantothenticus</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 904 101 951 122; x_wconf 92' lang='eng' dir='ltr'><em>IAM</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 965 102 973 122; x_wconf 99' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 983 98 1196 127; x_wconf 87' lang='eng' dir='ltr'>1061T(D16275)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 520 150 1120 182">
+     <span class='ocr_line' id='line_1_4' title="bbox 520 150 1120 182; baseline 0 -7"><span class='ocrx_word' id='word_1_19' title='bbox 520 154 672 182; x_wconf 84' lang='eng' dir='ltr'><em>Virgibaci/lus</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 681 154 778 182; x_wconf 82' lang='eng' dir='ltr'><em>proomii</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 786 153 847 176; x_wconf 89' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 861 155 869 175; x_wconf 93' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 878 150 957 175; x_wconf 87' lang='eng' dir='ltr'><em>237OT</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 965 151 1033 180; x_wconf 91' lang='eng' dir='ltr'>(AJO1</span> <span class='ocrx_word' id='word_1_25' title='bbox 1042 151 1120 180; x_wconf 90' lang='eng'>2667)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 460 198 1005 229">
+     <span class='ocr_line' id='line_1_5' title="bbox 460 198 1005 229; baseline 0 -7"><span class='ocrx_word' id='word_1_26' title='bbox 460 201 612 229; x_wconf 83' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 622 201 772 223; x_wconf 82' lang='eng' dir='ltr'><em>marismortui</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 782 202 789 222; x_wconf 95' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 799 198 843 222; x_wconf 82' lang='eng' dir='ltr'><em>2ST</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 850 198 1005 227; x_wconf 74' lang='eng' dir='ltr'>(A1009793)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 395 241 951 273">
+     <span class='ocr_line' id='line_1_6' title="bbox 395 241 951 273; baseline 0 -7"><span class='ocrx_word' id='word_1_31' title='bbox 395 241 438 260; x_wconf 75' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 462 245 614 273; x_wconf 86' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 624 245 695 267; x_wconf 85' lang='eng' dir='ltr'><em>olivae</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 706 241 951 273; x_wconf 71' lang='eng' dir='ltr'>E308T(DO139839)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 503 286 1141 318">
+     <span class='ocr_line' id='line_1_7' title="bbox 503 286 1141 318; baseline 0 -7"><span class='ocrx_word' id='word_1_35' title='bbox 503 289 665 318; x_wconf 88' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 674 289 800 311; x_wconf 88' lang='eng' dir='ltr'><em>sediminis</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 809 289 859 311; x_wconf 95' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 872 286 960 318; x_wconf 90' lang='eng' dir='ltr'><em>kkny3T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 970 287 1141 316; x_wconf 89' lang='eng' dir='ltr'>(AY121430)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 594 336 1150 367">
+     <span class='ocr_line' id='line_1_8' title="bbox 594 336 1150 367; baseline -0.002 -6"><span class='ocrx_word' id='word_1_40' title='bbox 594 339 745 367; x_wconf 84' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 755 339 888 367; x_wconf 82' lang='eng' dir='ltr'><em>salexigens</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 897 336 1017 361; x_wconf 89' lang='eng' dir='ltr'><em>C-2OM0T</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1025 336 1063 364; x_wconf 90' lang='eng' dir='ltr'><em>(Y1</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1074 340 1081 360; x_wconf 94' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1090 336 1150 365; x_wconf 89' lang='eng'>603)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 468 383 1191 463">
+     <span class='ocr_line' id='line_1_9' title="bbox 487 383 1098 415; baseline 0 -7"><span class='ocrx_word' id='word_1_46' title='bbox 487 387 639 415; x_wconf 82' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 648 387 758 409; x_wconf 84' lang='eng' dir='ltr'><em>kekensis</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 767 387 814 408; x_wconf 93' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 827 387 893 415; x_wconf 91' lang='eng' dir='ltr'>kkny1</span> <span class='ocrx_word' id='word_1_50' title='bbox 902 383 928 408; x_wconf 92' lang='eng' dir='ltr'><em>6T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 935 384 993 413; x_wconf 90' lang='eng' dir='ltr'>(AY1</span> <span class='ocrx_word' id='word_1_52' title='bbox 1002 384 1098 413; x_wconf 88' lang='eng'>21439)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 468 431 1191 463; baseline -0.001 -6"><span class='ocrx_word' id='word_1_53' title='bbox 468 435 620 463; x_wconf 83' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 630 435 839 457; x_wconf 82' lang='eng' dir='ltr'><em>ha/odenitriﬁcans</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 849 434 911 457; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 925 431 1022 456; x_wconf 89' lang='eng' dir='ltr'>10037T</span> <span class='ocrx_word' id='word_1_57' title='bbox 1029 432 1140 461; x_wconf 87' lang='eng' dir='ltr'>(AY5431</span> <span class='ocrx_word' id='word_1_58' title='bbox 1149 432 1191 461; x_wconf 90' lang='eng'>69)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 285 478 1147 606">
+     <span class='ocr_line' id='line_1_11' title="bbox 520 478 1101 510; baseline 0 -7"><span class='ocrx_word' id='word_1_59' title='bbox 520 481 672 510; x_wconf 78' lang='eng' dir='ltr'><em>Virgibaci/lus</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 681 481 810 510; x_wconf 83' lang='eng' dir='ltr'><em>halophi/us</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 820 478 927 503; x_wconf 79' lang='eng' dir='ltr'><em>5B7SCT</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 935 479 1101 507; x_wconf 86' lang='eng' dir='ltr'><em>(AB243851)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 434 526 1135 558; baseline 0 -7"><span class='ocrx_word' id='word_1_63' title='bbox 434 541 451 543; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_64' title='bbox 467 529 619 558; x_wconf 84' lang='eng' dir='ltr'><em>Virgibaci/Ius</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 629 529 792 551; x_wconf 79' lang='eng' dir='ltr'><em>carmonensis</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 801 529 862 551; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 875 526 1135 555; x_wconf 86' lang='eng' dir='ltr'>20964T(AJ316302)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 285 567 1147 606; baseline -0.001 -6"><span class='ocrx_word' id='word_1_68' title='bbox 285 567 314 586; x_wconf 74' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 374 577 417 596; x_wconf 86' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 434 588 488 590; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_71' title='bbox 509 578 661 606; x_wconf 80' lang='eng' dir='ltr'><em>Virgibaci/lus</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 670 578 804 606; x_wconf 81' lang='eng' dir='ltr'><em>necropolis</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 813 577 874 600; x_wconf 90' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 889 574 1147 604; x_wconf 75' lang='eng' dir='ltr'><em>19488T(A1315056)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 476 622 1152 697">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 476 622 1152 697">
+     <span class='ocr_line' id='line_1_14' title="bbox 476 622 1080 654; baseline 0 -7"><span class='ocrx_word' id='word_1_75' title='bbox 476 625 628 654; x_wconf 83' lang='eng' dir='ltr'><em>Virgibacillus</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 638 625 760 647; x_wconf 87' lang='eng' dir='ltr'><em>koreensis</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 770 622 910 647; x_wconf 86' lang='eng' dir='ltr'><em>BH30097T</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 918 623 993 651; x_wconf 89' lang='eng' dir='ltr'>(AY61</span> <span class='ocrx_word' id='word_1_79' title='bbox 1002 626 1047 647; x_wconf 88' lang='eng'><em>601</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1056 623 1080 651; x_wconf 91' lang='eng'><em>2)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 543 665 1152 697; baseline -0.002 -6"><span class='ocrx_word' id='word_1_81' title='bbox 543 669 699 691; x_wconf 85' lang='eng' dir='ltr'><em>Halobacillus</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 709 669 808 697; x_wconf 82' lang='eng' dir='ltr'><em>trueperi</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 817 668 879 691; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 893 665 1152 695; x_wconf 86' lang='eng' dir='ltr'>1O4O4T(AJ310149)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 444 715 1178 1033">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 444 715 1178 1033">
+     <span class='ocr_line' id='line_1_16' title="bbox 567 715 1178 746; baseline 0 -7"><span class='ocrx_word' id='word_1_85' title='bbox 567 717 723 739; x_wconf 81' lang='eng' dir='ltr'><em>Halobaci/lus</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 733 717 861 746; x_wconf 83' lang='eng' dir='ltr'><em>ha/ophi/us</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 872 717 965 739; x_wconf 90' lang='eng' dir='ltr'><em>NCIMB</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 976 718 1039 739; x_wconf 87' lang='eng'><em>9251</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 1053 715 1178 743; x_wconf 91' lang='eng' dir='ltr'>(X62174)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 569 761 1143 790; baseline -0.002 -4"><span class='ocrx_word' id='word_1_90' title='bbox 569 763 748 786; x_wconf 84' lang='eng' dir='ltr'><em>Gracilibacillus</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 758 764 914 786; x_wconf 82' lang='eng' dir='ltr'><em>haloto/erans</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 924 761 975 785; x_wconf 96' lang='eng' dir='ltr'><em>NNT</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 983 761 1143 790; x_wconf 90' lang='eng' dir='ltr'>(AF036922)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 623 808 1156 840; baseline 0 -7"><span class='ocrx_word' id='word_1_94' title='bbox 623 811 802 833; x_wconf 69' lang='eng' dir='ltr'><em>Grad/[bacillus</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 813 811 944 840; x_wconf 83' lang='eng' dir='ltr'><em>dipsosauri</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 953 811 992 833; x_wconf 94' lang='eng' dir='ltr'>DD</span> <span class='ocrx_word' id='word_1_97' title='bbox 998 813 1005 833; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 1012 808 1022 823; x_wconf 88' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 1030 809 1156 837; x_wconf 88' lang='eng' dir='ltr'><em>(X82436)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 444 856 1077 887; baseline -0.002 -6"><span class='ocrx_word' id='word_1_100' title='bbox 444 859 644 881; x_wconf 80' lang='eng' dir='ltr'><em>Oceanobacil/us</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 654 859 771 887; x_wconf 86' lang='eng' dir='ltr'><em>iheyensis</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 781 859 883 880; x_wconf 87' lang='eng' dir='ltr'>HTE831</span> <span class='ocrx_word' id='word_1_103' title='bbox 890 856 900 870; x_wconf 96' lang='eng' dir='ltr'><em>T</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 913 856 1077 885; x_wconf 86' lang='eng' dir='ltr'>(ABO10863)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 515 903 1155 933; baseline 0 -5"><span class='ocrx_word' id='word_1_105' title='bbox 515 906 715 928; x_wconf 83' lang='eng' dir='ltr'><em>Oceanobacillus</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 725 907 851 928; x_wconf 80' lang='eng' dir='ltr'><em>Chironomi</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 858 903 978 928; x_wconf 88' lang='eng' dir='ltr'>T3944DT</span> <span class='ocrx_word' id='word_1_108' title='bbox 985 904 1155 933; x_wconf 88' lang='eng' dir='ltr'><em>(DO298074)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 470 953 1082 983; baseline 0 -5"><span class='ocrx_word' id='word_1_109' title='bbox 470 957 645 978; x_wconf 83' lang='eng' dir='ltr'><em>Marinibacillus</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 655 957 754 978; x_wconf 83' lang='eng' dir='ltr'><em>marinus</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 765 956 826 978; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 841 953 920 978; x_wconf 94' lang='eng' dir='ltr'>1297T</span> <span class='ocrx_word' id='word_1_113' title='bbox 927 954 1082 983; x_wconf 85' lang='eng' dir='ltr'>(AJ237708)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 500 1001 1141 1033; baseline 0 -7"><span class='ocrx_word' id='word_1_114' title='bbox 500 1004 695 1033; x_wconf 81' lang='eng' dir='ltr'><em>Jeotgalibacillus</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 705 1004 858 1026; x_wconf 73' lang='eng' dir='ltr'><em>alimentarius</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 867 1001 1072 1030; x_wconf 86' lang='eng' dir='ltr'>YKJ-13T(AF281</span> <span class='ocrx_word' id='word_1_117' title='bbox 1083 1002 1141 1030; x_wconf 93' lang='eng'><em>158)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 451 1051 1302 1127">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 451 1051 1302 1127">
+     <span class='ocr_line' id='line_1_23' title="bbox 451 1051 1066 1083; baseline 0 -7"><span class='ocrx_word' id='word_1_118' title='bbox 451 1054 619 1076; x_wconf 85' lang='eng' dir='ltr'><em>F’aenibaciI/us</em></span> <span class='ocrx_word' id='word_1_119' title='bbox 628 1054 744 1083; x_wconf 83' lang='eng' dir='ltr'><em>po/ymyxa</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 755 1054 842 1076; x_wconf 92' lang='eng' dir='ltr'><em>NCDO</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 856 1055 863 1076; x_wconf 96' lang='eng'><em>1</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 873 1051 934 1076; x_wconf 92' lang='eng' dir='ltr'><em>774T</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 941 1051 1066 1080; x_wconf 84' lang='eng' dir='ltr'>(X60632)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 628 1096 1302 1127; baseline -0.001 -6"><span class='ocrx_word' id='word_1_124' title='bbox 628 1099 827 1127; x_wconf 82' lang='eng' dir='ltr'><em>AlicyC/obaci/lus</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 836 1099 1022 1121; x_wconf 81' lang='eng' dir='ltr'><em>acidocaldarius</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 1033 1098 1095 1121; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 1106 1096 1169 1120; x_wconf 90' lang='eng' dir='ltr'>446T</span> <span class='ocrx_word' id='word_1_128' title='bbox 1177 1096 1302 1125; x_wconf 91' lang='eng' dir='ltr'>(X60742)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 3 13 617 1070">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 3 13 617 1070">
+     <span class='ocr_line' id='line_1_25' title="bbox 428 13 557 50; baseline 0 -14"><span class='ocrx_word' id='word_1_129' title='bbox 428 13 557 50; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 384 50 538 144; baseline 0 0"><span class='ocrx_word' id='word_1_130' title='bbox 384 50 538 144; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 384 144 513 198; baseline 0 0"><span class='ocrx_word' id='word_1_131' title='bbox 384 144 513 198; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 384 198 459 244; baseline 0 0"><span class='ocrx_word' id='word_1_132' title='bbox 384 198 459 244; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 361 244 395 289; baseline 0 841"><span class='ocrx_word' id='word_1_133' title='bbox 361 244 395 289; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 361 289 503 334; baseline 0 796"><span class='ocrx_word' id='word_1_134' title='bbox 361 289 503 334; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 357 334 587 367; baseline 0 763"><span class='ocrx_word' id='word_1_135' title='bbox 357 334 587 367; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 357 367 487 431; baseline 0 0"><span class='ocrx_word' id='word_1_136' title='bbox 357 367 487 431; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 350 522 434 567; baseline 0 563"><span class='ocrx_word' id='word_1_137' title='bbox 350 522 434 567; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 322 631 476 670; baseline 0.019 -3"><span class='ocrx_word' id='word_1_138' title='bbox 322 631 476 670; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> <span class='ocrx_word' id='word_1_139' title='bbox 470 667 476 670; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 322 670 566 761; baseline 0 -58"><span class='ocrx_word' id='word_1_140' title='bbox 322 670 566 761; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 347 761 617 808; baseline 0.015 -4"><span class='ocrx_word' id='word_1_141' title='bbox 347 761 617 808; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 434 808 617 844; baseline 0 -12"><span class='ocrx_word' id='word_1_142' title='bbox 434 808 617 844; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 61 844 442 902; baseline 0 228"><span class='ocrx_word' id='word_1_143' title='bbox 61 844 442 902; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 3 902 511 938; baseline 0 192"><span class='ocrx_word' id='word_1_144' title='bbox 3 902 511 938; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 3 938 470 998; baseline 0 132"><span class='ocrx_word' id='word_1_145' title='bbox 3 938 470 998; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 3 998 492 1035; baseline 0 95"><span class='ocrx_word' id='word_1_146' title='bbox 3 998 492 1035; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 3 1035 451 1070; baseline 0 60"><span class='ocrx_word' id='word_1_147' title='bbox 3 1035 451 1070; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 2 45 123 77">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 25 45 82 66">
+     <span class='ocr_line' id='line_1_43' title="bbox 25 45 82 66; baseline 0 0"><span class='ocrx_word' id='word_1_148' title='bbox 25 45 82 66; x_wconf 92' lang='eng'>0.02</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 351 219 380 237">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 351 219 380 237">
+     <span class='ocr_line' id='line_1_44' title="bbox 351 219 380 237; baseline 0 0"><span class='ocrx_word' id='word_1_149' title='bbox 351 219 380 237; x_wconf 88' lang='eng'><em>59</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 341 290 370 308">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 341 290 370 308">
+     <span class='ocr_line' id='line_1_45' title="bbox 341 290 370 308; baseline 0 0"><span class='ocrx_word' id='word_1_150' title='bbox 341 290 370 308; x_wconf 92' lang='eng'><em>64</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 323 405 352 423">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 323 405 352 423">
+     <span class='ocr_line' id='line_1_46' title="bbox 323 405 352 423; baseline 0 0"><span class='ocrx_word' id='word_1_151' title='bbox 323 405 352 423; x_wconf 89' lang='eng'>54</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 314 467 342 485">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 314 467 342 485">
+     <span class='ocr_line' id='line_1_47' title="bbox 314 467 342 485; baseline 0 0"><span class='ocrx_word' id='word_1_152' title='bbox 314 467 342 485; x_wconf 87' lang='eng'><em>94</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 432 541 434 590">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 432 541 434 590">
+     <span class='ocr_line' id='line_1_48' title="bbox 432 541 434 590; baseline 0 540"><span class='ocrx_word' id='word_1_153' title='bbox 432 541 434 590; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 61 594 392 844">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 61 594 392 844">
+     <span class='ocr_line' id='line_1_49' title="bbox 203 594 329 703; baseline 0 0"><span class='ocrx_word' id='word_1_154' title='bbox 203 594 329 703; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_50' title="bbox 61 703 392 844; baseline 0 -36"><span class='ocrx_word' id='word_1_155' title='bbox 61 703 392 844; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 325 501 327 697">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 325 501 327 697">
+     <span class='ocr_line' id='line_1_51' title="bbox 325 501 327 697; baseline 0 433"><span class='ocrx_word' id='word_1_156' title='bbox 325 501 327 697; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 314 676 470 727">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 314 676 470 727">
+     <span class='ocr_line' id='line_1_52' title="bbox 427 676 470 694; baseline 0 0"><span class='ocrx_word' id='word_1_157' title='bbox 427 676 470 694; x_wconf 92' lang='eng'><em>100</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 314 709 342 727; baseline 0 0"><span class='ocrx_word' id='word_1_158' title='bbox 314 709 342 727; x_wconf 88' lang='eng'><em>86</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 330 766 434 835">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 330 766 434 835">
+     <span class='ocr_line' id='line_1_54' title="bbox 330 766 359 785; baseline 0 0"><span class='ocrx_word' id='word_1_159' title='bbox 330 766 359 785; x_wconf 86' lang='eng'>66</span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 392 817 434 835; baseline 0 0"><span class='ocrx_word' id='word_1_160' title='bbox 392 817 434 835; x_wconf 94' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 7 1111 613 1113">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 7 1111 613 1113">
+     <span class='ocr_line' id='line_1_56' title="bbox 7 1111 613 1113; baseline 0 17"><span class='ocrx_word' id='word_1_161' title='bbox 7 1111 613 1113; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003640-0-001.pbm.png b/examples/ijs.0.003640-0-001.pbm.png
new file mode 100644
index 00000000..fd468716
Binary files /dev/null and b/examples/ijs.0.003640-0-001.pbm.png differ
diff --git a/examples/ijs.0.003640-0-001.pbm.png.hocr b/examples/ijs.0.003640-0-001.pbm.png.hocr
new file mode 100644
index 00000000..bdc6e510
--- /dev/null
+++ b/examples/ijs.0.003640-0-001.pbm.png.hocr
@@ -0,0 +1,110 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003640-0-001.pbm.png"; bbox 0 0 1231 1733; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 17 4 1230 1693">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 17 4 1230 1693">
+     <span class='ocr_line' id='line_1_1' title="bbox 441 4 988 32; baseline -0.002 -5"><span class='ocrx_word' id='word_1_1' title='bbox 441 5 608 27; x_wconf 84' lang='eng' dir='ltr'><em>Nonomuraea</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 617 5 699 32; x_wconf 85' lang='eng' dir='ltr'><em>pusilla</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 711 5 756 27; x_wconf 95' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 769 4 857 27; x_wconf 80' lang='eng' dir='ltr'><em>14684T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 868 5 988 32; x_wconf 84' lang='eng' dir='ltr'>(D85491)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 235 48 808 76; baseline 0 -6"><span class='ocrx_word' id='word_1_6' title='bbox 235 49 415 70; x_wconf 82' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 425 49 478 70; x_wconf 86' lang='eng' dir='ltr'><em>alba</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 488 49 538 70; x_wconf 94' lang='eng' dir='ltr'><em>YIM</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 548 48 639 70; x_wconf 91' lang='eng' dir='ltr'><em>45681T</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 649 49 808 76; x_wconf 86' lang='eng' dir='ltr'>(DQ985164)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 211 91 904 120; baseline 0 -6"><span class='ocrx_word' id='word_1_11' title='bbox 211 93 391 114; x_wconf 80' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 400 93 540 120; x_wconf 78' lang='eng' dir='ltr'><em>yumaensis</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 551 92 641 114; x_wconf 89' lang='eng' dir='ltr'>IMSNU</span> <span class='ocrx_word' id='word_1_14' title='bbox 652 91 743 114; x_wconf 81' lang='eng' dir='ltr'><em>22167T</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 755 92 904 120; x_wconf 87' lang='eng' dir='ltr'>(AJ293714)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 281 135 869 163; baseline -0.002 -5"><span class='ocrx_word' id='word_1_16' title='bbox 281 136 462 158; x_wconf 85' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 472 136 585 158; x_wconf 85' lang='eng' dir='ltr'><em>hal/ensis</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 596 135 700 158; x_wconf 76' lang='eng' dir='ltr'><em>H647-1T</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 710 136 869 163; x_wconf 88' lang='eng' dir='ltr'>(DQO76484)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 214 179 832 207; baseline 0 -6"><span class='ocrx_word' id='word_1_20' title='bbox 214 180 394 201; x_wconf 82' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 404 180 469 201; x_wconf 84' lang='eng' dir='ltr'><em>Iivida</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 481 180 571 201; x_wconf 86' lang='eng' dir='ltr'>IMSNU</span> <span class='ocrx_word' id='word_1_23' title='bbox 582 179 673 201; x_wconf 88' lang='eng' dir='ltr'><em>22191T</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 683 180 832 207; x_wconf 88' lang='eng' dir='ltr'><em>(AJ293706)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 150 221 1030 251; baseline 0 -6"><span class='ocrx_word' id='word_1_25' title='bbox 150 221 194 242; x_wconf 91' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 205 224 529 245; x_wconf 80' lang='eng' dir='ltr'><em>—Actinomadura</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 540 224 710 250; x_wconf 78' lang='eng' dir='ltr'><em>cate/latispora</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 721 223 767 245; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 779 222 868 245; x_wconf 79' lang='eng' dir='ltr'><em>16341T</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 878 223 1030 251; x_wconf 89' lang='eng' dir='ltr'>(AF154127)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 305 266 961 294; baseline 0 -6"><span class='ocrx_word' id='word_1_31' title='bbox 305 267 485 288; x_wconf 80' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 496 267 673 294; x_wconf 83' lang='eng' dir='ltr'><em>rugatobispora</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 685 267 729 288; x_wconf 94' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 743 266 831 288; x_wconf 80' lang='eng' dir='ltr'><em>14382T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 841 267 961 294; x_wconf 90' lang='eng' dir='ltr'>(U49010)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 137 310 876 340; baseline 0 -8"><span class='ocrx_word' id='word_1_36' title='bbox 137 319 167 340; x_wconf 82' lang='eng'><em>74</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 250 311 430 332; x_wconf 83' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 442 311 540 332; x_wconf 85' lang='eng' dir='ltr'><em>vinacea</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 551 311 612 332; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 622 310 714 332; x_wconf 82' lang='eng' dir='ltr'><em>43765T</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 724 311 876 338; x_wconf 86' lang='eng' dir='ltr'>(AF134070)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 178 352 849 382; baseline 0 -6"><span class='ocrx_word' id='word_1_42' title='bbox 178 352 204 373; x_wconf 88' lang='eng'><em>91</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 253 355 433 376; x_wconf 81' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 444 355 517 376; x_wconf 87' lang='eng' dir='ltr'><em>viridis</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 528 355 588 376; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 599 354 690 376; x_wconf 77' lang='eng' dir='ltr'><em>43175T</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 700 354 849 382; x_wconf 91' lang='eng' dir='ltr'>(AJ420141)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 154 397 1049 426; baseline 0 -6"><span class='ocrx_word' id='word_1_48' title='bbox 154 404 183 425; x_wconf 79' lang='eng'><em>52</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 388 399 568 420; x_wconf 83' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 577 399 688 425; x_wconf 81' lang='eng' dir='ltr'><em>pelletieri</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 697 398 787 420; x_wconf 89' lang='eng' dir='ltr'><em>IMSNU</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 799 397 889 420; x_wconf 79' lang='eng' dir='ltr'><em>22169T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 900 398 1049 426; x_wconf 80' lang='eng' dir='ltr'>(AJ293710)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 261 441 888 469; baseline 0 -6"><span class='ocrx_word' id='word_1_54' title='bbox 261 442 442 463; x_wconf 81' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 452 448 532 463; x_wconf 81' lang='eng' dir='ltr'><em>macra</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 543 442 622 463; x_wconf 90' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 635 441 723 463; x_wconf 83' lang='eng' dir='ltr'><em>14102T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 734 442 888 469; x_wconf 86' lang='eng' dir='ltr'>(AB364594)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 346 485 1149 513; baseline 0 -6"><span class='ocrx_word' id='word_1_59' title='bbox 346 486 527 507; x_wconf 86' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 538 491 633 507; x_wconf 85' lang='eng' dir='ltr'><em>cremea</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 643 486 726 513; x_wconf 88' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 738 491 834 507; x_wconf 86' lang='eng' dir='ltr'><em>cremea</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 844 486 901 507; x_wconf 91' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_64' title='bbox 913 485 987 507; x_wconf 78' lang='eng' dir='ltr'><em>3308T</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 997 485 1149 513; x_wconf 88' lang='eng' dir='ltr'>(AF134067)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 204 528 1230 557; baseline 0.001 -7"><span class='ocrx_word' id='word_1_66' title='bbox 204 529 234 550; x_wconf 88' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 429 529 609 551; x_wconf 81' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 620 535 715 551; x_wconf 89' lang='eng' dir='ltr'><em>cremea</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 726 529 808 556; x_wconf 87' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 820 529 944 557; x_wconf 70' lang='eng' dir='ltr'><em>rifamycini</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 954 529 999 551; x_wconf 89' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1012 528 1100 551; x_wconf 89' lang='eng' dir='ltr'><em>14183T</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 1110 529 1230 557; x_wconf 89' lang='eng' dir='ltr'>(U49003)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 17 556 952 601; baseline 0 -7"><span class='ocrx_word' id='word_1_74' title='bbox 17 576 43 597; x_wconf 91' lang='eng'><em>5</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 72 556 102 577; x_wconf 74' lang='eng'><em>72</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 272 573 452 594; x_wconf 83' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 463 573 620 594; x_wconf 84' lang='eng' dir='ltr'><em>formosensis</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 630 573 691 594; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 702 572 793 594; x_wconf 79' lang='eng' dir='ltr'><em>43997T</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 804 573 952 601; x_wconf 91' lang='eng' dir='ltr'>(AJ420140)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 243 616 806 644; baseline 0 -6"><span class='ocrx_word' id='word_1_81' title='bbox 243 617 423 639; x_wconf 82' lang='eng' dir='ltr'><em>Actinornadura</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 434 617 557 639; x_wconf 83' lang='eng' dir='ltr'><em>mexicana</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 565 616 643 639; x_wconf 79' lang='eng' dir='ltr'><em>A290T</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 653 617 806 644; x_wconf 86' lang='eng' dir='ltr'>(AF277195)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 249 660 843 688; baseline 0 -6"><span class='ocrx_word' id='word_1_85' title='bbox 249 661 430 682; x_wconf 84' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 440 661 510 682; x_wconf 84' lang='eng' dir='ltr'><em>citrea</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 521 661 582 682; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 592 660 684 682; x_wconf 80' lang='eng' dir='ltr'><em>43461T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 694 660 843 688; x_wconf 87' lang='eng' dir='ltr'>(AJ420139)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 166 704 910 732; baseline -0.001 -6"><span class='ocrx_word' id='word_1_90' title='bbox 166 706 196 728; x_wconf 88' lang='eng'>92</span> <span class='ocrx_word' id='word_1_91' title='bbox 262 704 442 726; x_wconf 79' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 452 704 589 732; x_wconf 83' lang='eng' dir='ltr'><em>glauc/ﬂava</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 601 704 646 726; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 658 704 747 726; x_wconf 73' lang='eng' dir='ltr'><em>14668T</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 757 704 910 732; x_wconf 86' lang='eng' dir='ltr'>(AF153881)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 179 747 980 782; baseline 0 -13"><span class='ocrx_word' id='word_1_96' title='bbox 179 761 209 782; x_wconf 71' lang='eng'><em>53</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 290 748 471 769; x_wconf 82' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 481 748 693 769; x_wconf 81' lang='eng' dir='ltr'><em>luteof/uorescens</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 704 748 749 769; x_wconf 95' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 762 747 851 769; x_wconf 89' lang='eng' dir='ltr'><em>13057T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 861 748 980 775; x_wconf 86' lang='eng' dir='ltr'>(U49008)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 200 791 866 822; baseline 0 -9"><span class='ocrx_word' id='word_1_102' title='bbox 200 800 230 822; x_wconf 76' lang='eng'>80</span> <span class='ocrx_word' id='word_1_103' title='bbox 277 792 458 813; x_wconf 83' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 468 792 579 813; x_wconf 85' lang='eng' dir='ltr'><em>coerulea</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 590 792 635 813; x_wconf 95' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 648 791 736 813; x_wconf 80' lang='eng' dir='ltr'><em>14679T</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 747 791 866 819; x_wconf 88' lang='eng' dir='ltr'>(U49002)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 207 830 947 863; baseline 0 -6"><span class='ocrx_word' id='word_1_108' title='bbox 207 830 237 851; x_wconf 81' lang='eng'><em>65</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 271 835 451 857; x_wconf 82' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 463 841 662 862; x_wconf 84' lang='eng' dir='ltr'><em>verrucosospora</em></span> <span class='ocrx_word' id='word_1_111' title='bbox 673 835 718 857; x_wconf 96' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 731 834 820 857; x_wconf 91' lang='eng' dir='ltr'><em>14100T</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 830 835 947 863; x_wconf 84' lang='eng' dir='ltr'>(U49011)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 226 878 835 907; baseline 0 -6"><span class='ocrx_word' id='word_1_114' title='bbox 226 879 406 901; x_wconf 81' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_115' title='bbox 417 879 531 901; x_wconf 81' lang='eng' dir='ltr'><em>madurae</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 542 879 603 901; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 613 878 705 901; x_wconf 78' lang='eng' dir='ltr'><em>43067T</em></span> <span class='ocrx_word' id='word_1_118' title='bbox 716 879 835 907; x_wconf 88' lang='eng' dir='ltr'>(X97889)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 213 922 764 950; baseline 0 -6"><span class='ocrx_word' id='word_1_119' title='bbox 213 923 393 944; x_wconf 81' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 403 929 516 950; x_wconf 86' lang='eng' dir='ltr'><em>meyerae</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 523 922 602 944; x_wconf 88' lang='eng' dir='ltr'><em>A288T</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 612 923 764 950; x_wconf 86' lang='eng' dir='ltr'><em>(AY273787)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 236 966 808 994; baseline 0 -6"><span class='ocrx_word' id='word_1_123' title='bbox 236 967 416 988; x_wconf 81' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_124' title='bbox 427 967 576 994; x_wconf 85' lang='eng' dir='ltr'><em>napierensis</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 586 966 646 988; x_wconf 73' lang='eng' dir='ltr'><em>BSOT</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 656 966 808 994; x_wconf 86' lang='eng' dir='ltr'>(AY568292)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 140 1006 916 1038; baseline 0 -6"><span class='ocrx_word' id='word_1_127' title='bbox 140 1006 170 1028; x_wconf 81' lang='eng'><em>83</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 321 1011 502 1032; x_wconf 83' lang='eng' dir='ltr'><em>Act/nomadura</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 512 1011 580 1032; x_wconf 79' lang='eng' dir='ltr'><em>lat/na</em></span> <span class='ocrx_word' id='word_1_130' title='bbox 591 1010 652 1032; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 663 1009 754 1032; x_wconf 83' lang='eng' dir='ltr'><em>43382T</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 765 1010 916 1038; x_wconf 86' lang='eng' dir='ltr'>(AY035998)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 343 1053 1030 1081; baseline 0 -5"><span class='ocrx_word' id='word_1_133' title='bbox 343 1054 523 1076; x_wconf 85' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 534 1054 696 1076; x_wconf 85' lang='eng' dir='ltr'><em>atramentaria</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 707 1054 769 1076; x_wconf 82' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_136' title='bbox 779 1053 870 1076; x_wconf 77' lang='eng' dir='ltr'><em>43919T</em></span> <span class='ocrx_word' id='word_1_137' title='bbox 880 1054 1030 1081; x_wconf 87' lang='eng' dir='ltr'>(AJ420138)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 20 1087 936 1135; baseline 0 -16"><span class='ocrx_word' id='word_1_138' title='bbox 20 1087 49 1109; x_wconf 74' lang='eng'><em>56</em></span> <span class='ocrx_word' id='word_1_139' title='bbox 198 1114 228 1135; x_wconf 76' lang='eng'><em>67</em></span> <span class='ocrx_word' id='word_1_140' title='bbox 323 1098 503 1119; x_wconf 83' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_141' title='bbox 514 1098 603 1119; x_wconf 83' lang='eng' dir='ltr'><em>hibisca</em></span> <span class='ocrx_word' id='word_1_142' title='bbox 614 1098 675 1119; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 685 1097 777 1119; x_wconf 73' lang='eng' dir='ltr'><em>44148T</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 787 1097 936 1125; x_wconf 81' lang='eng' dir='ltr'>(AJ420136)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 353 1140 1030 1169; baseline -0.001 -6"><span class='ocrx_word' id='word_1_145' title='bbox 353 1141 533 1163; x_wconf 82' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 544 1141 697 1163; x_wconf 85' lang='eng' dir='ltr'><em>namibiensis</em></span> <span class='ocrx_word' id='word_1_147' title='bbox 708 1141 769 1163; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_148' title='bbox 779 1140 871 1163; x_wconf 84' lang='eng' dir='ltr'><em>44197T</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 881 1141 1030 1169; x_wconf 85' lang='eng' dir='ltr'>(AJ420134)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 260 1183 969 1213; baseline 0.003 -8"><span class='ocrx_word' id='word_1_150' title='bbox 260 1183 304 1205; x_wconf 94' lang='eng'>100</span> <span class='ocrx_word' id='word_1_151' title='bbox 371 1185 551 1207; x_wconf 84' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_152' title='bbox 561 1185 667 1213; x_wconf 81' lang='eng' dir='ltr'><em>kijaniata</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 678 1185 739 1207; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_154' title='bbox 750 1184 841 1207; x_wconf 79' lang='eng' dir='ltr'><em>43764T</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 851 1185 969 1213; x_wconf 88' lang='eng' dir='ltr'><em>(X97890)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 367 1228 1036 1256; baseline 0 -5"><span class='ocrx_word' id='word_1_156' title='bbox 367 1229 547 1251; x_wconf 84' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 558 1229 691 1256; x_wconf 86' lang='eng' dir='ltr'><em>oligospora</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 698 1229 775 1251; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_159' title='bbox 785 1228 876 1251; x_wconf 81' lang='eng' dir='ltr'><em>43269T</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 886 1229 1036 1256; x_wconf 85' lang='eng' dir='ltr'>(AF163118)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 394 1272 1108 1300; baseline 0 -6"><span class='ocrx_word' id='word_1_161' title='bbox 394 1273 591 1294; x_wconf 88' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 600 1273 779 1300; x_wconf 85' lang='eng' dir='ltr'><em>keratinilytica</em></span> <span class='ocrx_word' id='word_1_163' title='bbox 787 1272 942 1294; x_wconf 78' lang='eng' dir='ltr'><em>WCC-2265T</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 952 1272 1108 1300; x_wconf 87' lang='eng' dir='ltr'><em>(EU637009)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 237 1315 1042 1347; baseline 0 -9"><span class='ocrx_word' id='word_1_165' title='bbox 237 1326 282 1347; x_wconf 77' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 441 1317 622 1338; x_wconf 79' lang='eng' dir='ltr'><em>Act/nomadura</em></span> <span class='ocrx_word' id='word_1_167' title='bbox 633 1317 754 1338; x_wconf 75' lang='eng' dir='ltr'><em>viridi/utea</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 766 1316 811 1338; x_wconf 92' lang='eng' dir='ltr'><em>IFO</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 823 1315 912 1338; x_wconf 80' lang='eng' dir='ltr'><em>14480T</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 922 1316 1042 1344; x_wconf 86' lang='eng' dir='ltr'>(D86943)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 351 1359 1151 1387; baseline 0 -6"><span class='ocrx_word' id='word_1_171' title='bbox 351 1360 395 1381; x_wconf 89' lang='eng'>100</span> <span class='ocrx_word' id='word_1_172' title='bbox 463 1360 643 1381; x_wconf 78' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_173' title='bbox 653 1360 811 1381; x_wconf 86' lang='eng' dir='ltr'><em>rubrobrunea</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 823 1360 883 1381; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 894 1359 985 1381; x_wconf 83' lang='eng' dir='ltr'><em>43750T</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 996 1360 1151 1387; x_wconf 84' lang='eng' dir='ltr'><em>(EU637008)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 280 1403 981 1431; baseline 0 -6"><span class='ocrx_word' id='word_1_177' title='bbox 280 1404 460 1425; x_wconf 83' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_178' title='bbox 471 1404 639 1425; x_wconf 85' lang='eng' dir='ltr'><em>rudentiformis</em></span> <span class='ocrx_word' id='word_1_179' title='bbox 650 1404 711 1425; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_180' title='bbox 721 1403 813 1425; x_wconf 81' lang='eng' dir='ltr'><em>44962T</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 823 1403 981 1431; x_wconf 89' lang='eng' dir='ltr'><em>(DQ285420)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 177 1442 926 1475; baseline 0 -6"><span class='ocrx_word' id='word_1_182' title='bbox 177 1442 207 1463; x_wconf 88' lang='eng'>89</span> <span class='ocrx_word' id='word_1_183' title='bbox 266 1448 446 1469; x_wconf 83' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 456 1447 593 1469; x_wconf 88' lang='eng' dir='ltr'><em>fulvescens</em></span> <span class='ocrx_word' id='word_1_185' title='bbox 604 1447 665 1469; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_186' title='bbox 675 1446 767 1469; x_wconf 78' lang='eng' dir='ltr'>439st</span> <span class='ocrx_word' id='word_1_187' title='bbox 777 1447 926 1475; x_wconf 88' lang='eng' dir='ltr'>(AJ420137)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 239 1490 861 1519; baseline 0 -6"><span class='ocrx_word' id='word_1_188' title='bbox 239 1491 419 1513; x_wconf 79' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_189' title='bbox 430 1491 516 1513; x_wconf 79' lang='eng' dir='ltr'><em>ﬁbrosa</em></span> <span class='ocrx_word' id='word_1_190' title='bbox 523 1491 599 1513; x_wconf 90' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_191' title='bbox 609 1490 701 1513; x_wconf 81' lang='eng' dir='ltr'><em>49459T</em></span> <span class='ocrx_word' id='word_1_192' title='bbox 711 1491 861 1519; x_wconf 88' lang='eng' dir='ltr'>(AF163114)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 133 1531 920 1562; baseline 0.001 -6"><span class='ocrx_word' id='word_1_193' title='bbox 133 1531 162 1552; x_wconf 78' lang='eng'><em>52</em></span> <span class='ocrx_word' id='word_1_194' title='bbox 253 1535 434 1557; x_wconf 82' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_195' title='bbox 444 1535 585 1562; x_wconf 75' lang='eng' dir='ltr'><em>nitritigenes</em></span> <span class='ocrx_word' id='word_1_196' title='bbox 595 1535 656 1557; x_wconf 83' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_197' title='bbox 667 1534 758 1557; x_wconf 80' lang='eng' dir='ltr'><em>44137T</em></span> <span class='ocrx_word' id='word_1_198' title='bbox 769 1535 920 1562; x_wconf 83' lang='eng' dir='ltr'>(AY035999)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 240 1578 850 1606; baseline 0 -6"><span class='ocrx_word' id='word_1_199' title='bbox 240 1579 420 1600; x_wconf 82' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_200' title='bbox 431 1579 535 1600; x_wconf 82' lang='eng' dir='ltr'><em>umbrina</em></span> <span class='ocrx_word' id='word_1_201' title='bbox 545 1579 602 1600; x_wconf 83' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_202' title='bbox 613 1578 688 1600; x_wconf 78' lang='eng' dir='ltr'><em>6837T</em></span> <span class='ocrx_word' id='word_1_203' title='bbox 698 1579 850 1606; x_wconf 89' lang='eng' dir='ltr'>(AF163121)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 44 1618 922 1650; baseline 0 -6"><span class='ocrx_word' id='word_1_204' title='bbox 44 1618 74 1639; x_wconf 88' lang='eng'>55</span> <span class='ocrx_word' id='word_1_205' title='bbox 240 1623 420 1644; x_wconf 79' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_206' title='bbox 431 1623 588 1649; x_wconf 86' lang='eng' dir='ltr'><em>echinospora</em></span> <span class='ocrx_word' id='word_1_207' title='bbox 600 1622 661 1644; x_wconf 91' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_208' title='bbox 671 1621 762 1644; x_wconf 81' lang='eng' dir='ltr'><em>43163T</em></span> <span class='ocrx_word' id='word_1_209' title='bbox 773 1622 922 1650; x_wconf 86' lang='eng' dir='ltr'>(AJ420135)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 229 1665 818 1693; baseline -0.002 -5"><span class='ocrx_word' id='word_1_210' title='bbox 229 1666 409 1688; x_wconf 83' lang='eng' dir='ltr'><em>Actinomadura</em></span> <span class='ocrx_word' id='word_1_211' title='bbox 420 1666 504 1693; x_wconf 86' lang='eng' dir='ltr'><em>spadix</em></span> <span class='ocrx_word' id='word_1_212' title='bbox 513 1666 570 1688; x_wconf 89' lang='eng' dir='ltr'><em>JCM</em></span> <span class='ocrx_word' id='word_1_213' title='bbox 581 1665 655 1688; x_wconf 88' lang='eng' dir='ltr'><em>3146T</em></span> <span class='ocrx_word' id='word_1_214' title='bbox 665 1666 818 1693; x_wconf 84' lang='eng' dir='ltr'>(AF163120)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 203 189 205 234">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 203 189 205 234">
+     <span class='ocr_line' id='line_1_40' title="bbox 203 189 205 234; baseline 0 1499"><span class='ocrx_word' id='word_1_215' title='bbox 203 189 205 234; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 4 1727 109 1730">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 4 1727 109 1730">
+     <span class='ocr_line' id='line_1_41' title="bbox 4 1727 109 1730; baseline 0 3"><span class='ocrx_word' id='word_1_216' title='bbox 4 1727 109 1730; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003699-0-000.pbm.png b/examples/ijs.0.003699-0-000.pbm.png
new file mode 100644
index 00000000..5d4b2199
Binary files /dev/null and b/examples/ijs.0.003699-0-000.pbm.png differ
diff --git a/examples/ijs.0.003699-0-000.pbm.png.hocr b/examples/ijs.0.003699-0-000.pbm.png.hocr
new file mode 100644
index 00000000..35ab4dc9
--- /dev/null
+++ b/examples/ijs.0.003699-0-000.pbm.png.hocr
@@ -0,0 +1,214 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003699-0-000.pbm.png"; bbox 0 0 1542 1140; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 307 1 1540 1138">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 307 1 1540 1138">
+     <span class='ocr_line' id='line_1_1' title="bbox 798 1 1444 32; baseline -0.002 -6"><span class='ocrx_word' id='word_1_1' title='bbox 798 4 949 26; x_wconf 82' lang='eng' dir='ltr'>Geobaci/lus</span> <span class='ocrx_word' id='word_1_2' title='bbox 959 4 1118 32; x_wconf 81' lang='eng' dir='ltr'>kaustophi/us</span> <span class='ocrx_word' id='word_1_3' title='bbox 1129 4 1221 26; x_wconf 92' lang='eng' dir='ltr'>NCIMB</span> <span class='ocrx_word' id='word_1_4' title='bbox 1233 1 1312 26; x_wconf 88' lang='eng' dir='ltr'>8547T</span> <span class='ocrx_word' id='word_1_5' title='bbox 1321 1 1444 30; x_wconf 88' lang='eng' dir='ltr'>(X60618)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 813 36 1519 64; baseline 0 -4"><span class='ocrx_word' id='word_1_6' title='bbox 813 38 963 60; x_wconf 79' lang='eng' dir='ltr'>Geobacillus</span> <span class='ocrx_word' id='word_1_7' title='bbox 974 39 1184 60; x_wconf 81' lang='eng' dir='ltr'>thermoleovorans</span> <span class='ocrx_word' id='word_1_8' title='bbox 1194 38 1274 60; x_wconf 92' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_9' title='bbox 1284 36 1381 60; x_wconf 84' lang='eng' dir='ltr'>43513T</span> <span class='ocrx_word' id='word_1_10' title='bbox 1390 36 1519 64; x_wconf 88' lang='eng' dir='ltr'>(M77488)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 844 70 1365 99; baseline 0 -4"><span class='ocrx_word' id='word_1_11' title='bbox 844 73 995 95; x_wconf 75' lang='eng' dir='ltr'>Geobac/l/us</span> <span class='ocrx_word' id='word_1_12' title='bbox 1005 73 1125 95; x_wconf 76' lang='eng' dir='ltr'><em>lituanious</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1136 70 1195 95; x_wconf 76' lang='eng' dir='ltr'>N—3T</span> <span class='ocrx_word' id='word_1_14' title='bbox 1204 71 1365 99; x_wconf 89' lang='eng' dir='ltr'>(AYO44055)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 803 106 1278 134; baseline 0 -4"><span class='ocrx_word' id='word_1_15' title='bbox 803 108 961 130; x_wconf 77' lang='eng' dir='ltr'>‘Geobaci/Ius</span> <span class='ocrx_word' id='word_1_16' title='bbox 970 108 1064 130; x_wconf 78' lang='eng' dir='ltr'>za/ihae&#39;</span> <span class='ocrx_word' id='word_1_17' title='bbox 1075 108 1101 129; x_wconf 95' lang='eng' dir='ltr'>T1</span> <span class='ocrx_word' id='word_1_18' title='bbox 1118 106 1278 134; x_wconf 85' lang='eng' dir='ltr'>(AY166603)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 772 139 1263 168; baseline 0 -4"><span class='ocrx_word' id='word_1_19' title='bbox 772 142 922 164; x_wconf 83' lang='eng' dir='ltr'>Geobaci/lus</span> <span class='ocrx_word' id='word_1_20' title='bbox 934 142 1023 164; x_wconf 75' lang='eng' dir='ltr'>vulcan/</span> <span class='ocrx_word' id='word_1_21' title='bbox 1031 143 1083 164; x_wconf 74' lang='eng'>33—1</span> <span class='ocrx_word' id='word_1_22' title='bbox 1091 139 1101 154; x_wconf 70' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_23' title='bbox 1111 140 1263 168; x_wconf 76' lang='eng' dir='ltr'>(A1293805)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 828 174 1340 205; baseline 0 -6"><span class='ocrx_word' id='word_1_24' title='bbox 828 177 979 199; x_wconf 80' lang='eng' dir='ltr'>Geobaci/Ius</span> <span class='ocrx_word' id='word_1_25' title='bbox 988 177 1112 205; x_wconf 84' lang='eng' dir='ltr'>gargensis</span> <span class='ocrx_word' id='word_1_26' title='bbox 1122 174 1170 199; x_wconf 77' lang='eng' dir='ltr'>GaT</span> <span class='ocrx_word' id='word_1_27' title='bbox 1180 175 1340 203; x_wconf 85' lang='eng' dir='ltr'>(AY193888)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 733 209 1462 238; baseline 0 -5"><span class='ocrx_word' id='word_1_28' title='bbox 733 212 757 227; x_wconf 82' lang='eng'>94</span> <span class='ocrx_word' id='word_1_29' title='bbox 788 211 939 233; x_wconf 83' lang='eng' dir='ltr'>Geobaci/lus</span> <span class='ocrx_word' id='word_1_30' title='bbox 950 212 1184 233; x_wconf 73' lang='eng' dir='ltr'>thermocatenu/atus</span> <span class='ocrx_word' id='word_1_31' title='bbox 1194 211 1256 233; x_wconf 92' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_32' title='bbox 1269 209 1329 233; x_wconf 89' lang='eng' dir='ltr'>730T</span> <span class='ocrx_word' id='word_1_33' title='bbox 1339 209 1462 238; x_wconf 82' lang='eng'>(226926)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 800 244 1524 275; baseline 0 -7"><span class='ocrx_word' id='word_1_34' title='bbox 800 246 950 268; x_wconf 84' lang='eng' dir='ltr'>Geobaci/Ius</span> <span class='ocrx_word' id='word_1_35' title='bbox 960 247 1203 275; x_wconf 82' lang='eng' dir='ltr'>stearothermophi/us</span> <span class='ocrx_word' id='word_1_36' title='bbox 1215 246 1300 268; x_wconf 91' lang='eng' dir='ltr'>NCDO</span> <span class='ocrx_word' id='word_1_37' title='bbox 1314 248 1321 268; x_wconf 99' lang='eng'>1</span> <span class='ocrx_word' id='word_1_38' title='bbox 1331 244 1391 268; x_wconf 88' lang='eng' dir='ltr'>768T</span> <span class='ocrx_word' id='word_1_39' title='bbox 1400 244 1524 272; x_wconf 86' lang='eng' dir='ltr'>(X60840)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_9' title="bbox 590 278 1295 311; baseline 0 -9"><span class='ocrx_word' id='word_1_40' title='bbox 590 295 626 311; x_wconf 66' lang='eng'>100</span> <span class='ocrx_word' id='word_1_41' title='bbox 723 280 910 302; x_wconf 85' lang='eng' dir='ltr'>—Geobacillus</span> <span class='ocrx_word' id='word_1_42' title='bbox 916 281 1048 309; x_wconf 81' lang='eng' dir='ltr'>jurass/cus</span> <span class='ocrx_word' id='word_1_43' title='bbox 1058 278 1125 302; x_wconf 83' lang='eng' dir='ltr'>D81T</span> <span class='ocrx_word' id='word_1_44' title='bbox 1135 278 1210 307; x_wconf 84' lang='eng' dir='ltr'>(AY31</span> <span class='ocrx_word' id='word_1_45' title='bbox 1219 278 1295 306; x_wconf 87' lang='eng'>2404)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 690 313 1291 341; baseline 0 -4"><span class='ocrx_word' id='word_1_46' title='bbox 690 316 714 331; x_wconf 78' lang='eng'>99</span> <span class='ocrx_word' id='word_1_47' title='bbox 795 315 946 337; x_wconf 83' lang='eng' dir='ltr'>Geobacil/us</span> <span class='ocrx_word' id='word_1_48' title='bbox 957 316 1083 337; x_wconf 84' lang='eng' dir='ltr'><em>uzenensis</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1094 313 1124 337; x_wconf 74' lang='eng' dir='ltr'>UT</span> <span class='ocrx_word' id='word_1_50' title='bbox 1133 313 1291 341; x_wconf 85' lang='eng' dir='ltr'>(AF276304)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_11' title="bbox 628 347 1265 379; baseline 0 -7"><span class='ocrx_word' id='word_1_51' title='bbox 628 359 705 379; x_wconf 73' lang='eng'>_,—</span> <span class='ocrx_word' id='word_1_52' title='bbox 717 350 868 372; x_wconf 82' lang='eng' dir='ltr'>Geobaci/lus</span> <span class='ocrx_word' id='word_1_53' title='bbox 878 350 1043 372; x_wconf 86' lang='eng' dir='ltr'>subterraneus</span> <span class='ocrx_word' id='word_1_54' title='bbox 1053 347 1098 372; x_wconf 83' lang='eng' dir='ltr'>34T</span> <span class='ocrx_word' id='word_1_55' title='bbox 1107 348 1265 376; x_wconf 86' lang='eng' dir='ltr'>(AF276306)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 628 382 1413 411; baseline 0 -5"><span class='ocrx_word' id='word_1_56' title='bbox 628 385 652 401; x_wconf 83' lang='eng'>90</span> <span class='ocrx_word' id='word_1_57' title='bbox 731 385 882 407; x_wconf 83' lang='eng' dir='ltr'>Geobaci/lus</span> <span class='ocrx_word' id='word_1_58' title='bbox 893 385 1135 407; x_wconf 81' lang='eng' dir='ltr'>thermodenitrificans</span> <span class='ocrx_word' id='word_1_59' title='bbox 1146 385 1208 407; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_60' title='bbox 1219 382 1281 407; x_wconf 87' lang='eng' dir='ltr'>465T</span> <span class='ocrx_word' id='word_1_61' title='bbox 1290 383 1413 411; x_wconf 86' lang='eng' dir='ltr'>(Z26928)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 674 416 1312 448; baseline 0 -7"><span class='ocrx_word' id='word_1_62' title='bbox 674 419 825 441; x_wconf 83' lang='eng' dir='ltr'>Geobaci/lus</span> <span class='ocrx_word' id='word_1_63' title='bbox 835 419 1035 448; x_wconf 73' lang='eng' dir='ltr'>ca/doxy/o/yticus</span> <span class='ocrx_word' id='word_1_64' title='bbox 1045 419 1110 441; x_wconf 80' lang='eng'>8181</span> <span class='ocrx_word' id='word_1_65' title='bbox 1119 416 1145 441; x_wconf 60' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_66' title='bbox 1154 417 1312 445; x_wconf 85' lang='eng' dir='ltr'>(AF067651)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 664 451 1418 482; baseline -0.001 -6"><span class='ocrx_word' id='word_1_67' title='bbox 664 454 815 476; x_wconf 82' lang='eng' dir='ltr'>Geobaci/lus</span> <span class='ocrx_word' id='word_1_68' title='bbox 826 454 1088 482; x_wconf 84' lang='eng' dir='ltr'>thermog/ucosidasius</span> <span class='ocrx_word' id='word_1_69' title='bbox 1098 454 1177 476; x_wconf 90' lang='eng' dir='ltr'>ATCC</span> <span class='ocrx_word' id='word_1_70' title='bbox 1188 451 1285 476; x_wconf 87' lang='eng' dir='ltr'>43742T</span> <span class='ocrx_word' id='word_1_71' title='bbox 1294 451 1418 480; x_wconf 89' lang='eng' dir='ltr'>(X60641)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 649 486 1133 515; baseline -0.002 -4"><span class='ocrx_word' id='word_1_72' title='bbox 649 488 800 511; x_wconf 85' lang='eng' dir='ltr'>Geobacillus</span> <span class='ocrx_word' id='word_1_73' title='bbox 811 489 881 511; x_wconf 78' lang='eng' dir='ltr'>toebii</span> <span class='ocrx_word' id='word_1_74' title='bbox 889 486 965 511; x_wconf 81' lang='eng' dir='ltr'>SK-1T</span> <span class='ocrx_word' id='word_1_75' title='bbox 975 486 1133 515; x_wconf 87' lang='eng' dir='ltr'>(AF326278)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 1091 521 1540 550; baseline 0 -5"><span class='ocrx_word' id='word_1_76' title='bbox 1091 523 1242 545; x_wconf 82' lang='eng' dir='ltr'>Geabaci/Ius</span> <span class='ocrx_word' id='word_1_77' title='bbox 1253 524 1335 545; x_wconf 79' lang='eng' dir='ltr'>deb/[is</span> <span class='ocrx_word' id='word_1_78' title='bbox 1344 521 1378 545; x_wconf 76' lang='eng' dir='ltr'>TfT</span> <span class='ocrx_word' id='word_1_79' title='bbox 1388 521 1540 550; x_wconf 88' lang='eng' dir='ltr'>(AJ564616)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 566 555 1210 586; baseline 0 -7"><span class='ocrx_word' id='word_1_80' title='bbox 566 558 743 586; x_wconf 75' lang='eng' dir='ltr'>Anoxybacil/us</span> <span class='ocrx_word' id='word_1_81' title='bbox 753 558 867 586; x_wconf 85' lang='eng' dir='ltr'><em>rupiensis</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 878 558 940 580; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_83' title='bbox 953 559 960 579; x_wconf 98' lang='eng'>1</span> <span class='ocrx_word' id='word_1_84' title='bbox 970 559 995 579; x_wconf 92' lang='eng'>71</span> <span class='ocrx_word' id='word_1_85' title='bbox 1004 555 1048 579; x_wconf 92' lang='eng' dir='ltr'>27T</span> <span class='ocrx_word' id='word_1_86' title='bbox 1058 556 1210 584; x_wconf 85' lang='eng' dir='ltr'>(AJ879076)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 545 590 1149 621; baseline 0 -7"><span class='ocrx_word' id='word_1_87' title='bbox 545 592 696 614; x_wconf 82' lang='eng' dir='ltr'>Geobacillus</span> <span class='ocrx_word' id='word_1_88' title='bbox 707 593 852 621; x_wconf 80' lang='eng' dir='ltr'><em>tepidamans</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 862 590 979 614; x_wconf 88' lang='eng' dir='ltr'>GS5-97T</span> <span class='ocrx_word' id='word_1_90' title='bbox 989 590 1149 619; x_wconf 83' lang='eng' dir='ltr'>(AY563003)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 521 625 1331 656; baseline 0 -7"><span class='ocrx_word' id='word_1_91' title='bbox 521 635 545 650; x_wconf 80' lang='eng'>92</span> <span class='ocrx_word' id='word_1_92' title='bbox 641 627 818 656; x_wconf 74' lang='eng' dir='ltr'>Anoxybaci/lus</span> <span class='ocrx_word' id='word_1_93' title='bbox 828 627 990 649; x_wconf 80' lang='eng' dir='ltr'>contaminans</span> <span class='ocrx_word' id='word_1_94' title='bbox 1000 627 1061 649; x_wconf 85' lang='eng' dir='ltr'>LMG</span> <span class='ocrx_word' id='word_1_95' title='bbox 1073 625 1169 649; x_wconf 88' lang='eng' dir='ltr'>21881T</span> <span class='ocrx_word' id='word_1_96' title='bbox 1179 625 1263 653; x_wconf 77' lang='eng' dir='ltr'>(A1551</span> <span class='ocrx_word' id='word_1_97' title='bbox 1271 625 1331 653; x_wconf 88' lang='eng'>330)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 307 636 1200 708; baseline 0.002 -26"><span class='ocrx_word' id='word_1_98' title='bbox 307 680 331 696; x_wconf 75' lang='eng'>80</span> <span class='ocrx_word' id='word_1_99' title='bbox 434 636 741 708; x_wconf 42' lang='eng' dir='ltr'>iﬂybacﬂ/us</span> <span class='ocrx_word' id='word_1_100' title='bbox 753 662 936 684; x_wconf 82' lang='eng' dir='ltr'>voinovskiensis</span> <span class='ocrx_word' id='word_1_101' title='bbox 945 659 1028 684; x_wconf 90' lang='eng' dir='ltr'>TH13T</span> <span class='ocrx_word' id='word_1_102' title='bbox 1038 660 1097 688; x_wconf 92' lang='eng' dir='ltr'>(AB1</span> <span class='ocrx_word' id='word_1_103' title='bbox 1108 660 1200 688; x_wconf 93' lang='eng'>10008)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 588 694 1196 725; baseline 0 -7"><span class='ocrx_word' id='word_1_104' title='bbox 588 697 765 725; x_wconf 73' lang='eng' dir='ltr'><em>Anoxybacil/us</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 774 697 930 725; x_wconf 75' lang='eng' dir='ltr'>amylo/yticus</span> <span class='ocrx_word' id='word_1_106' title='bbox 941 694 1034 718; x_wconf 83' lang='eng' dir='ltr'>MR3CT</span> <span class='ocrx_word' id='word_1_107' title='bbox 1044 694 1196 722; x_wconf 86' lang='eng' dir='ltr'>(AJ618979)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 682 728 1490 759; baseline -0.002 -5"><span class='ocrx_word' id='word_1_108' title='bbox 682 739 705 754; x_wconf 80' lang='eng'>54</span> <span class='ocrx_word' id='word_1_109' title='bbox 714 736 878 754; x_wconf 81' lang='eng'>[—</span> <span class='ocrx_word' id='word_1_110' title='bbox 888 731 1065 759; x_wconf 79' lang='eng' dir='ltr'>Anoxybaci/lus</span> <span class='ocrx_word' id='word_1_111' title='bbox 1075 731 1265 753; x_wconf 83' lang='eng' dir='ltr'>kestanbolensis</span> <span class='ocrx_word' id='word_1_112' title='bbox 1275 728 1320 752; x_wconf 93' lang='eng' dir='ltr'>K4T</span> <span class='ocrx_word' id='word_1_113' title='bbox 1330 729 1457 757; x_wconf 89' lang='eng' dir='ltr'>(AY24871</span> <span class='ocrx_word' id='word_1_114' title='bbox 1467 729 1490 757; x_wconf 94' lang='eng'>1)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 392 763 1461 794; baseline 0 -7"><span class='ocrx_word' id='word_1_115' title='bbox 392 765 416 781; x_wconf 76' lang='eng'>58</span> <span class='ocrx_word' id='word_1_116' title='bbox 669 765 693 780; x_wconf 76' lang='eng'>9’5</span> <span class='ocrx_word' id='word_1_117' title='bbox 857 766 1034 794; x_wconf 77' lang='eng' dir='ltr'>Anoxybacillus</span> <span class='ocrx_word' id='word_1_118' title='bbox 1043 766 1244 794; x_wconf 83' lang='eng' dir='ltr'>pushchinoensis</span> <span class='ocrx_word' id='word_1_119' title='bbox 1254 766 1282 787; x_wconf 94' lang='eng' dir='ltr'>K1</span> <span class='ocrx_word' id='word_1_120' title='bbox 1289 763 1299 777; x_wconf 71' lang='eng' dir='ltr'>T</span> <span class='ocrx_word' id='word_1_121' title='bbox 1310 763 1461 792; x_wconf 85' lang='eng' dir='ltr'>(AJ010478)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 714 798 1350 829; baseline 0 -7"><span class='ocrx_word' id='word_1_122' title='bbox 714 801 891 829; x_wconf 71' lang='eng' dir='ltr'><em>Anoxybaci/lus</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 902 800 1054 822; x_wconf 80' lang='eng' dir='ltr'>flavithermus</span> <span class='ocrx_word' id='word_1_124' title='bbox 1065 800 1127 822; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_125' title='bbox 1139 798 1218 822; x_wconf 74' lang='eng' dir='ltr'>2641T</span> <span class='ocrx_word' id='word_1_126' title='bbox 1227 798 1350 827; x_wconf 86' lang='eng' dir='ltr'>(Z26932)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 735 832 1320 863; baseline 0.002 -7"><span class='ocrx_word' id='word_1_127' title='bbox 735 835 912 863; x_wconf 81' lang='eng' dir='ltr'>Anoxybaci/lus</span> <span class='ocrx_word' id='word_1_128' title='bbox 922 835 1058 863; x_wconf 83' lang='eng' dir='ltr'>ayderensis</span> <span class='ocrx_word' id='word_1_129' title='bbox 1068 832 1153 857; x_wconf 79' lang='eng' dir='ltr'>ABO4T</span> <span class='ocrx_word' id='word_1_130' title='bbox 1162 832 1320 861; x_wconf 86' lang='eng' dir='ltr'>(AFOO1963)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 722 867 1444 898; baseline 0 -7"><span class='ocrx_word' id='word_1_131' title='bbox 722 870 899 898; x_wconf 69' lang='eng' dir='ltr'>Anoxybacil/us</span> <span class='ocrx_word' id='word_1_132' title='bbox 909 870 1096 891; x_wconf 80' lang='eng' dir='ltr'><em>kamchatkensis</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 1106 867 1277 891; x_wconf 78' lang='eng' dir='ltr'>JW/VK-KG4T</span> <span class='ocrx_word' id='word_1_134' title='bbox 1286 867 1444 896; x_wconf 89' lang='eng' dir='ltr'>(AF510985)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 712 902 1043 931; baseline 0 -5"><span class='ocrx_word' id='word_1_135' title='bbox 712 904 789 926; x_wconf 89' lang='eng' dir='ltr'>Strain</span> <span class='ocrx_word' id='word_1_136' title='bbox 802 905 868 926; x_wconf 90' lang='eng' dir='ltr'>DR01</span> <span class='ocrx_word' id='word_1_137' title='bbox 884 902 1043 931; x_wconf 83' lang='eng' dir='ltr'>(EU621359)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 706 937 1038 965; baseline 0 -4"><span class='ocrx_word' id='word_1_138' title='bbox 706 939 783 961; x_wconf 88' lang='eng' dir='ltr'>Strain</span> <span class='ocrx_word' id='word_1_139' title='bbox 796 940 867 961; x_wconf 89' lang='eng' dir='ltr'>DR02</span> <span class='ocrx_word' id='word_1_140' title='bbox 878 937 1038 965; x_wconf 80' lang='eng' dir='ltr'>(EU621360)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_29' title="bbox 717 972 1049 1000; baseline 0 -4"><span class='ocrx_word' id='word_1_141' title='bbox 717 974 795 996; x_wconf 88' lang='eng' dir='ltr'>Strain</span> <span class='ocrx_word' id='word_1_142' title='bbox 808 974 879 996; x_wconf 86' lang='eng' dir='ltr'>DR04</span> <span class='ocrx_word' id='word_1_143' title='bbox 890 972 1049 1000; x_wconf 84' lang='eng' dir='ltr'>(EU621362)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 667 1006 1325 1037; baseline 0 -7"><span class='ocrx_word' id='word_1_144' title='bbox 667 1011 690 1026; x_wconf 80' lang='eng'>62</span> <span class='ocrx_word' id='word_1_145' title='bbox 793 1008 969 1037; x_wconf 73' lang='eng' dir='ltr'>Anoxybaci/lus</span> <span class='ocrx_word' id='word_1_146' title='bbox 979 1008 1094 1037; x_wconf 86' lang='eng' dir='ltr'>gonensis</span> <span class='ocrx_word' id='word_1_147' title='bbox 1104 1006 1155 1030; x_wconf 79' lang='eng' dir='ltr'>G2T</span> <span class='ocrx_word' id='word_1_148' title='bbox 1165 1006 1222 1034; x_wconf 90' lang='eng' dir='ltr'>(AY1</span> <span class='ocrx_word' id='word_1_149' title='bbox 1231 1006 1325 1034; x_wconf 88' lang='eng'>22325)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 548 1041 880 1069; baseline 0 -4"><span class='ocrx_word' id='word_1_150' title='bbox 548 1043 626 1065; x_wconf 86' lang='eng' dir='ltr'>Strain</span> <span class='ocrx_word' id='word_1_151' title='bbox 639 1044 710 1065; x_wconf 89' lang='eng' dir='ltr'><strong>DRO3</strong></span> <span class='ocrx_word' id='word_1_152' title='bbox 721 1041 880 1069; x_wconf 84' lang='eng' dir='ltr'>(EU621361)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 490 1075 1119 1106; baseline 0 -7"><span class='ocrx_word' id='word_1_153' title='bbox 490 1080 526 1095; x_wconf 84' lang='eng'>100</span> <span class='ocrx_word' id='word_1_154' title='bbox 566 1077 716 1099; x_wconf 80' lang='eng' dir='ltr'>Geobacillus</span> <span class='ocrx_word' id='word_1_155' title='bbox 725 1078 823 1106; x_wconf 81' lang='eng' dir='ltr'>pal/idus</span> <span class='ocrx_word' id='word_1_156' title='bbox 834 1077 896 1099; x_wconf 89' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_157' title='bbox 907 1075 987 1099; x_wconf 74' lang='eng' dir='ltr'>3670T</span> <span class='ocrx_word' id='word_1_158' title='bbox 996 1075 1119 1103; x_wconf 84' lang='eng' dir='ltr'>(Z26930)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 501 1109 1020 1138; baseline 0.002 -5"><span class='ocrx_word' id='word_1_159' title='bbox 501 1112 601 1134; x_wconf 83' lang='eng' dir='ltr'>Bacillus</span> <span class='ocrx_word' id='word_1_160' title='bbox 611 1112 700 1134; x_wconf 78' lang='eng' dir='ltr'>subti/is</span> <span class='ocrx_word' id='word_1_161' title='bbox 711 1112 797 1134; x_wconf 87' lang='eng' dir='ltr'>NCDO</span> <span class='ocrx_word' id='word_1_162' title='bbox 810 1109 888 1134; x_wconf 76' lang='eng' dir='ltr'>1769T</span> <span class='ocrx_word' id='word_1_163' title='bbox 897 1110 1020 1138; x_wconf 84' lang='eng' dir='ltr'>(X60646)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 664 9 838 260">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 664 9 838 260">
+     <span class='ocr_line' id='line_1_34' title="bbox 715 9 838 92; baseline 0 0"><span class='ocrx_word' id='word_1_164' title='bbox 715 9 838 92; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 692 92 820 195; baseline 0 -13"><span class='ocrx_word' id='word_1_165' title='bbox 692 92 820 195; x_wconf 95' lang='eng' dir='ltr'>    </span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 664 195 733 260; baseline -0.116 0"><span class='ocrx_word' id='word_1_166' title='bbox 664 195 733 260; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 703 87 726 103">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 703 87 726 103">
+     <span class='ocr_line' id='line_1_37' title="bbox 703 87 726 103; baseline 0 0"><span class='ocrx_word' id='word_1_167' title='bbox 703 87 726 103; x_wconf 84' lang='eng'>69</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 666 184 689 199">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 666 184 689 199">
+     <span class='ocr_line' id='line_1_38' title="bbox 666 184 689 199; baseline 0 0"><span class='ocrx_word' id='word_1_168' title='bbox 666 184 689 199; x_wconf 83' lang='eng'>76</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 151 236 654 286">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 151 236 654 286">
+     <span class='ocr_line' id='line_1_39' title="bbox 151 236 654 256; baseline 0 0"><span class='ocrx_word' id='word_1_169' title='bbox 151 244 217 256; x_wconf 74' lang='eng'>1—1</span> <span class='ocrx_word' id='word_1_170' title='bbox 631 236 654 251; x_wconf 77' lang='eng'>87</span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 157 270 211 286; baseline 0 0"><span class='ocrx_word' id='word_1_171' title='bbox 157 270 211 286; x_wconf 86' lang='eng'>0.005</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 627 254 789 258">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 627 254 789 258">
+     <span class='ocr_line' id='line_1_41' title="bbox 627 254 789 258; baseline 0 882"><span class='ocrx_word' id='word_1_172' title='bbox 627 254 789 258; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 662 307 723 309">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 662 307 723 309">
+     <span class='ocr_line' id='line_1_42' title="bbox 662 307 723 309; baseline 0 831"><span class='ocrx_word' id='word_1_173' title='bbox 662 307 723 309; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 721 290 723 326">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 721 290 723 326">
+     <span class='ocr_line' id='line_1_43' title="bbox 721 290 723 326; baseline 0 814"><span class='ocrx_word' id='word_1_174' title='bbox 721 290 723 326; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 722 324 784 326">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 722 324 784 326">
+     <span class='ocr_line' id='line_1_44' title="bbox 722 324 784 326; baseline 0 814"><span class='ocrx_word' id='word_1_175' title='bbox 722 324 784 326; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 290 313 1085 539">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 290 313 1085 539">
+     <span class='ocr_line' id='line_1_45' title="bbox 453 313 631 390; baseline 0 -52"><span class='ocrx_word' id='word_1_176' title='bbox 453 313 631 390; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_46' title="bbox 290 390 670 436; baseline 0 0"><span class='ocrx_word' id='word_1_177' title='bbox 290 390 670 436; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_47' title="bbox 453 436 662 497; baseline 0 -33"><span class='ocrx_word' id='word_1_178' title='bbox 453 436 662 497; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_48' title="bbox 453 497 1085 539; baseline 0 0"><span class='ocrx_word' id='word_1_179' title='bbox 453 497 1085 539; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 627 256 629 378">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 627 256 629 378">
+     <span class='ocr_line' id='line_1_49' title="bbox 627 256 629 378; baseline 0 762"><span class='ocrx_word' id='word_1_180' title='bbox 627 256 629 378; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 660 206 665 396">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 660 206 665 396">
+     <span class='ocr_line' id='line_1_50' title="bbox 660 206 665 396; baseline 0 744"><span class='ocrx_word' id='word_1_181' title='bbox 660 206 665 396; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 661 394 726 396">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 661 394 726 396">
+     <span class='ocr_line' id='line_1_51' title="bbox 661 394 726 396; baseline 0 744"><span class='ocrx_word' id='word_1_182' title='bbox 661 394 726 396; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 262 526 285 541">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 262 526 285 541">
+     <span class='ocr_line' id='line_1_52' title="bbox 262 526 285 541; baseline 0 0"><span class='ocrx_word' id='word_1_183' title='bbox 262 526 285 541; x_wconf 85' lang='eng'>78</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 292 424 294 669">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 292 424 294 669">
+     <span class='ocr_line' id='line_1_53' title="bbox 292 424 294 669; baseline 0 471"><span class='ocrx_word' id='word_1_184' title='bbox 292 424 294 669; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 435 774 788 1024">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 637 844 788 1024">
+     <span class='ocr_line' id='line_1_54' title="bbox 637 844 729 888; baseline 0 0"><span class='ocrx_word' id='word_1_185' title='bbox 637 844 729 888; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 637 888 712 913; baseline 0 227"><span class='ocrx_word' id='word_1_186' title='bbox 637 888 712 913; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+     <span class='ocr_line' id='line_1_56' title="bbox 666 913 702 948; baseline 0.25 -6"><span class='ocrx_word' id='word_1_187' title='bbox 666 913 702 948; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_57' title="bbox 678 948 706 979; baseline 0.071 -2"><span class='ocrx_word' id='word_1_188' title='bbox 678 948 706 979; x_wconf 95' lang='eng' dir='ltr'>  </span> 
+     </span>
+     <span class='ocr_line' id='line_1_58' title="bbox 689 979 788 1024; baseline 0 -20"><span class='ocrx_word' id='word_1_189' title='bbox 689 979 788 1024; x_wconf 95' lang='eng' dir='ltr'>   </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 432 679 434 830">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 432 679 434 830">
+     <span class='ocr_line' id='line_1_59' title="bbox 432 679 434 830; baseline 0 310"><span class='ocrx_word' id='word_1_190' title='bbox 432 679 434 830; x_wconf 95' lang='eng' dir='ltr'> </span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 596 840 632 856">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 596 840 632 856">
+     <span class='ocr_line' id='line_1_60' title="bbox 596 840 632 856; baseline 0 0"><span class='ocrx_word' id='word_1_191' title='bbox 596 840 632 856; x_wconf 91' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 654 955 678 970">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 654 955 678 970">
+     <span class='ocr_line' id='line_1_61' title="bbox 654 955 678 970; baseline 0 0"><span class='ocrx_word' id='word_1_192' title='bbox 654 955 678 970; x_wconf 83' lang='eng'><em>83</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003723-0-000.pbm.png b/examples/ijs.0.003723-0-000.pbm.png
new file mode 100644
index 00000000..5fe74530
Binary files /dev/null and b/examples/ijs.0.003723-0-000.pbm.png differ
diff --git a/examples/ijs.0.003723-0-000.pbm.png.hocr b/examples/ijs.0.003723-0-000.pbm.png.hocr
new file mode 100644
index 00000000..e911a6d3
--- /dev/null
+++ b/examples/ijs.0.003723-0-000.pbm.png.hocr
@@ -0,0 +1,214 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003723-0-000.pbm.png"; bbox 0 0 1300 477; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 3 334 52 336">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 3 334 52 336">
+     <span class='ocr_line' id='line_1_1' title="bbox 3 334 52 336; baseline 0 141"><span class='ocrx_word' id='word_1_1' title='bbox 3 334 52 336; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 1 334 3 462">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 1 334 3 462">
+     <span class='ocr_line' id='line_1_2' title="bbox 1 334 3 462; baseline 0 15"><span class='ocrx_word' id='word_1_2' title='bbox 1 334 3 462; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 82 33 134 49">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 82 33 134 49">
+     <span class='ocr_line' id='line_1_3' title="bbox 82 33 134 49; baseline 0 0"><span class='ocrx_word' id='word_1_3' title='bbox 82 33 134 49; x_wconf 86' lang='eng'>0.005</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 56 228 89 244">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 56 228 89 244">
+     <span class='ocr_line' id='line_1_4' title="bbox 56 228 89 244; baseline 0 0"><span class='ocrx_word' id='word_1_4' title='bbox 56 228 89 244; x_wconf 88' lang='eng'>100</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 494 1 1232 27">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 494 1 1232 27">
+     <span class='ocr_line' id='line_1_5' title="bbox 494 1 1232 27; baseline 0 -5"><span class='ocrx_word' id='word_1_5' title='bbox 494 12 502 14; x_wconf 98' lang='eng'><em>-</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 511 3 665 22; x_wconf 81' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 674 3 774 22; x_wconf 85' lang='eng' dir='ltr'><em>mutabi/is</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 783 3 855 27; x_wconf 85' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 866 3 966 22; x_wconf 81' lang='eng' dir='ltr'><em>mutabi/is</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 975 3 1028 22; x_wconf 89' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1037 1 1119 22; x_wconf 80' lang='eng' dir='ltr'><em>43853T</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1128 3 1232 27; x_wconf 85' lang='eng' dir='ltr'>(X76966)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 382 32 494 34">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 382 32 494 34">
+     <span class='ocr_line' id='line_1_6' title="bbox 382 32 494 34; baseline 0 443"><span class='ocrx_word' id='word_1_13' title='bbox 382 32 494 34; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 492 12 494 55">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 492 12 494 55">
+     <span class='ocr_line' id='line_1_7' title="bbox 492 12 494 55; baseline 0 422"><span class='ocrx_word' id='word_1_14' title='bbox 492 12 494 55; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 494 53 558 55">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 494 53 558 55">
+     <span class='ocr_line' id='line_1_8' title="bbox 494 53 558 55; baseline 0 422"><span class='ocrx_word' id='word_1_15' title='bbox 494 53 558 55; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 334 63 383 65">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 334 63 383 65">
+     <span class='ocr_line' id='line_1_9' title="bbox 334 63 383 65; baseline 0 412"><span class='ocrx_word' id='word_1_16' title='bbox 334 63 383 65; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 382 32 383 95">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 382 32 383 95">
+     <span class='ocr_line' id='line_1_10' title="bbox 382 32 383 95; baseline 0 382"><span class='ocrx_word' id='word_1_17' title='bbox 382 32 383 95; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 281 109 336 111">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 281 109 336 111">
+     <span class='ocr_line' id='line_1_11' title="bbox 281 109 336 111; baseline 0 366"><span class='ocrx_word' id='word_1_18' title='bbox 281 109 336 111; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 281 109 282 237">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 281 109 282 237">
+     <span class='ocr_line' id='line_1_12' title="bbox 281 109 282 237; baseline 0 240"><span class='ocrx_word' id='word_1_19' title='bbox 281 109 282 237; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 334 63 336 156">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 334 63 336 156">
+     <span class='ocr_line' id='line_1_13' title="bbox 334 63 336 156; baseline 0 321"><span class='ocrx_word' id='word_1_20' title='bbox 334 63 336 156; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 345 134 347 177">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 345 134 347 177">
+     <span class='ocr_line' id='line_1_14' title="bbox 345 134 347 177; baseline 0 300"><span class='ocrx_word' id='word_1_21' title='bbox 345 134 347 177; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 316 13 1299 230">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 316 13 1299 230">
+     <span class='ocr_line' id='line_1_15' title="bbox 385 13 471 29; baseline 0 0"><span class='ocrx_word' id='word_1_22' title='bbox 385 13 418 29; x_wconf 86' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 464 16 471 22; x_wconf 48' lang='eng'>&#39;</span> 
+     </span>
+     <span class='ocr_line' id='line_1_16' title="bbox 336 31 1299 68; baseline 0 -5"><span class='ocrx_word' id='word_1_24' title='bbox 336 43 358 59; x_wconf 85' lang='eng'>70</span> <span class='ocrx_word' id='word_1_25' title='bbox 367 31 374 37; x_wconf 38' lang='eng'><strong><em>‘</em></strong></span> <span class='ocrx_word' id='word_1_26' title='bbox 568 44 723 63; x_wconf 72' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 731 44 832 63; x_wconf 74' lang='eng' dir='ltr'><em>mutabi/is</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 840 44 912 68; x_wconf 84' lang='eng' dir='ltr'><em>subsp.</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 923 44 1034 68; x_wconf 85' lang='eng' dir='ltr'><em>capreo/us</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1043 44 1096 63; x_wconf 87' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1105 42 1187 63; x_wconf 88' lang='eng' dir='ltr'><em>40225T</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 1196 44 1299 68; x_wconf 85' lang='eng' dir='ltr'>(X76965)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_17' title="bbox 316 82 1127 108; baseline 0.002 -7"><span class='ocrx_word' id='word_1_33' title='bbox 316 95 323 101; x_wconf 60' lang='eng'><strong>,</strong></span> <span class='ocrx_word' id='word_1_34' title='bbox 383 93 502 95; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_35' title='bbox 512 84 667 103; x_wconf 82' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 676 84 819 108; x_wconf 85' lang='eng' dir='ltr'><em>espanaensis</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 828 84 895 103; x_wconf 90' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_38' title='bbox 906 82 985 103; x_wconf 81' lang='eng' dir='ltr'><em>15764T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 994 84 1127 108; x_wconf 89' lang='eng' dir='ltr'><em>(AF114807)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 653 123 1271 149; baseline 0 -5"><span class='ocrx_word' id='word_1_40' title='bbox 653 125 808 144; x_wconf 81' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_41' title='bbox 817 125 937 144; x_wconf 79' lang='eng' dir='ltr'><em>texasensis</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 946 125 1014 144; x_wconf 87' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_43' title='bbox 1023 125 1085 144; x_wconf 84' lang='eng' dir='ltr'>B-161</span> <span class='ocrx_word' id='word_1_44' title='bbox 1091 123 1128 144; x_wconf 83' lang='eng' dir='ltr'><em>34T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1138 125 1271 149; x_wconf 87' lang='eng' dir='ltr'>(AF114814)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_19' title="bbox 329 154 1291 190; baseline 0 -5"><span class='ocrx_word' id='word_1_46' title='bbox 329 154 673 177; x_wconf 37' lang='eng' dir='ltr'><em>CW</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 681 166 852 185; x_wconf 84' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 860 166 1018 185; x_wconf 86' lang='eng' dir='ltr'><em>violaceirubra</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1026 166 1059 185; x_wconf 98' lang='eng' dir='ltr'>YU</span> <span class='ocrx_word' id='word_1_50' title='bbox 1069 164 1144 185; x_wconf 83' lang='eng' dir='ltr'><em>692-1T</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 1153 166 1291 190; x_wconf 77' lang='eng' dir='ltr'><em>(A8284261)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 350 204 1070 230; baseline -0.001 -4"><span class='ocrx_word' id='word_1_52' title='bbox 350 222 357 229; x_wconf 44' lang='eng'><em>*</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 365 216 422 218; x_wconf 77' lang='eng'><em>-——</em></span> <span class='ocrx_word' id='word_1_54' title='bbox 431 206 585 226; x_wconf 77' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 594 207 736 226; x_wconf 81' lang='eng' dir='ltr'><em>australiensis</em></span> <span class='ocrx_word' id='word_1_56' title='bbox 745 207 813 225; x_wconf 88' lang='eng' dir='ltr'><em>NRRL</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 822 204 928 226; x_wconf 78' lang='eng' dir='ltr'><em>B-11239T</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 937 207 1070 230; x_wconf 83' lang='eng' dir='ltr'><em>(AF114803)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 281 236 365 237">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 281 236 365 237">
+     <span class='ocr_line' id='line_1_21' title="bbox 281 236 365 237; baseline 0 240"><span class='ocrx_word' id='word_1_59' title='bbox 281 236 365 237; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 282 242 305 258">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 282 242 305 258">
+     <span class='ocr_line' id='line_1_22' title="bbox 282 242 305 258; baseline 0 0"><span class='ocrx_word' id='word_1_60' title='bbox 282 242 305 258; x_wconf 88' lang='eng'>96</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 53 250 268 252">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 53 250 268 252">
+     <span class='ocr_line' id='line_1_23' title="bbox 53 250 268 252; baseline 0 225"><span class='ocrx_word' id='word_1_61' title='bbox 53 250 268 252; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 53 250 55 421">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 53 250 55 421">
+     <span class='ocr_line' id='line_1_24' title="bbox 53 250 55 421; baseline 0 56"><span class='ocrx_word' id='word_1_62' title='bbox 53 250 55 421; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 267 173 268 329">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 267 173 268 329">
+     <span class='ocr_line' id='line_1_25' title="bbox 267 173 268 329; baseline 0 148"><span class='ocrx_word' id='word_1_63' title='bbox 267 173 268 329; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 363 216 365 258">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 363 216 365 258">
+     <span class='ocr_line' id='line_1_26' title="bbox 363 216 365 258; baseline 0 219"><span class='ocrx_word' id='word_1_64' title='bbox 363 216 365 258; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 406 245 1137 312">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 406 245 1137 312">
+     <span class='ocr_line' id='line_1_27' title="bbox 516 245 1137 272; baseline 0 -6"><span class='ocrx_word' id='word_1_65' title='bbox 516 247 671 266; x_wconf 75' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 680 247 801 272; x_wconf 83' lang='eng' dir='ltr'><em>algeriensis</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 811 247 878 266; x_wconf 88' lang='eng' dir='ltr'><em>NRRL</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 888 245 993 266; x_wconf 88' lang='eng' dir='ltr'><em>B-24137T</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1003 247 1137 271; x_wconf 85' lang='eng' dir='ltr'><em>(AY054972)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 406 286 1042 312; baseline 0 -6"><span class='ocrx_word' id='word_1_70' title='bbox 406 288 560 307; x_wconf 74' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 568 288 715 312; x_wconf 81' lang='eng' dir='ltr'><em>xinjiangensis</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 725 288 794 307; x_wconf 91' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 805 286 898 307; x_wconf 78' lang='eng' dir='ltr'><em>101911T</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 908 288 1042 312; x_wconf 77' lang='eng' dir='ltr'><em>(A8381939)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 309 297 397 299">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 309 297 397 299">
+     <span class='ocr_line' id='line_1_29' title="bbox 309 297 397 299; baseline 0 178"><span class='ocrx_word' id='word_1_75' title='bbox 309 297 397 299; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 267 328 309 329">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 267 328 309 329">
+     <span class='ocr_line' id='line_1_30' title="bbox 267 328 309 329; baseline 0 148"><span class='ocrx_word' id='word_1_76' title='bbox 267 328 309 329; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 498 326 1092 353">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 498 326 1092 353">
+     <span class='ocr_line' id='line_1_31' title="bbox 498 326 1092 353; baseline 0 -6"><span class='ocrx_word' id='word_1_77' title='bbox 498 328 653 347; x_wconf 78' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 662 329 757 353; x_wconf 87' lang='eng' dir='ltr'><em>syringae</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 767 328 834 347; x_wconf 91' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_80' title='bbox 844 326 949 347; x_wconf 80' lang='eng' dir='ltr'><em>B-16468T</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 959 328 1092 352; x_wconf 89' lang='eng' dir='ltr'>(AF114812)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 307 297 309 359">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 307 297 309 359">
+     <span class='ocr_line' id='line_1_32' title="bbox 307 297 309 359; baseline 0 118"><span class='ocrx_word' id='word_1_82' title='bbox 307 297 309 359; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 307 358 337 359">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 307 358 337 359">
+     <span class='ocr_line' id='line_1_33' title="bbox 307 358 337 359; baseline 0 118"><span class='ocrx_word' id='word_1_83' title='bbox 307 358 337 359; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 335 337 337 380">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 335 337 337 380">
+     <span class='ocr_line' id='line_1_34' title="bbox 335 337 337 380; baseline 0 97"><span class='ocrx_word' id='word_1_84' title='bbox 335 337 337 380; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 485 367 1142 393">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 485 367 1142 393">
+     <span class='ocr_line' id='line_1_35' title="bbox 485 367 1142 393; baseline 0 -5"><span class='ocrx_word' id='word_1_85' title='bbox 485 369 640 389; x_wconf 81' lang='eng' dir='ltr'><em>Saccharothrix</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 649 369 807 389; x_wconf 81' lang='eng' dir='ltr'><em>coeruleofusca</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 817 370 885 388; x_wconf 89' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_88' title='bbox 894 367 1000 389; x_wconf 75' lang='eng' dir='ltr'><em>B-16115T</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 1009 370 1142 393; x_wconf 88' lang='eng' dir='ltr'><em>(AF114805)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 204 408 820 434">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 204 408 820 434">
+     <span class='ocr_line' id='line_1_36' title="bbox 204 408 820 434; baseline -0.002 -5"><span class='ocrx_word' id='word_1_90' title='bbox 204 410 359 429; x_wconf 78' lang='eng' dir='ltr'><em>Saccharothn&#39;x</em></span> <span class='ocrx_word' id='word_1_91' title='bbox 367 410 484 434; x_wconf 87' lang='eng' dir='ltr'><em>Iongispora</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 494 410 562 428; x_wconf 87' lang='eng' dir='ltr'>NRRL</span> <span class='ocrx_word' id='word_1_93' title='bbox 572 408 677 429; x_wconf 89' lang='eng' dir='ltr'><em>B-16116T</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 686 410 736 434; x_wconf 86' lang='eng' dir='ltr'><em>(AF1</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 744 410 820 434; x_wconf 85' lang='eng'><em>14809)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 495 449 1030 475">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 495 449 1030 475">
+     <span class='ocr_line' id='line_1_37' title="bbox 495 449 1030 475; baseline 0 -5"><span class='ocrx_word' id='word_1_96' title='bbox 495 451 670 475; x_wconf 77' lang='eng' dir='ltr'><em>Actinosynnema</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 679 451 748 470; x_wconf 85' lang='eng' dir='ltr'><em>mirum</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 759 451 827 470; x_wconf 88' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 839 449 1030 475; x_wconf 74' lang='eng' dir='ltr'><em>14064T(D85475)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003731-0-002.pbm.png b/examples/ijs.0.003731-0-002.pbm.png
new file mode 100644
index 00000000..d4a894c5
Binary files /dev/null and b/examples/ijs.0.003731-0-002.pbm.png differ
diff --git a/examples/ijs.0.003731-0-002.pbm.png.hocr b/examples/ijs.0.003731-0-002.pbm.png.hocr
new file mode 100644
index 00000000..fc91e8b6
--- /dev/null
+++ b/examples/ijs.0.003731-0-002.pbm.png.hocr
@@ -0,0 +1,194 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003731-0-002.pbm.png"; bbox 0 0 1612 746; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 23 4 1297 47">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 23 4 1297 47">
+     <span class='ocr_line' id='line_1_1' title="bbox 23 4 1297 47; baseline -0.002 -10"><span class='ocrx_word' id='word_1_1' title='bbox 23 16 158 47; x_wconf 76' lang='eng' dir='ltr'><em>Bootstrap</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 169 16 252 40; x_wconf 78' lang='eng' dir='ltr'><em>va|ue;</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 577 8 787 35; x_wconf 81' lang='eng' dir='ltr'><em>Methanofollis</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 799 8 985 35; x_wconf 87' lang='eng' dir='ltr'><em>formosanus</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 996 4 1097 36; x_wconf 88' lang='eng' dir='ltr'><em>ML15T</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 1109 8 1297 42; x_wconf 88' lang='eng' dir='ltr'><em>(AY186542)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 446 44 451 174">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 446 44 451 174">
+     <span class='ocr_line' id='line_1_2' title="bbox 446 44 451 174; baseline 0 572"><span class='ocrx_word' id='word_1_7' title='bbox 446 44 451 174; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 448 44 450 174">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 448 44 450 174">
+     <span class='ocr_line' id='line_1_3' title="bbox 448 44 450 174; baseline 0 572"><span class='ocrx_word' id='word_1_8' title='bbox 448 44 450 174; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 115 47 1379 197">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 115 47 1379 197">
+     <span class='ocr_line' id='line_1_4' title="bbox 115 47 1379 91; baseline 0.001 -13"><span class='ocrx_word' id='word_1_9' title='bbox 115 72 135 91; x_wconf 71' lang='eng'><strong><em>.</em></strong></span> <span class='ocrx_word' id='word_1_10' title='bbox 164 67 217 91; x_wconf 73' lang='eng'><em>&gt;90</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 228 67 254 91; x_wconf 73' lang='eng'>%</span> <span class='ocrx_word' id='word_1_12' title='bbox 603 51 813 78; x_wconf 83' lang='eng' dir='ltr'><em>Methanofollis</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 824 51 1011 85; x_wconf 86' lang='eng' dir='ltr'><em>aquaemaris</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 1022 47 1181 79; x_wconf 81' lang='eng' dir='ltr'><em>N2F9704T</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1193 51 1379 85; x_wconf 84' lang='eng' dir='ltr'><em>(AF262035)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 183 92 1350 148; baseline 0.001 -25"><span class='ocrx_word' id='word_1_16' title='bbox 183 124 217 148; x_wconf 75' lang='eng'><em>70</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 228 124 249 148; x_wconf 42' lang='eng' dir='ltr'><em>(y</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 450 109 560 111; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_19' title='bbox 580 96 811 124; x_wconf 87' lang='eng' dir='ltr'><em>Methanofollis</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 822 96 1020 124; x_wconf 89' lang='eng' dir='ltr'><em>ethanolicus</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1031 92 1145 124; x_wconf 89' lang='eng' dir='ltr'><em>HASUT</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 1156 96 1350 130; x_wconf 88' lang='eng' dir='ltr'><em>(AB371073)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 115 127 1257 197; baseline 0 -30"><span class='ocrx_word' id='word_1_23' title='bbox 115 127 135 147; x_wconf 79' lang='eng' dir='ltr'>O</span> <span class='ocrx_word' id='word_1_24' title='bbox 164 132 180 147; x_wconf 77' lang='eng'>&gt;</span> <span class='ocrx_word' id='word_1_25' title='bbox 243 136 254 147; x_wconf 90' lang='eng'>°</span> <span class='ocrx_word' id='word_1_26' title='bbox 537 152 560 197; x_wconf 61' lang='eng' dir='ltr'>E</span> <span class='ocrx_word' id='word_1_27' title='bbox 577 140 787 168; x_wconf 86' lang='eng' dir='ltr'><em>MethanofoI/is</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 798 141 959 168; x_wconf 86' lang='eng' dir='ltr'><em>Iiminatans</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 970 136 1101 168; x_wconf 89' lang='eng' dir='ltr'><em>GKZPZT</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1114 140 1257 175; x_wconf 87' lang='eng' dir='ltr'><em>(Y16428)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 652 177 1422 258">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 652 177 1422 258">
+     <span class='ocr_line' id='line_1_7' title="bbox 652 177 1319 215; baseline 0 -8"><span class='ocrx_word' id='word_1_31' title='bbox 652 180 863 208; x_wconf 86' lang='eng' dir='ltr'><em>Methanofollis</em></span> <span class='ocrx_word' id='word_1_32' title='bbox 875 181 987 208; x_wconf 80' lang='eng' dir='ltr'><em>tationis</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 997 180 1077 208; x_wconf 89' lang='eng' dir='ltr'><em>Chile</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1090 177 1121 208; x_wconf 90' lang='eng' dir='ltr'><em>9T</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1134 180 1319 215; x_wconf 89' lang='eng' dir='ltr'><em>(AF095272)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 691 220 1422 258; baseline 0 -7"><span class='ocrx_word' id='word_1_36' title='bbox 691 224 941 251; x_wconf 84' lang='eng' dir='ltr'><em>Methanoculleus</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 952 224 1127 258; x_wconf 88' lang='eng' dir='ltr'><em>bourgensis</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1139 220 1223 251; x_wconf 82' lang='eng' dir='ltr'><em>M82T</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1235 223 1422 257; x_wconf 89' lang='eng' dir='ltr'><em>(AF095269)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 357 87 359 239">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 357 87 359 239">
+     <span class='ocr_line' id='line_1_9' title="bbox 357 87 359 239; baseline 0 507"><span class='ocrx_word' id='word_1_40' title='bbox 357 87 359 239; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 312 268 351 270">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 312 268 351 270">
+     <span class='ocr_line' id='line_1_10' title="bbox 312 268 351 270; baseline 0 476"><span class='ocrx_word' id='word_1_41' title='bbox 312 268 351 270; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 487 280 620 282">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 487 280 620 282">
+     <span class='ocr_line' id='line_1_11' title="bbox 487 280 620 282; baseline 0 464"><span class='ocrx_word' id='word_1_42' title='bbox 487 280 620 282; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 468 300 487 302">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 468 300 487 302">
+     <span class='ocr_line' id='line_1_12' title="bbox 468 300 487 302; baseline 0 444"><span class='ocrx_word' id='word_1_43' title='bbox 468 300 487 302; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 485 280 487 325">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 485 280 487 325">
+     <span class='ocr_line' id='line_1_13' title="bbox 485 280 487 325; baseline 0 421"><span class='ocrx_word' id='word_1_44' title='bbox 485 280 487 325; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 349 158 351 372">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 349 158 351 372">
+     <span class='ocr_line' id='line_1_14' title="bbox 349 158 351 372; baseline 0 374"><span class='ocrx_word' id='word_1_45' title='bbox 349 158 351 372; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 468 301 470 367">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 468 301 470 367">
+     <span class='ocr_line' id='line_1_15' title="bbox 468 301 470 367; baseline 0 379"><span class='ocrx_word' id='word_1_46' title='bbox 468 301 470 367; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 284 367 431 372">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 284 367 431 372">
+     <span class='ocr_line' id='line_1_16' title="bbox 284 367 431 372; baseline 0 374"><span class='ocrx_word' id='word_1_47' title='bbox 284 367 431 372; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 440 331 442 410">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 440 331 442 410">
+     <span class='ocr_line' id='line_1_17' title="bbox 440 331 442 410; baseline 0 336"><span class='ocrx_word' id='word_1_48' title='bbox 440 331 442 410; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 312 269 314 472">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 312 269 314 472">
+     <span class='ocr_line' id='line_1_18' title="bbox 312 269 314 472; baseline 0 274"><span class='ocrx_word' id='word_1_49' title='bbox 312 269 314 472; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 1 262 1610 513">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 2 262 1610 513">
+     <span class='ocr_line' id='line_1_19' title="bbox 630 262 1279 300; baseline 0 -8"><span class='ocrx_word' id='word_1_50' title='bbox 630 266 857 292; x_wconf 87' lang='eng' dir='ltr'><em>Methanolacinia</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 864 267 985 300; x_wconf 89' lang='eng' dir='ltr'><em>paynteri</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 994 262 1101 292; x_wconf 80' lang='eng' dir='ltr'><em>62000T</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1111 266 1279 296; x_wconf 87' lang='eng' dir='ltr'><em>(AY196678)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 442 302 1357 340; baseline -0.001 -7"><span class='ocrx_word' id='word_1_54' title='bbox 442 331 461 333; x_wconf 97' lang='eng'>_</span> <span class='ocrx_word' id='word_1_55' title='bbox 487 323 688 325; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_56' title='bbox 704 306 1008 333; x_wconf 87' lang='eng' dir='ltr'><em>Methanomicrobium</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 1020 306 1125 333; x_wconf 87' lang='eng' dir='ltr'><em>mobile</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 1136 302 1194 332; x_wconf 92' lang='eng' dir='ltr'><em>BPT</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 1207 306 1357 340; x_wconf 89' lang='eng' dir='ltr'><em>(M59142)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 2 348 1244 392; baseline -0.002 -12"><span class='ocrx_word' id='word_1_60' title='bbox 2 367 19 387; x_wconf 83' lang='eng' dir='ltr'>N</span> <span class='ocrx_word' id='word_1_61' title='bbox 21 367 41 392; x_wconf 42' lang='eng' dir='ltr'><em>J‘</em></span> <span class='ocrx_word' id='word_1_62' title='bbox 54 367 98 388; x_wconf 68' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_63' title='bbox 109 367 138 391; x_wconf 56' lang='eng'><strong>%;</strong></span> <span class='ocrx_word' id='word_1_64' title='bbox 151 367 194 391; x_wconf 41' lang='eng' dir='ltr'><em>MP,</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 431 361 450 380; x_wconf 70' lang='eng'><strong>0</strong></span> <span class='ocrx_word' id='word_1_66' title='bbox 470 365 620 367; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_67' title='bbox 635 351 879 385; x_wconf 89' lang='eng' dir='ltr'><em>Methanoplanus</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 891 351 1009 378; x_wconf 86' lang='eng' dir='ltr'><em>Iimicola</em></span> <span class='ocrx_word' id='word_1_69' title='bbox 1021 348 1082 378; x_wconf 83' lang='eng' dir='ltr'><em>M3T</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 1094 351 1244 385; x_wconf 88' lang='eng' dir='ltr'><em>(M59143)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 3 389 1316 427; baseline -0.003 -4"><span class='ocrx_word' id='word_1_71' title='bbox 3 402 47 423; x_wconf 89' lang='eng'>100</span> <span class='ocrx_word' id='word_1_72' title='bbox 57 402 88 423; x_wconf 81' lang='eng'><em>%-</em></span> <span class='ocrx_word' id='word_1_73' title='bbox 100 402 137 422; x_wconf 93' lang='eng' dir='ltr'><em>ML</em></span> <span class='ocrx_word' id='word_1_74' title='bbox 155 402 202 423; x_wconf 89' lang='eng'><em>&lt;50</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 211 402 235 423; x_wconf 80' lang='eng'>%</span> <span class='ocrx_word' id='word_1_76' title='bbox 442 408 583 410; x_wconf 92' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_77' title='bbox 597 393 853 427; x_wconf 82' lang='eng' dir='ltr'><em>Methanogenium</em></span> <span class='ocrx_word' id='word_1_78' title='bbox 866 393 1082 427; x_wconf 87' lang='eng' dir='ltr'><em>organophilum</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 1092 389 1154 420; x_wconf 94' lang='eng' dir='ltr'><em>CVT</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 1166 393 1316 427; x_wconf 90' lang='eng' dir='ltr'><em>(M59131)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 225 432 1545 503; baseline 0 -41"><span class='ocrx_word' id='word_1_81' title='bbox 225 436 247 503; x_wconf 68' lang='eng'>:</span> <span class='ocrx_word' id='word_1_82' title='bbox 662 436 932 462; x_wconf 84' lang='eng' dir='ltr'><em>Methanocalculus</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 942 436 1137 462; x_wconf 84' lang='eng' dir='ltr'><em>halotolerans</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 1148 435 1242 462; x_wconf 84' lang='eng' dir='ltr'>SEBR</span> <span class='ocrx_word' id='word_1_85' title='bbox 1255 432 1348 462; x_wconf 91' lang='eng' dir='ltr'><em>4845T</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 1360 436 1545 470; x_wconf 87' lang='eng' dir='ltr'><em>(AF033672)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 909 475 1610 513; baseline 0 -8"><span class='ocrx_word' id='word_1_87' title='bbox 909 479 1251 513; x_wconf 85' lang='eng' dir='ltr'><em>Methanocorpusculum</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 1261 485 1382 513; x_wconf 88' lang='eng' dir='ltr'><em>parvum</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 1392 475 1448 505; x_wconf 94' lang='eng' dir='ltr'><em>XIIT</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 1460 478 1610 513; x_wconf 89' lang='eng' dir='ltr'><em>(M59147)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 357 522 1388 680">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 357 522 1388 680">
+     <span class='ocr_line' id='line_1_25' title="bbox 357 522 1286 556; baseline 0.001 -7"><span class='ocrx_word' id='word_1_91' title='bbox 357 535 509 537; x_wconf 91' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_92' title='bbox 518 523 819 556; x_wconf 86' lang='eng' dir='ltr'><em>‘Methanosphaeru/a</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 830 523 972 556; x_wconf 86' lang='eng' dir='ltr'><em>palustris’</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 993 523 1027 549; x_wconf 96' lang='eng' dir='ltr'>E1</span> <span class='ocrx_word' id='word_1_95' title='bbox 1036 524 1084 550; x_wconf 81' lang='eng'>-90</span> <span class='ocrx_word' id='word_1_96' title='bbox 1097 522 1286 556; x_wconf 87' lang='eng' dir='ltr'>(EU156000)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_26' title="bbox 357 561 1148 598; baseline 0 -8"><span class='ocrx_word' id='word_1_97' title='bbox 357 577 481 579; x_wconf 93' lang='eng'><strong>—</strong></span> <span class='ocrx_word' id='word_1_98' title='bbox 498 564 712 590; x_wconf 83' lang='eng' dir='ltr'><em>Methanolinea</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 725 564 804 590; x_wconf 84' lang='eng' dir='ltr'><em>tarda</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 817 561 947 591; x_wconf 93' lang='eng' dir='ltr'><em>NOBI-1T</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 959 564 1148 598; x_wconf 89' lang='eng' dir='ltr'><em>(AB162774)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_27' title="bbox 543 602 1388 637; baseline -0.001 -7"><span class='ocrx_word' id='word_1_102' title='bbox 543 602 732 630; x_wconf 86' lang='eng' dir='ltr'><em>‘Candidatus</em></span> <span class='ocrx_word' id='word_1_103' title='bbox 743 603 981 637; x_wconf 87' lang='eng' dir='ltr'><em>Methanoregula</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 992 603 1106 630; x_wconf 88' lang='eng' dir='ltr'><em>boonei’</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 1118 603 1179 630; x_wconf 91' lang='eng' dir='ltr'><em>6A8</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 1193 602 1388 636; x_wconf 79' lang='eng' dir='ltr'><em>(D0282124)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_28' title="bbox 643 641 1318 680; baseline 0 -8"><span class='ocrx_word' id='word_1_107' title='bbox 643 645 914 679; x_wconf 82' lang='eng' dir='ltr'><em>Methanospirillum</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 925 645 1064 680; x_wconf 80' lang='eng' dir='ltr'><em>hungatei</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 1071 645 1136 672; x_wconf 91' lang='eng' dir='ltr'><em>JF-1</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 1144 641 1156 657; x_wconf 74' lang='eng' dir='ltr'><strong>T</strong></span> <span class='ocrx_word' id='word_1_111' title='bbox 1168 645 1318 679; x_wconf 89' lang='eng' dir='ltr'><em>(M60880)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 330 555 357 556">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 330 555 357 556">
+     <span class='ocr_line' id='line_1_29' title="bbox 330 555 357 556; baseline 0 190"><span class='ocrx_word' id='word_1_112' title='bbox 330 555 357 556; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 355 535 357 579">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 355 535 357 579">
+     <span class='ocr_line' id='line_1_30' title="bbox 355 535 357 579; baseline 0 167"><span class='ocrx_word' id='word_1_113' title='bbox 355 535 357 579; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 301 590 331 592">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 301 590 331 592">
+     <span class='ocr_line' id='line_1_31' title="bbox 301 590 331 592; baseline 0 154"><span class='ocrx_word' id='word_1_114' title='bbox 301 590 331 592; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 284 367 286 631">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 284 367 286 631">
+     <span class='ocr_line' id='line_1_32' title="bbox 284 367 286 631; baseline 0 115"><span class='ocrx_word' id='word_1_115' title='bbox 284 367 286 631; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 330 555 331 623">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 330 555 331 623">
+     <span class='ocr_line' id='line_1_33' title="bbox 330 555 331 623; baseline 0 123"><span class='ocrx_word' id='word_1_116' title='bbox 330 555 331 623; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 284 629 303 631">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 284 629 303 631">
+     <span class='ocr_line' id='line_1_34' title="bbox 284 629 303 631; baseline 0 115"><span class='ocrx_word' id='word_1_117' title='bbox 284 629 303 631; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 301 590 303 662">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 301 590 303 662">
+     <span class='ocr_line' id='line_1_35' title="bbox 301 590 303 662; baseline 0 84"><span class='ocrx_word' id='word_1_118' title='bbox 301 590 303 662; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 347 709 415 735">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 347 709 415 735">
+     <span class='ocr_line' id='line_1_36' title="bbox 347 709 415 735; baseline 0.015 -1"><span class='ocrx_word' id='word_1_119' title='bbox 347 709 415 735; x_wconf 92' lang='eng'>0.10</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 112 740 652 741">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 112 740 652 741">
+     <span class='ocr_line' id='line_1_37' title="bbox 112 740 652 741; baseline 0 5"><span class='ocrx_word' id='word_1_120' title='bbox 112 740 652 741; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003749-0-000.pbm.png b/examples/ijs.0.003749-0-000.pbm.png
new file mode 100644
index 00000000..cc611c95
Binary files /dev/null and b/examples/ijs.0.003749-0-000.pbm.png differ
diff --git a/examples/ijs.0.003749-0-000.pbm.png.hocr b/examples/ijs.0.003749-0-000.pbm.png.hocr
new file mode 100644
index 00000000..b41503b0
--- /dev/null
+++ b/examples/ijs.0.003749-0-000.pbm.png.hocr
@@ -0,0 +1,202 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003749-0-000.pbm.png"; bbox 0 0 1243 557; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 72 3 113 20">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 72 3 113 20">
+     <span class='ocr_line' id='line_1_1' title="bbox 72 3 113 20; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 72 3 113 20; x_wconf 85' lang='eng'><em>002</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 347 233 366 246">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 347 233 366 246">
+     <span class='ocr_line' id='line_1_2' title="bbox 347 233 366 246; baseline 0 0"><span class='ocrx_word' id='word_1_2' title='bbox 347 233 366 246; x_wconf 68' lang='eng'><strong>47</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 560 15 1078 186">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 560 15 1078 186">
+     <span class='ocr_line' id='line_1_3' title="bbox 594 15 1063 38; baseline 0 -4"><span class='ocrx_word' id='word_1_3' title='bbox 594 24 613 38; x_wconf 78' lang='eng'><em>59</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 623 25 651 27; x_wconf 97' lang='eng'>—</span> <span class='ocrx_word' id='word_1_5' title='bbox 658 17 677 34; x_wconf 59' lang='eng' dir='ltr'><em>A,</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 687 17 819 38; x_wconf 78' lang='eng' dir='ltr'><em>cryaerophi/us</em></span> <span class='ocrx_word' id='word_1_7' title='bbox 826 17 889 34; x_wconf 88' lang='eng' dir='ltr'><em>CCUG</em></span> <span class='ocrx_word' id='word_1_8' title='bbox 900 15 968 34; x_wconf 78' lang='eng' dir='ltr'><em>17801T</em></span> <span class='ocrx_word' id='word_1_9' title='bbox 976 17 1063 38; x_wconf 83' lang='eng' dir='ltr'><em>(L14624)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 578 54 1078 78; baseline 0 -5"><span class='ocrx_word' id='word_1_10' title='bbox 578 54 597 68; x_wconf 83' lang='eng'><em>75</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 623 65 644 67; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_12' title='bbox 651 57 670 73; x_wconf 90' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 680 57 812 78; x_wconf 83' lang='eng' dir='ltr'><em>cryaerophilus</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 819 57 883 73; x_wconf 90' lang='eng' dir='ltr'><em>CCUG</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 893 57 951 73; x_wconf 87' lang='eng'><em>17802</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 960 57 1078 78; x_wconf 86' lang='eng' dir='ltr'><em>(AY314755)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 560 94 1027 118; baseline 0 -5"><span class='ocrx_word' id='word_1_17' title='bbox 560 99 579 113; x_wconf 83' lang='eng'><em>99</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 606 105 667 107; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_19' title='bbox 674 97 693 113; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 703 96 854 113; x_wconf 83' lang='eng' dir='ltr'><em>skirrowiiCCUG</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 864 94 932 113; x_wconf 79' lang='eng' dir='ltr'><em>10374T</em></span> <span class='ocrx_word' id='word_1_22' title='bbox 940 96 1027 118; x_wconf 85' lang='eng' dir='ltr'><em>(L14625)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_6' title="bbox 588 134 1005 186; baseline 0 -33"><span class='ocrx_word' id='word_1_23' title='bbox 588 144 639 186; x_wconf 49' lang='eng'><em>_{</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 646 136 665 153; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 675 136 751 153; x_wconf 81' lang='eng' dir='ltr'><em>cibarius</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 759 136 804 153; x_wconf 88' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_27' title='bbox 813 134 883 153; x_wconf 80' lang='eng' dir='ltr'><em>21996T</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 891 136 1005 157; x_wconf 84' lang='eng' dir='ltr'><em>(AJ607391)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 604 45 623 47">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 604 45 623 47">
+     <span class='ocr_line' id='line_1_7' title="bbox 604 45 623 47; baseline 0 510"><span class='ocrx_word' id='word_1_29' title='bbox 604 45 623 47; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 621 25 623 67">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 621 25 623 67">
+     <span class='ocr_line' id='line_1_8' title="bbox 621 25 623 67; baseline 0 490"><span class='ocrx_word' id='word_1_30' title='bbox 621 25 623 67; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 586 75 606 77">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 586 75 606 77">
+     <span class='ocr_line' id='line_1_9' title="bbox 586 75 606 77; baseline 0 480"><span class='ocrx_word' id='word_1_31' title='bbox 586 75 606 77; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 604 45 606 107">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 604 45 606 107">
+     <span class='ocr_line' id='line_1_10' title="bbox 604 45 606 107; baseline 0 450"><span class='ocrx_word' id='word_1_32' title='bbox 604 45 606 107; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 525 120 588 121">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 525 120 588 121">
+     <span class='ocr_line' id='line_1_11' title="bbox 525 120 588 121; baseline 0 436"><span class='ocrx_word' id='word_1_33' title='bbox 525 120 588 121; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 586 75 588 166">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 586 75 588 166">
+     <span class='ocr_line' id='line_1_12' title="bbox 586 75 588 166; baseline 0 391"><span class='ocrx_word' id='word_1_34' title='bbox 586 75 588 166; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 490 162 518 175">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 490 162 518 175">
+     <span class='ocr_line' id='line_1_13' title="bbox 490 162 518 175; baseline 0 0"><span class='ocrx_word' id='word_1_35' title='bbox 490 162 518 175; x_wconf 82' lang='eng'><em>100</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 374 182 526 184">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 374 182 526 184">
+     <span class='ocr_line' id='line_1_14' title="bbox 374 182 526 184; baseline 0 373"><span class='ocrx_word' id='word_1_36' title='bbox 374 182 526 184; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 336 254 375 256">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 336 254 375 256">
+     <span class='ocr_line' id='line_1_15' title="bbox 336 254 375 256; baseline 0 301"><span class='ocrx_word' id='word_1_37' title='bbox 336 254 375 256; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 3 335 337 337">
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 3 335 337 337">
+     <span class='ocr_line' id='line_1_16' title="bbox 3 335 337 337; baseline 0 220"><span class='ocrx_word' id='word_1_38' title='bbox 3 335 337 337; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 3 335 4 544">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 3 335 4 544">
+     <span class='ocr_line' id='line_1_17' title="bbox 3 335 4 544; baseline 0 13"><span class='ocrx_word' id='word_1_39' title='bbox 3 335 4 544; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 336 254 337 420">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 336 254 337 420">
+     <span class='ocr_line' id='line_1_18' title="bbox 336 254 337 420; baseline 0 137"><span class='ocrx_word' id='word_1_40' title='bbox 336 254 337 420; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 374 183 375 325">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 374 183 375 325">
+     <span class='ocr_line' id='line_1_19' title="bbox 374 183 375 325; baseline 0 232"><span class='ocrx_word' id='word_1_41' title='bbox 374 183 375 325; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 526 176 999 317">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 576 176 999 317">
+     <span class='ocr_line' id='line_1_20' title="bbox 599 176 994 197; baseline 0.003 -5"><span class='ocrx_word' id='word_1_42' title='bbox 599 177 627 190; x_wconf 90' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 645 176 664 192; x_wconf 93' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 674 176 749 193; x_wconf 81' lang='eng' dir='ltr'><em>ciban&#39;us</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 757 176 803 193; x_wconf 92' lang='eng' dir='ltr'><em>LMG</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 811 176 872 193; x_wconf 82' lang='eng'><strong>21997</strong></span> <span class='ocrx_word' id='word_1_47' title='bbox 880 176 994 197; x_wconf 79' lang='eng' dir='ltr'><em>(AJ607392)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 611 216 999 245; baseline 0 -13"><span class='ocrx_word' id='word_1_48' title='bbox 611 224 623 245; x_wconf 78' lang='eng' dir='ltr'><strong>I—</strong></span> <span class='ocrx_word' id='word_1_49' title='bbox 630 216 649 232; x_wconf 90' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 658 216 731 232; x_wconf 73' lang='eng' dir='ltr'><em>butzleri</em></span> <span class='ocrx_word' id='word_1_51' title='bbox 737 216 800 232; x_wconf 85' lang='eng' dir='ltr'><em>CCUG</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 809 216 869 232; x_wconf 81' lang='eng'><em>34397</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 878 216 999 237; x_wconf 85' lang='eng' dir='ltr'><em>(DQ464343)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_22' title="bbox 576 246 997 277; baseline 0.005 -7"><span class='ocrx_word' id='word_1_54' title='bbox 576 256 604 270; x_wconf 89' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 611 246 621 266; x_wconf 83' lang='eng' dir='ltr'>L</span> <span class='ocrx_word' id='word_1_56' title='bbox 628 256 647 272; x_wconf 90' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_57' title='bbox 657 256 729 272; x_wconf 78' lang='eng' dir='ltr'><em>butzleri</em></span> <span class='ocrx_word' id='word_1_58' title='bbox 734 255 794 272; x_wconf 86' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_59' title='bbox 801 256 847 272; x_wconf 84' lang='eng'><em>4961</em></span> <span class='ocrx_word' id='word_1_60' title='bbox 852 253 873 272; x_wconf 61' lang='eng' dir='ltr'><em>ST</em></span> <span class='ocrx_word' id='word_1_61' title='bbox 880 255 950 277; x_wconf 81' lang='eng' dir='ltr'>(AY621</span> <span class='ocrx_word' id='word_1_62' title='bbox 956 256 962 272; x_wconf 87' lang='eng'>1</span> <span class='ocrx_word' id='word_1_63' title='bbox 968 256 974 272; x_wconf 88' lang='eng'>1</span> <span class='ocrx_word' id='word_1_64' title='bbox 979 255 997 277; x_wconf 84' lang='eng'><em>6)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_23' title="bbox 580 293 982 317; baseline 0 -5"><span class='ocrx_word' id='word_1_65' title='bbox 580 304 609 306; x_wconf 98' lang='eng'>—</span> <span class='ocrx_word' id='word_1_66' title='bbox 616 295 635 312; x_wconf 85' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_67' title='bbox 645 295 737 317; x_wconf 72' lang='eng' dir='ltr'><em>nitmﬁgilis</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 745 295 808 312; x_wconf 86' lang='eng' dir='ltr'>CCUG</span> <span class='ocrx_word' id='word_1_69' title='bbox 818 293 887 312; x_wconf 43' lang='eng' dir='ltr'><em>15893.r</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 895 295 982 317; x_wconf 84' lang='eng' dir='ltr'><em>(L14627)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 525 120 526 245">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 525 120 526 245">
+     <span class='ocr_line' id='line_1_24' title="bbox 525 120 526 245; baseline 0 312"><span class='ocrx_word' id='word_1_71' title='bbox 525 120 526 245; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 374 324 580 326">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 374 324 580 326">
+     <span class='ocr_line' id='line_1_25' title="bbox 374 324 580 326; baseline 0 231"><span class='ocrx_word' id='word_1_72' title='bbox 374 324 580 326; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 336 418 397 420">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 336 418 397 420">
+     <span class='ocr_line' id='line_1_26' title="bbox 336 418 397 420; baseline 0 137"><span class='ocrx_word' id='word_1_73' title='bbox 336 418 397 420; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 369 430 388 444">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 369 430 388 444">
+     <span class='ocr_line' id='line_1_27' title="bbox 369 430 388 444; baseline 0 0"><span class='ocrx_word' id='word_1_74' title='bbox 369 430 388 444; x_wconf 86' lang='eng'><em>72</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 395 384 397 455">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 395 384 397 455">
+     <span class='ocr_line' id='line_1_28' title="bbox 395 384 397 455; baseline 0 102"><span class='ocrx_word' id='word_1_75' title='bbox 395 384 397 455; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 543 335 994 436">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 543 335 994 436">
+     <span class='ocr_line' id='line_1_29' title="bbox 543 335 965 356; baseline 0.007 -7"><span class='ocrx_word' id='word_1_76' title='bbox 543 336 571 350; x_wconf 86' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 580 344 641 346; x_wconf 96' lang='eng'>—</span> <span class='ocrx_word' id='word_1_78' title='bbox 648 335 667 352; x_wconf 90' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_79' title='bbox 676 335 769 356; x_wconf 71' lang='eng' dir='ltr'><em>nitroﬁgilis</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 777 335 838 352; x_wconf 84' lang='eng' dir='ltr'><em>F2173</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 846 335 965 356; x_wconf 84' lang='eng' dir='ltr'><em>(EU106661)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 660 373 994 396; baseline 0.003 -5"><span class='ocrx_word' id='word_1_82' title='bbox 660 375 679 391; x_wconf 92' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_83' title='bbox 688 375 788 396; x_wconf 82' lang='eng' dir='ltr'><em>halophilus</em></span> <span class='ocrx_word' id='word_1_84' title='bbox 796 373 870 392; x_wconf 79' lang='eng' dir='ltr'><em>LA31BT</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 878 375 994 396; x_wconf 87' lang='eng' dir='ltr'><em>(AF513455)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 587 415 853 436; baseline 0.004 -5"><span class='ocrx_word' id='word_1_86' title='bbox 587 415 608 431; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 616 415 676 436; x_wconf 80' lang='eng' dir='ltr'><em>mytili</em></span> <span class='ocrx_word' id='word_1_88' title='bbox 681 415 731 432; x_wconf 84' lang='eng' dir='ltr'><em>T234</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 739 415 853 436; x_wconf 84' lang='eng' dir='ltr'><em>(FJ156092)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 395 453 580 455">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 395 453 580 455">
+     <span class='ocr_line' id='line_1_32' title="bbox 395 453 580 455; baseline 0 102"><span class='ocrx_word' id='word_1_90' title='bbox 395 453 580 455; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 578 304 580 484">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 578 304 580 484">
+     <span class='ocr_line' id='line_1_33' title="bbox 578 304 580 484; baseline 0 73"><span class='ocrx_word' id='word_1_91' title='bbox 578 304 580 484; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 542 453 884 516">
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 542 453 884 516">
+     <span class='ocr_line' id='line_1_34' title="bbox 542 453 884 479; baseline 0 -8"><span class='ocrx_word' id='word_1_92' title='bbox 542 465 571 479; x_wconf 62' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_93' title='bbox 592 455 612 471; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 622 455 680 476; x_wconf 82' lang='eng' dir='ltr'><em>mytili</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 687 453 758 471; x_wconf 67' lang='eng' dir='ltr'><em>F2075Y</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 765 455 884 476; x_wconf 69' lang='eng' dir='ltr'><em>(eusegsm)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 560 494 880 516; baseline 0.006 -7"><span class='ocrx_word' id='word_1_97' title='bbox 560 495 579 509; x_wconf 76' lang='eng'><em>58</em></span> <span class='ocrx_word' id='word_1_98' title='bbox 597 495 617 511; x_wconf 91' lang='eng' dir='ltr'><em>A.</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 627 495 685 515; x_wconf 79' lang='eng' dir='ltr'><em>mytili</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 692 494 753 511; x_wconf 79' lang='eng' dir='ltr'><em>F2026</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 761 494 880 516; x_wconf 85' lang='eng' dir='ltr'><em>(EU669906)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 3 542 667 544">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 3 542 667 544">
+     <span class='ocr_line' id='line_1_36' title="bbox 3 542 667 544; baseline 0 13"><span class='ocrx_word' id='word_1_102' title='bbox 3 542 667 544; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 677 532 1240 555">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 677 532 1240 555">
+     <span class='ocr_line' id='line_1_37' title="bbox 677 532 1240 555; baseline -0.002 -4"><span class='ocrx_word' id='word_1_103' title='bbox 677 534 827 555; x_wconf 81' lang='eng' dir='ltr'><em>Campy/abacter</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 833 534 880 551; x_wconf 83' lang='eng' dir='ltr'><em>fetus</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 887 534 945 555; x_wconf 80' lang='eng' dir='ltr'>subsp</span> <span class='ocrx_word' id='word_1_106' title='bbox 954 534 1001 551; x_wconf 78' lang='eng' dir='ltr'><em>fetus</em></span> <span class='ocrx_word' id='word_1_107' title='bbox 1008 534 1067 551; x_wconf 87' lang='eng' dir='ltr'><em>ATCC</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 1075 532 1146 551; x_wconf 76' lang='eng' dir='ltr'><em>27374T</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 1154 534 1240 555; x_wconf 73' lang='eng' dir='ltr'><em>(L04314)</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003814-0-002.pbm.png b/examples/ijs.0.003814-0-002.pbm.png
new file mode 100644
index 00000000..f5a75b8a
Binary files /dev/null and b/examples/ijs.0.003814-0-002.pbm.png differ
diff --git a/examples/ijs.0.003814-0-002.pbm.png.hocr b/examples/ijs.0.003814-0-002.pbm.png.hocr
new file mode 100644
index 00000000..ef8b7d62
--- /dev/null
+++ b/examples/ijs.0.003814-0-002.pbm.png.hocr
@@ -0,0 +1,290 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003814-0-002.pbm.png"; bbox 0 0 1479 1135; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 250 38 273 52">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 250 38 273 52">
+     <span class='ocr_line' id='line_1_1' title="bbox 250 38 273 52; baseline 0 0"><span class='ocrx_word' id='word_1_1' title='bbox 250 38 273 52; x_wconf 86' lang='eng'>0.1</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 599 5 1251 107">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 599 6 1251 106">
+     <span class='ocr_line' id='line_1_2' title="bbox 627 6 1140 31; baseline 0 -6"><span class='ocrx_word' id='word_1_2' title='bbox 627 14 656 16; x_wconf 95' lang='eng'>—</span> <span class='ocrx_word' id='word_1_3' title='bbox 666 6 812 31; x_wconf 83' lang='eng' dir='ltr'><em>Archangium</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 821 6 918 31; x_wconf 81' lang='eng' dir='ltr'><em>gephyra</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 927 6 955 25; x_wconf 88' lang='eng' dir='ltr'><em>Ar</em></span> <span class='ocrx_word' id='word_1_6' title='bbox 963 6 987 31; x_wconf 77' lang='eng'>91</span> <span class='ocrx_word' id='word_1_7' title='bbox 1002 6 1140 31; x_wconf 83' lang='eng' dir='ltr'><em>(AJ233912)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_3' title="bbox 599 38 1251 92; baseline 0 -29"><span class='ocrx_word' id='word_1_8' title='bbox 599 38 620 52; x_wconf 70' lang='eng'>77</span> <span class='ocrx_word' id='word_1_9' title='bbox 630 51 703 92; x_wconf 55' lang='eng' dir='ltr'><em>_L—</em></span> <span class='ocrx_word' id='word_1_10' title='bbox 714 43 868 68; x_wconf 77' lang='eng' dir='ltr'><em>Melittangium</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 877 43 1019 63; x_wconf 84' lang='eng' dir='ltr'><em>alboraceum</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1028 43 1064 63; x_wconf 85' lang='eng' dir='ltr'><em>Me</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1074 43 1102 63; x_wconf 92' lang='eng' dir='ltr'><em>b7</em></span> <span class='ocrx_word' id='word_1_14' title='bbox 1112 43 1251 68; x_wconf 87' lang='eng' dir='ltr'><em>(AJ233907)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 644 79 1251 106; baseline 0 -5"><span class='ocrx_word' id='word_1_15' title='bbox 644 79 665 94; x_wconf 85' lang='eng'>7°</span> <span class='ocrx_word' id='word_1_16' title='bbox 698 80 845 106; x_wconf 79' lang='eng' dir='ltr'><em>Cystobacter</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 851 81 931 101; x_wconf 74' lang='eng' dir='ltr'><em>bad/Us</em></span> <span class='ocrx_word' id='word_1_18' title='bbox 941 80 997 101; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_19' title='bbox 1010 80 1094 101; x_wconf 82' lang='eng' dir='ltr'><em>14723T</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1103 80 1251 106; x_wconf 87' lang='eng' dir='ltr'>(DQ768108)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 3 128 628 132">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 3 128 628 132">
+     <span class='ocr_line' id='line_1_5' title="bbox 3 128 628 132; baseline 0 1003"><span class='ocrx_word' id='word_1_21' title='bbox 3 128 628 132; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 0 221 4 1006">
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 0 221 4 1006">
+     <span class='ocr_line' id='line_1_6' title="bbox 0 221 4 1006; baseline 0 129"><span class='ocrx_word' id='word_1_22' title='bbox 0 221 4 1006; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 258 586 279 601">
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 258 586 279 601">
+     <span class='ocr_line' id='line_1_7' title="bbox 258 586 279 601; baseline 0 0"><span class='ocrx_word' id='word_1_23' title='bbox 258 586 279 601; x_wconf 82' lang='eng'><em>98</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 289 442 454 454">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 289 443 454 453">
+     <span class='ocr_line' id='line_1_8' title="bbox 289 443 454 453; baseline 0 682"><span class='ocrx_word' id='word_1_24' title='bbox 289 443 454 453; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_7' title="bbox 323 515 344 531">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 323 516 344 530">
+     <span class='ocr_line' id='line_1_9' title="bbox 323 516 344 530; baseline 0 0"><span class='ocrx_word' id='word_1_25' title='bbox 323 516 344 530; x_wconf 93' lang='eng'><em>74</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_8' title="bbox 303 712 324 727">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 303 712 324 727">
+     <span class='ocr_line' id='line_1_10' title="bbox 303 712 324 727; baseline 0 0"><span class='ocrx_word' id='word_1_26' title='bbox 303 712 324 727; x_wconf 81' lang='eng'><strong>66</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_9' title="bbox 0 951 854 1111">
+    <p class='ocr_par' dir='ltr' id='par_1_9' title="bbox 0 952 854 1110">
+     <span class='ocr_line' id='line_1_11' title="bbox 0 952 854 1110; baseline 0 -27"><span class='ocrx_word' id='word_1_27' title='bbox 0 952 854 1110; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_10' title="bbox 328 500 461 746">
+    <p class='ocr_par' dir='ltr' id='par_1_10' title="bbox 328 500 461 746">
+     <span class='ocr_line' id='line_1_12' title="bbox 328 500 444 572; baseline 0 -15"><span class='ocrx_word' id='word_1_28' title='bbox 328 500 444 572; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 341 572 458 652; baseline 0 -17"><span class='ocrx_word' id='word_1_29' title='bbox 341 572 458 652; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 398 652 447 684; baseline 0 451"><span class='ocrx_word' id='word_1_30' title='bbox 398 652 447 684; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_15' title="bbox 398 684 461 746; baseline 0 0"><span class='ocrx_word' id='word_1_31' title='bbox 398 684 461 746; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_11' title="bbox 325 543 329 864">
+    <p class='ocr_par' dir='ltr' id='par_1_11' title="bbox 325 543 329 864">
+     <span class='ocr_line' id='line_1_16' title="bbox 325 543 329 864; baseline 0 271"><span class='ocrx_word' id='word_1_32' title='bbox 325 543 329 864; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_12' title="bbox 593 117 1329 258">
+    <p class='ocr_par' dir='ltr' id='par_1_12' title="bbox 593 118 1309 167">
+     <span class='ocr_line' id='line_1_17' title="bbox 792 118 1309 144; baseline -0.002 -5"><span class='ocrx_word' id='word_1_33' title='bbox 792 118 926 144; x_wconf 83' lang='eng' dir='ltr'><em>Stigmate/Ia</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 935 119 1009 139; x_wconf 85' lang='eng' dir='ltr'><em>erecta</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1020 118 1082 139; x_wconf 91' lang='eng' dir='ltr'><strong>BICC</strong></span> <span class='ocrx_word' id='word_1_36' title='bbox 1092 118 1151 139; x_wconf 86' lang='eng'><em>8613</em></span> <span class='ocrx_word' id='word_1_37' title='bbox 1161 118 1309 144; x_wconf 87' lang='eng' dir='ltr'><em>(DQ491071)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_18' title="bbox 593 127 764 167; baseline 0 -12"><span class='ocrx_word' id='word_1_38' title='bbox 593 140 623 155; x_wconf 77' lang='eng'><em>100</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 658 127 764 167; x_wconf 72' lang='eng'><em>—|</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_13' title="bbox 734 154 1328 257">
+     <span class='ocr_line' id='line_1_19' title="bbox 734 154 1328 182; baseline 0 -6"><span class='ocrx_word' id='word_1_40' title='bbox 734 154 754 169; x_wconf 79' lang='eng'>97</span> <span class='ocrx_word' id='word_1_41' title='bbox 776 156 909 182; x_wconf 77' lang='eng' dir='ltr'><em>Stigmata/la</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 918 156 1007 182; x_wconf 85' lang='eng' dir='ltr'><em>hybrida</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1017 156 1074 176; x_wconf 86' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_44' title='bbox 1087 156 1171 176; x_wconf 79' lang='eng' dir='ltr'><em>14722T</em></span> <span class='ocrx_word' id='word_1_45' title='bbox 1180 156 1328 181; x_wconf 85' lang='eng' dir='ltr'>(DQ768129)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_20' title="bbox 734 193 1256 219; baseline 0 -5"><span class='ocrx_word' id='word_1_46' title='bbox 734 194 883 219; x_wconf 80' lang='eng' dir='ltr'><em>Myxococcus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 891 194 986 214; x_wconf 80' lang='eng' dir='ltr'><em>xanthus</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 996 193 1053 214; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_49' title='bbox 1063 194 1107 214; x_wconf 84' lang='eng'><em>435</em></span> <span class='ocrx_word' id='word_1_50' title='bbox 1118 194 1256 219; x_wconf 84' lang='eng' dir='ltr'><em>(AJ233929)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_21' title="bbox 762 231 1312 257; baseline 0 -6"><span class='ocrx_word' id='word_1_51' title='bbox 762 231 920 257; x_wconf 82' lang='eng' dir='ltr'><em>Pyxidicoccus</em></span> <span class='ocrx_word' id='word_1_52' title='bbox 929 231 991 251; x_wconf 84' lang='eng' dir='ltr'><em>fal/ax</em></span> <span class='ocrx_word' id='word_1_53' title='bbox 1001 231 1058 251; x_wconf 90' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_54' title='bbox 1071 231 1154 251; x_wconf 79' lang='eng' dir='ltr'><em>14698T</em></span> <span class='ocrx_word' id='word_1_55' title='bbox 1164 231 1312 256; x_wconf 87' lang='eng' dir='ltr'>(DQ768123)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_13' title="bbox 625 73 629 219">
+    <p class='ocr_par' dir='ltr' id='par_1_14' title="bbox 625 73 629 219">
+     <span class='ocr_line' id='line_1_22' title="bbox 625 73 629 219; baseline 0 916"><span class='ocrx_word' id='word_1_56' title='bbox 625 73 629 219; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_14' title="bbox 654 199 794 397">
+    <p class='ocr_par' dir='ltr' id='par_1_15' title="bbox 654 199 794 397">
+     <span class='ocr_line' id='line_1_23' title="bbox 716 199 734 232; baseline 0 903"><span class='ocrx_word' id='word_1_57' title='bbox 716 199 734 232; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_24' title="bbox 654 232 794 346; baseline 0 -76"><span class='ocrx_word' id='word_1_58' title='bbox 654 232 794 346; x_wconf 95' lang='eng' dir='ltr'><em>    </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_25' title="bbox 716 346 740 397; baseline 0 0"><span class='ocrx_word' id='word_1_59' title='bbox 716 346 740 397; x_wconf 95' lang='eng' dir='ltr'><em>  </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_15' title="bbox 626 217 658 219">
+    <p class='ocr_par' dir='ltr' id='par_1_16' title="bbox 626 217 658 219">
+     <span class='ocr_line' id='line_1_26' title="bbox 626 217 658 219; baseline 0 916"><span class='ocrx_word' id='word_1_60' title='bbox 626 217 658 219; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_16' title="bbox 631 227 652 241">
+    <p class='ocr_par' dir='ltr' id='par_1_17' title="bbox 631 227 652 241">
+     <span class='ocr_line' id='line_1_27' title="bbox 631 227 652 241; baseline 0 0"><span class='ocrx_word' id='word_1_61' title='bbox 631 227 652 241; x_wconf 85' lang='eng'>68</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_17' title="bbox 656 146 658 288">
+    <p class='ocr_par' dir='ltr' id='par_1_18' title="bbox 656 146 658 288">
+     <span class='ocr_line' id='line_1_28' title="bbox 656 146 658 288; baseline 0 847"><span class='ocrx_word' id='word_1_62' title='bbox 656 146 658 288; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_18' title="bbox 407 306 1380 861">
+    <p class='ocr_par' dir='ltr' id='par_1_19' title="bbox 407 306 1380 860">
+     <span class='ocr_line' id='line_1_29' title="bbox 757 306 1380 333; baseline 0 -6"><span class='ocrx_word' id='word_1_63' title='bbox 757 306 777 320; x_wconf 79' lang='eng'>95</span> <span class='ocrx_word' id='word_1_64' title='bbox 795 307 966 327; x_wconf 81' lang='eng' dir='ltr'><em>Cora/Iococcus</em></span> <span class='ocrx_word' id='word_1_65' title='bbox 975 307 1068 333; x_wconf 82' lang='eng' dir='ltr'><em>exiguus</em></span> <span class='ocrx_word' id='word_1_66' title='bbox 1078 307 1134 327; x_wconf 88' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_67' title='bbox 1147 307 1232 327; x_wconf 79' lang='eng' dir='ltr'><em>14695T</em></span> <span class='ocrx_word' id='word_1_68' title='bbox 1241 307 1380 332; x_wconf 84' lang='eng' dir='ltr'><em>(AJ811598)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_30' title="bbox 748 345 1314 370; baseline 0 -5"><span class='ocrx_word' id='word_1_69' title='bbox 748 345 897 370; x_wconf 80' lang='eng' dir='ltr'><em>Myxococcus</em></span> <span class='ocrx_word' id='word_1_70' title='bbox 906 345 976 365; x_wconf 77' lang='eng' dir='ltr'><em>fu/vus</em></span> <span class='ocrx_word' id='word_1_71' title='bbox 986 345 1060 365; x_wconf 89' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_72' title='bbox 1072 345 1159 365; x_wconf 88' lang='eng'>100070</span> <span class='ocrx_word' id='word_1_73' title='bbox 1170 345 1314 370; x_wconf 82' lang='eng' dir='ltr'><em>(ABZ18209)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_31' title="bbox 734 382 1336 408; baseline 0 -6"><span class='ocrx_word' id='word_1_74' title='bbox 734 382 883 408; x_wconf 84' lang='eng' dir='ltr'><em>Myxococcus</em></span> <span class='ocrx_word' id='word_1_75' title='bbox 892 382 999 407; x_wconf 80' lang='eng' dir='ltr'><em>stipitatus</em></span> <span class='ocrx_word' id='word_1_76' title='bbox 1008 382 1082 402; x_wconf 91' lang='eng' dir='ltr'><em>NBRC</em></span> <span class='ocrx_word' id='word_1_77' title='bbox 1095 382 1182 402; x_wconf 86' lang='eng'>100069</span> <span class='ocrx_word' id='word_1_78' title='bbox 1193 382 1336 407; x_wconf 80' lang='eng' dir='ltr'><em>(ABZ18208)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_32' title="bbox 465 420 968 445; baseline 0 -5"><span class='ocrx_word' id='word_1_79' title='bbox 465 420 637 445; x_wconf 86' lang='eng' dir='ltr'><em>Phaselicystis</em></span> <span class='ocrx_word' id='word_1_80' title='bbox 646 420 707 440; x_wconf 87' lang='eng' dir='ltr'><em>flava</em></span> <span class='ocrx_word' id='word_1_81' title='bbox 717 420 815 440; x_wconf 90' lang='eng' dir='ltr'><em>NOSO-1</em></span> <span class='ocrx_word' id='word_1_82' title='bbox 829 420 968 445; x_wconf 85' lang='eng' dir='ltr'><em>(AJ233948)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_33' title="bbox 426 457 998 483; baseline 0 -5"><span class='ocrx_word' id='word_1_83' title='bbox 426 457 446 471; x_wconf 80' lang='eng'><strong>99</strong></span> <span class='ocrx_word' id='word_1_84' title='bbox 465 458 637 483; x_wconf 85' lang='eng' dir='ltr'><em>Phase/icystis</em></span> <span class='ocrx_word' id='word_1_85' title='bbox 646 457 707 478; x_wconf 88' lang='eng' dir='ltr'><em>flava</em></span> <span class='ocrx_word' id='word_1_86' title='bbox 716 457 845 478; x_wconf 90' lang='eng' dir='ltr'><em>SBK0001T</em></span> <span class='ocrx_word' id='word_1_87' title='bbox 853 458 998 483; x_wconf 87' lang='eng' dir='ltr'>(EU545827)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_34' title="bbox 451 495 1002 521; baseline 0 -5"><span class='ocrx_word' id='word_1_88' title='bbox 451 495 592 521; x_wconf 86' lang='eng' dir='ltr'><em>Byssovorax</em></span> <span class='ocrx_word' id='word_1_89' title='bbox 601 496 690 516; x_wconf 83' lang='eng' dir='ltr'><em>cruenta</em></span> <span class='ocrx_word' id='word_1_90' title='bbox 701 495 757 516; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_91' title='bbox 770 495 854 516; x_wconf 89' lang='eng' dir='ltr'><em>14553T</em></span> <span class='ocrx_word' id='word_1_92' title='bbox 863 495 1002 521; x_wconf 85' lang='eng' dir='ltr'><em>(AJ833647)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_35' title="bbox 446 533 974 559; baseline 0 -6"><span class='ocrx_word' id='word_1_93' title='bbox 446 533 576 559; x_wconf 87' lang='eng' dir='ltr'><em>Sorangium</em></span> <span class='ocrx_word' id='word_1_94' title='bbox 585 533 714 553; x_wconf 85' lang='eng' dir='ltr'><em>cellulosum</em></span> <span class='ocrx_word' id='word_1_95' title='bbox 723 533 754 553; x_wconf 87' lang='eng' dir='ltr'><em>So</em></span> <span class='ocrx_word' id='word_1_96' title='bbox 764 533 822 553; x_wconf 86' lang='eng' dir='ltr'><em>ce26</em></span> <span class='ocrx_word' id='word_1_97' title='bbox 832 533 974 558; x_wconf 84' lang='eng' dir='ltr'>(AF387629)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_36' title="bbox 437 570 962 596; baseline 0 -5"><span class='ocrx_word' id='word_1_98' title='bbox 437 570 567 596; x_wconf 85' lang='eng' dir='ltr'><em>Sorangium</em></span> <span class='ocrx_word' id='word_1_99' title='bbox 577 571 705 591; x_wconf 85' lang='eng' dir='ltr'><em>cellulosum</em></span> <span class='ocrx_word' id='word_1_100' title='bbox 714 570 745 591; x_wconf 88' lang='eng' dir='ltr'><em>So</em></span> <span class='ocrx_word' id='word_1_101' title='bbox 755 571 813 591; x_wconf 88' lang='eng' dir='ltr'><em>ce56</em></span> <span class='ocrx_word' id='word_1_102' title='bbox 823 571 962 596; x_wconf 88' lang='eng' dir='ltr'><em>(AJ316014)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_37' title="bbox 465 609 1018 634; baseline 0 -5"><span class='ocrx_word' id='word_1_103' title='bbox 465 609 596 634; x_wconf 77' lang='eng' dir='ltr'><em>Sorangium</em></span> <span class='ocrx_word' id='word_1_104' title='bbox 605 609 734 629; x_wconf 83' lang='eng' dir='ltr'><em>cellulosum</em></span> <span class='ocrx_word' id='word_1_105' title='bbox 742 609 859 629; x_wconf 82' lang='eng'><em>800157-2</em></span> <span class='ocrx_word' id='word_1_106' title='bbox 870 609 1018 634; x_wconf 83' lang='eng' dir='ltr'>(DQ256394)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_38' title="bbox 447 647 983 685; baseline 0 -18"><span class='ocrx_word' id='word_1_107' title='bbox 447 647 591 685; x_wconf 69' lang='eng' dir='ltr'><em>87Soremgium</em></span> <span class='ocrx_word' id='word_1_108' title='bbox 601 647 729 667; x_wconf 77' lang='eng' dir='ltr'><em>cellulosum</em></span> <span class='ocrx_word' id='word_1_109' title='bbox 738 647 826 667; x_wconf 84' lang='eng'><em>809881</em></span> <span class='ocrx_word' id='word_1_110' title='bbox 841 647 983 672; x_wconf 86' lang='eng' dir='ltr'>(AF467672)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_39' title="bbox 465 684 1014 710; baseline 0 -5"><span class='ocrx_word' id='word_1_111' title='bbox 465 684 596 710; x_wconf 84' lang='eng' dir='ltr'><em>Sorangium</em></span> <span class='ocrx_word' id='word_1_112' title='bbox 606 685 734 705; x_wconf 80' lang='eng' dir='ltr'><em>cellulosum</em></span> <span class='ocrx_word' id='word_1_113' title='bbox 743 684 856 705; x_wconf 82' lang='eng'><em>809721—1</em></span> <span class='ocrx_word' id='word_1_114' title='bbox 870 685 1014 710; x_wconf 90' lang='eng' dir='ltr'><em>(AY032880)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_40' title="bbox 468 722 1016 748; baseline 0 -6"><span class='ocrx_word' id='word_1_115' title='bbox 468 722 599 748; x_wconf 86' lang='eng' dir='ltr'><em>Sorangium</em></span> <span class='ocrx_word' id='word_1_116' title='bbox 608 722 737 742; x_wconf 87' lang='eng' dir='ltr'><em>cellulosum</em></span> <span class='ocrx_word' id='word_1_117' title='bbox 746 722 858 742; x_wconf 80' lang='eng'>300089—1</span> <span class='ocrx_word' id='word_1_118' title='bbox 873 722 1016 747; x_wconf 84' lang='eng' dir='ltr'><em>(AYO79453)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_41' title="bbox 417 759 1017 785; baseline -0.002 -5"><span class='ocrx_word' id='word_1_119' title='bbox 417 759 437 773; x_wconf 70' lang='eng'><em>54</em></span> <span class='ocrx_word' id='word_1_120' title='bbox 455 759 585 785; x_wconf 83' lang='eng' dir='ltr'><em>Sarangium</em></span> <span class='ocrx_word' id='word_1_121' title='bbox 595 760 723 780; x_wconf 86' lang='eng' dir='ltr'><em>cellulosum</em></span> <span class='ocrx_word' id='word_1_122' title='bbox 732 759 864 780; x_wconf 81' lang='eng'><em>809735-22</em></span> <span class='ocrx_word' id='word_1_123' title='bbox 875 760 1017 785; x_wconf 88' lang='eng' dir='ltr'>(AF467675)</span> 
+     </span>
+     <span class='ocr_line' id='line_1_42' title="bbox 407 797 1067 845; baseline 0 -28"><span class='ocrx_word' id='word_1_124' title='bbox 407 806 491 845; x_wconf 63' lang='eng'><em>.1:</em></span> <span class='ocrx_word' id='word_1_125' title='bbox 502 797 684 823; x_wconf 84' lang='eng' dir='ltr'><em>Chondromyces</em></span> <span class='ocrx_word' id='word_1_126' title='bbox 693 797 839 823; x_wconf 84' lang='eng' dir='ltr'><em>lanuginosus</em></span> <span class='ocrx_word' id='word_1_127' title='bbox 848 797 877 823; x_wconf 86' lang='eng' dir='ltr'><em>Sy</em></span> <span class='ocrx_word' id='word_1_128' title='bbox 886 797 919 817; x_wconf 81' lang='eng' dir='ltr'><em>t2T</em></span> <span class='ocrx_word' id='word_1_129' title='bbox 929 797 1067 823; x_wconf 84' lang='eng' dir='ltr'><em>(AJ233939)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_43' title="bbox 429 831 1060 860; baseline 0 -5"><span class='ocrx_word' id='word_1_130' title='bbox 429 831 450 845; x_wconf 73' lang='eng'><em>79</em></span> <span class='ocrx_word' id='word_1_131' title='bbox 503 835 685 860; x_wconf 81' lang='eng' dir='ltr'><em>Chondromyces</em></span> <span class='ocrx_word' id='word_1_132' title='bbox 694 835 798 855; x_wconf 84' lang='eng' dir='ltr'><em>robustus</em></span> <span class='ocrx_word' id='word_1_133' title='bbox 807 835 846 855; x_wconf 91' lang='eng' dir='ltr'><em>Cm</em></span> <span class='ocrx_word' id='word_1_134' title='bbox 857 835 913 855; x_wconf 74' lang='eng' dir='ltr'><em>a13T</em></span> <span class='ocrx_word' id='word_1_135' title='bbox 922 835 1060 860; x_wconf 87' lang='eng' dir='ltr'><em>(AJ233942)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_19' title="bbox 694 367 711 381">
+    <p class='ocr_par' dir='ltr' id='par_1_20' title="bbox 694 367 711 381">
+     <span class='ocr_line' id='line_1_44' title="bbox 694 367 711 381; baseline 0 0"><span class='ocrx_word' id='word_1_136' title='bbox 694 367 711 381; x_wconf 83' lang='eng'>51</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_20' title="bbox 1070 427 1374 474">
+    <p class='ocr_par' dir='ltr' id='par_1_21' title="bbox 1070 427 1374 474">
+     <span class='ocr_line' id='line_1_45' title="bbox 1070 427 1374 474; baseline 0 -13"><span class='ocrx_word' id='word_1_137' title='bbox 1070 427 1108 474; x_wconf 70' lang='eng'>}</span> <span class='ocrx_word' id='word_1_138' title='bbox 1123 441 1374 467; x_wconf 84' lang='eng' dir='ltr'><em>Phaselicystidaceae</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_21' title="bbox 1123 700 1302 726">
+    <p class='ocr_par' dir='ltr' id='par_1_22' title="bbox 1123 700 1302 726">
+     <span class='ocr_line' id='line_1_46' title="bbox 1123 700 1302 726; baseline 0 -6"><span class='ocrx_word' id='word_1_139' title='bbox 1123 700 1302 726; x_wconf 80' lang='eng' dir='ltr'><em>Po/yangiaceae</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_22' title="bbox 405 824 407 884">
+    <p class='ocr_par' dir='ltr' id='par_1_23' title="bbox 405 824 407 884">
+     <span class='ocr_line' id='line_1_47' title="bbox 405 824 407 884; baseline 0 251"><span class='ocrx_word' id='word_1_140' title='bbox 405 824 407 884; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_23' title="bbox 326 860 407 865">
+    <p class='ocr_par' dir='ltr' id='par_1_24' title="bbox 326 860 407 865">
+     <span class='ocr_line' id='line_1_48' title="bbox 326 860 407 865; baseline 0 270"><span class='ocrx_word' id='word_1_141' title='bbox 326 860 407 865; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_24' title="bbox 381 870 1388 1126">
+    <p class='ocr_par' dir='ltr' id='par_1_25' title="bbox 381 870 1017 921">
+     <span class='ocr_line' id='line_1_49' title="bbox 381 870 1017 921; baseline 0 -28"><span class='ocrx_word' id='word_1_142' title='bbox 381 870 501 921; x_wconf 58' lang='eng' dir='ltr'><em>“Ll:</em></span> <span class='ocrx_word' id='word_1_143' title='bbox 513 872 696 898; x_wconf 85' lang='eng' dir='ltr'><em>Chondromyces</em></span> <span class='ocrx_word' id='word_1_144' title='bbox 705 874 807 893; x_wconf 81' lang='eng' dir='ltr'><em>crocatus</em></span> <span class='ocrx_word' id='word_1_145' title='bbox 816 872 855 893; x_wconf 90' lang='eng' dir='ltr'><em>Cm</em></span> <span class='ocrx_word' id='word_1_146' title='bbox 866 873 893 893; x_wconf 77' lang='eng'>06</span> <span class='ocrx_word' id='word_1_147' title='bbox 903 873 1017 898; x_wconf 86' lang='eng' dir='ltr'>(M94275)</span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_26' title="bbox 399 908 1388 1125">
+     <span class='ocr_line' id='line_1_50' title="bbox 399 908 913 936; baseline 0 -5"><span class='ocrx_word' id='word_1_148' title='bbox 399 908 420 923; x_wconf 73' lang='eng'><em>63</em></span> <span class='ocrx_word' id='word_1_149' title='bbox 503 911 604 931; x_wconf 83' lang='eng' dir='ltr'><em>JahneI/a</em></span> <span class='ocrx_word' id='word_1_150' title='bbox 614 911 704 931; x_wconf 77' lang='eng' dir='ltr'><em>thaxteri</em></span> <span class='ocrx_word' id='word_1_151' title='bbox 712 911 733 931; x_wconf 89' lang='eng' dir='ltr'>Pl</span> <span class='ocrx_word' id='word_1_152' title='bbox 742 911 764 931; x_wconf 84' lang='eng' dir='ltr'><em>t3</em></span> <span class='ocrx_word' id='word_1_153' title='bbox 774 911 913 936; x_wconf 85' lang='eng' dir='ltr'><em>(AJ233943)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_51' title="bbox 637 948 1029 974; baseline 0 -6"><span class='ocrx_word' id='word_1_154' title='bbox 637 948 728 968; x_wconf 87' lang='eng' dir='ltr'><em>Kof/eria</em></span> <span class='ocrx_word' id='word_1_155' title='bbox 738 948 794 968; x_wconf 84' lang='eng' dir='ltr'><em>flava</em></span> <span class='ocrx_word' id='word_1_156' title='bbox 804 948 825 968; x_wconf 90' lang='eng' dir='ltr'><em>Pl</em></span> <span class='ocrx_word' id='word_1_157' title='bbox 835 948 881 968; x_wconf 80' lang='eng' dir='ltr'><em>vt1T</em></span> <span class='ocrx_word' id='word_1_158' title='bbox 891 948 1029 974; x_wconf 85' lang='eng' dir='ltr'><em>(AJ233944)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_52' title="bbox 857 986 1372 1012; baseline 0 -6"><span class='ocrx_word' id='word_1_159' title='bbox 857 986 1023 1012; x_wconf 81' lang='eng' dir='ltr'><em>Enhygromyxa</em></span> <span class='ocrx_word' id='word_1_160' title='bbox 1033 986 1103 1006; x_wconf 84' lang='eng' dir='ltr'><em>salina</em></span> <span class='ocrx_word' id='word_1_161' title='bbox 1113 986 1219 1006; x_wconf 84' lang='eng' dir='ltr'><em>SMK-1-3</em></span> <span class='ocrx_word' id='word_1_162' title='bbox 1229 986 1372 1011; x_wconf 80' lang='eng' dir='ltr'><em>(AB097591)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_53' title="bbox 883 1024 1367 1049; baseline 0 -5"><span class='ocrx_word' id='word_1_163' title='bbox 883 1024 1026 1049; x_wconf 80' lang='eng' dir='ltr'><em>Plesiocystis</em></span> <span class='ocrx_word' id='word_1_164' title='bbox 1033 1024 1125 1049; x_wconf 79' lang='eng' dir='ltr'><em>paciﬁca</em></span> <span class='ocrx_word' id='word_1_165' title='bbox 1135 1024 1215 1044; x_wconf 86' lang='eng' dir='ltr'><em>SIR-1T</em></span> <span class='ocrx_word' id='word_1_166' title='bbox 1224 1024 1367 1049; x_wconf 87' lang='eng' dir='ltr'><em>(AB083432)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_54' title="bbox 861 1062 1388 1087; baseline 0 -5"><span class='ocrx_word' id='word_1_167' title='bbox 861 1062 1015 1087; x_wconf 78' lang='eng' dir='ltr'><em>‘Nannocystis</em></span> <span class='ocrx_word' id='word_1_168' title='bbox 1025 1062 1157 1087; x_wconf 69' lang='eng' dir='ltr'><em>aggregans’</em></span> <span class='ocrx_word' id='word_1_169' title='bbox 1169 1062 1200 1082; x_wconf 90' lang='eng' dir='ltr'><em>Na</em></span> <span class='ocrx_word' id='word_1_170' title='bbox 1211 1062 1235 1082; x_wconf 76' lang='eng'>31</span> <span class='ocrx_word' id='word_1_171' title='bbox 1250 1062 1388 1087; x_wconf 84' lang='eng' dir='ltr'><em>(AJ233945)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_55' title="bbox 785 1097 1361 1125; baseline 0 -6"><span class='ocrx_word' id='word_1_172' title='bbox 785 1097 816 1111; x_wconf 76' lang='eng'>10°</span> <span class='ocrx_word' id='word_1_173' title='bbox 841 1099 990 1125; x_wconf 83' lang='eng' dir='ltr'><em>Nannocystis</em></span> <span class='ocrx_word' id='word_1_174' title='bbox 999 1099 1101 1119; x_wconf 85' lang='eng' dir='ltr'><em>exedens</em></span> <span class='ocrx_word' id='word_1_175' title='bbox 1111 1099 1142 1119; x_wconf 87' lang='eng' dir='ltr'><em>Na</em></span> <span class='ocrx_word' id='word_1_176' title='bbox 1152 1099 1208 1119; x_wconf 91' lang='eng' dir='ltr'>e571</span> <span class='ocrx_word' id='word_1_177' title='bbox 1222 1099 1361 1124; x_wconf 82' lang='eng' dir='ltr'><em>(AJ233947)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_25' title="bbox 768 997 770 1034">
+    <p class='ocr_par' dir='ltr' id='par_1_27' title="bbox 768 997 770 1034">
+     <span class='ocr_line' id='line_1_56' title="bbox 768 997 770 1034; baseline 0 101"><span class='ocrx_word' id='word_1_178' title='bbox 768 997 770 1034; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_26' title="bbox 770 1032 872 1034">
+    <p class='ocr_par' dir='ltr' id='par_1_28' title="bbox 770 1032 872 1034">
+     <span class='ocr_line' id='line_1_57' title="bbox 770 1032 872 1034; baseline 0 101"><span class='ocrx_word' id='word_1_179' title='bbox 770 1032 872 1034; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_27' title="bbox 802 268 1417 294">
+    <p class='ocr_par' dir='ltr' id='par_1_29' title="bbox 802 269 1417 294">
+     <span class='ocr_line' id='line_1_58' title="bbox 802 269 1417 294; baseline 0 -5"><span class='ocrx_word' id='word_1_180' title='bbox 802 269 972 289; x_wconf 82' lang='eng' dir='ltr'><em>Cora/lococcus</em></span> <span class='ocrx_word' id='word_1_181' title='bbox 981 269 1111 289; x_wconf 82' lang='eng' dir='ltr'><em>coral/aides</em></span> <span class='ocrx_word' id='word_1_182' title='bbox 1121 269 1178 289; x_wconf 87' lang='eng' dir='ltr'>DSM</span> <span class='ocrx_word' id='word_1_183' title='bbox 1189 269 1259 289; x_wconf 83' lang='eng' dir='ltr'><em>2259T</em></span> <span class='ocrx_word' id='word_1_184' title='bbox 1269 269 1417 294; x_wconf 87' lang='eng' dir='ltr'>(DQ768120)</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_28' title="bbox 1430 98 1479 309">
+    <p class='ocr_par' dir='ltr' id='par_1_30' title="bbox 1430 98 1479 309">
+     <span class='ocr_line' id='line_1_59' title="bbox 1430 178 1448 227; textangle 90"><span class='ocrx_word' id='word_1_185' title='bbox 1430 178 1448 227; x_wconf 63' lang='eng' dir='ltr'>V</span> 
+     </span>
+     <span class='ocr_line' id='line_1_60' title="bbox 1453 98 1479 309; textangle 90"><span class='ocrx_word' id='word_1_186' title='bbox 1453 98 1479 309; x_wconf 61' lang='eng' dir='ltr'><em>eeeuuazoeqozslfg</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_29' title="bbox 1410 373 1428 458">
+    <p class='ocr_par' dir='ltr' id='par_1_31' title="bbox 1410 373 1428 458">
+     <span class='ocr_line' id='line_1_61' title="bbox 1410 373 1428 405; baseline 0 0"><span class='ocrx_word' id='word_1_187' title='bbox 1410 373 1428 405; x_wconf 62' lang='eng' dir='ltr'><em>J</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_62' title="bbox 1410 428 1427 458; baseline 0 -24"><span class='ocrx_word' id='word_1_188' title='bbox 1410 428 1427 458; x_wconf 31' lang='eng' dir='ltr'><strong>N</strong></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_30' title="bbox 1428 601 1479 760">
+    <p class='ocr_par' dir='ltr' id='par_1_32' title="bbox 1428 601 1479 760">
+     <span class='ocr_line' id='line_1_63' title="bbox 1428 650 1448 710; textangle 90"><span class='ocrx_word' id='word_1_189' title='bbox 1428 650 1448 710; x_wconf 57' lang='eng' dir='ltr'>V</span> 
+     </span>
+     <span class='ocr_line' id='line_1_64' title="bbox 1453 601 1479 760; textangle 90"><span class='ocrx_word' id='word_1_190' title='bbox 1453 601 1479 760; x_wconf 64' lang='eng' dir='ltr'><em>aeeuybuwog</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_31' title="bbox 1426 23 1432 1113">
+    <p class='ocr_par' dir='ltr' id='par_1_33' title="bbox 1426 23 1432 1113">
+     <span class='ocr_line' id='line_1_65' title="bbox 1426 23 1432 1113; baseline 0 22"><span class='ocrx_word' id='word_1_191' title='bbox 1426 23 1432 1113; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_32' title="bbox 1430 939 1478 1135">
+    <p class='ocr_par' dir='ltr' id='par_1_34' title="bbox 1430 939 1478 1135">
+     <span class='ocr_line' id='line_1_66' title="bbox 1430 1026 1448 1047; textangle 90"><span class='ocrx_word' id='word_1_192' title='bbox 1430 1026 1448 1047; x_wconf 86' lang='eng' dir='ltr'>Y</span> 
+     </span>
+     <span class='ocr_line' id='line_1_67' title="bbox 1453 939 1478 1135; textangle 90"><span class='ocrx_word' id='word_1_193' title='bbox 1453 939 1478 1135; x_wconf 67' lang='eng' dir='ltr'><em>eBeU/JS/(oouueN</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_33' title="bbox 1410 1109 1428 1123">
+    <p class='ocr_par' dir='ltr' id='par_1_35' title="bbox 1410 1109 1428 1123">
+     <span class='ocr_line' id='line_1_68' title="bbox 1410 1109 1428 1123; baseline 0 0"><span class='ocrx_word' id='word_1_194' title='bbox 1410 1109 1428 1123; x_wconf 54' lang='eng' dir='ltr'><em>J</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijs.0.003822-0-000.pbm.png b/examples/ijs.0.003822-0-000.pbm.png
new file mode 100644
index 00000000..024fea01
Binary files /dev/null and b/examples/ijs.0.003822-0-000.pbm.png differ
diff --git a/examples/ijs.0.003822-0-000.pbm.png.hocr b/examples/ijs.0.003822-0-000.pbm.png.hocr
new file mode 100644
index 00000000..f8d29022
--- /dev/null
+++ b/examples/ijs.0.003822-0-000.pbm.png.hocr
@@ -0,0 +1,80 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+    "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+ <head>
+  <title>
+</title>
+<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
+  <meta name='ocr-system' content='tesseract 3.03' />
+  <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
+</head>
+<body>
+  <div class='ocr_page' id='page_1' title='image "ijs.0.003822-0-000.pbm.png"; bbox 0 0 1656 372; ppageno 0'>
+   <div class='ocr_carea' id='block_1_1' title="bbox 365 2 886 56">
+    <p class='ocr_par' dir='ltr' id='par_1_1' title="bbox 365 2 886 56">
+     <span class='ocr_line' id='line_1_1' title="bbox 365 2 886 30; baseline 0 -6"><span class='ocrx_word' id='word_1_1' title='bbox 365 2 508 24; x_wconf 72' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_2' title='bbox 515 3 602 30; x_wconf 87' lang='eng' dir='ltr'><em>putealis</em></span> <span class='ocrx_word' id='word_1_3' title='bbox 610 2 662 24; x_wconf 88' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_4' title='bbox 673 2 749 24; x_wconf 82' lang='eng' dir='ltr'><em>16056T</em></span> <span class='ocrx_word' id='word_1_5' title='bbox 758 3 886 30; x_wconf 86' lang='eng' dir='ltr'><em>(AY574979)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_2' title="bbox 753 39 774 56; baseline 0 0"><span class='ocrx_word' id='word_1_6' title='bbox 753 39 774 56; x_wconf 90' lang='eng'>66</span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_2' title="bbox 0 7 1154 329">
+    <p class='ocr_par' dir='ltr' id='par_1_2' title="bbox 0 7 1049 321">
+     <span class='ocr_line' id='line_1_3' title="bbox 0 7 358 44; baseline 0 328"><span class='ocrx_word' id='word_1_7' title='bbox 0 7 358 44; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_4' title="bbox 0 44 995 80; baseline 0 -16"><span class='ocrx_word' id='word_1_8' title='bbox 0 44 995 80; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_5' title="bbox 0 243 1049 321; baseline 0 -56"><span class='ocrx_word' id='word_1_9' title='bbox 0 243 1049 321; x_wconf 95' lang='eng' dir='ltr'><em>   </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_3' title="bbox 955 38 1655 342">
+    <p class='ocr_par' dir='ltr' id='par_1_3' title="bbox 961 38 1645 139">
+     <span class='ocr_line' id='line_1_6' title="bbox 995 38 1509 66; baseline 0 -6"><span class='ocrx_word' id='word_1_10' title='bbox 995 39 1138 60; x_wconf 84' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_11' title='bbox 1147 39 1304 66; x_wconf 85' lang='eng' dir='ltr'><em>carbinoliphi/us</em></span> <span class='ocrx_word' id='word_1_12' title='bbox 1313 38 1365 60; x_wconf 72' lang='eng' dir='ltr'><em>D41T</em></span> <span class='ocrx_word' id='word_1_13' title='bbox 1374 39 1509 66; x_wconf 86' lang='eng' dir='ltr'><em>(DQ186200)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_7' title="bbox 1161 72 1645 101; baseline 0 -6"><span class='ocrx_word' id='word_1_14' title='bbox 1161 73 1303 95; x_wconf 72' lang='eng' dir='ltr'><em>Desu/fovibr/o</em></span> <span class='ocrx_word' id='word_1_15' title='bbox 1312 73 1466 95; x_wconf 72' lang='eng' dir='ltr'><em>fructosivorans</em></span> <span class='ocrx_word' id='word_1_16' title='bbox 1474 72 1507 95; x_wconf 90' lang='eng' dir='ltr'><em>JJT</em></span> <span class='ocrx_word' id='word_1_17' title='bbox 1516 74 1645 101; x_wconf 88' lang='eng' dir='ltr'><em>(AF050101)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_8' title="bbox 961 107 1594 139; baseline 0 -10"><span class='ocrx_word' id='word_1_18' title='bbox 961 107 1119 129; x_wconf 87' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_19' title='bbox 1128 108 1316 129; x_wconf 86' lang='eng' dir='ltr'><em>marrakechensis</em></span> <span class='ocrx_word' id='word_1_20' title='bbox 1325 107 1449 139; x_wconf 47' lang='eng' dir='ltr'><em>EMSSDQ4Y</em></span> <span class='ocrx_word' id='word_1_21' title='bbox 1457 108 1594 135; x_wconf 83' lang='eng' dir='ltr'><em>(AM947130)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_4' title="bbox 955 141 1655 223">
+     <span class='ocr_line' id='line_1_9' title="bbox 1074 141 1655 170; baseline 0 -6"><span class='ocrx_word' id='word_1_22' title='bbox 1074 142 1216 164; x_wconf 74' lang='eng' dir='ltr'><em>Desu/fovibrio</em></span> <span class='ocrx_word' id='word_1_23' title='bbox 1224 142 1383 164; x_wconf 81' lang='eng' dir='ltr'><em>alcoholivorans</em></span> <span class='ocrx_word' id='word_1_24' title='bbox 1393 142 1444 164; x_wconf 93' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_25' title='bbox 1454 141 1517 164; x_wconf 84' lang='eng' dir='ltr'><em>5433T</em></span> <span class='ocrx_word' id='word_1_26' title='bbox 1526 142 1655 170; x_wconf 85' lang='eng' dir='ltr'><em>(AF053751)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_10' title="bbox 955 176 1496 223; baseline 0 -25"><span class='ocrx_word' id='word_1_27' title='bbox 955 182 1027 223; x_wconf 49' lang='eng' dir='ltr'><em>gr</em></span> <span class='ocrx_word' id='word_1_28' title='bbox 1036 176 1179 198; x_wconf 77' lang='eng' dir='ltr'><em>Desu/fovibrio</em></span> <span class='ocrx_word' id='word_1_29' title='bbox 1187 176 1314 204; x_wconf 78' lang='eng' dir='ltr'><em>magnet/Gus</em></span> <span class='ocrx_word' id='word_1_30' title='bbox 1323 176 1387 198; x_wconf 74' lang='eng' dir='ltr'><em>RS-1T</em></span> <span class='ocrx_word' id='word_1_31' title='bbox 1395 176 1496 204; x_wconf 83' lang='eng' dir='ltr'><em>(D43944)</em></span> 
+     </span>
+    </p>
+
+    <p class='ocr_par' dir='ltr' id='par_1_5' title="bbox 1000 210 1623 342">
+     <span class='ocr_line' id='line_1_11' title="bbox 1000 210 1553 238; baseline 0.002 -6"><span class='ocrx_word' id='word_1_32' title='bbox 1000 211 1143 233; x_wconf 83' lang='eng' dir='ltr'><em>Desu/fovibrio</em></span> <span class='ocrx_word' id='word_1_33' title='bbox 1151 211 1282 233; x_wconf 84' lang='eng' dir='ltr'><em>carbinolicus</em></span> <span class='ocrx_word' id='word_1_34' title='bbox 1291 211 1343 233; x_wconf 90' lang='eng' dir='ltr'><em>DSM</em></span> <span class='ocrx_word' id='word_1_35' title='bbox 1353 210 1416 233; x_wconf 80' lang='eng' dir='ltr'><em>3852T</em></span> <span class='ocrx_word' id='word_1_36' title='bbox 1424 211 1553 238; x_wconf 85' lang='eng' dir='ltr'><em>(AY626035)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_12' title="bbox 1058 245 1536 273; baseline 0 -6"><span class='ocrx_word' id='word_1_37' title='bbox 1058 246 1200 267; x_wconf 83' lang='eng' dir='ltr'><em>Desulfovibr/o</em></span> <span class='ocrx_word' id='word_1_38' title='bbox 1208 246 1334 267; x_wconf 85' lang='eng' dir='ltr'><em>burk/nensis</em></span> <span class='ocrx_word' id='word_1_39' title='bbox 1343 245 1399 267; x_wconf 78' lang='eng' dir='ltr'><em>HDvT</em></span> <span class='ocrx_word' id='word_1_40' title='bbox 1407 246 1536 273; x_wconf 87' lang='eng' dir='ltr'><em>(AF053752)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_13' title="bbox 1030 279 1557 307; baseline 0 -5"><span class='ocrx_word' id='word_1_41' title='bbox 1030 280 1172 302; x_wconf 75' lang='eng' dir='ltr'><em>Desu/fovibrio</em></span> <span class='ocrx_word' id='word_1_42' title='bbox 1181 280 1347 302; x_wconf 83' lang='eng' dir='ltr'><em>sulfodismutans</em></span> <span class='ocrx_word' id='word_1_43' title='bbox 1354 279 1448 302; x_wconf 77' lang='eng' dir='ltr'><em>ThA&lt;201T</em></span> <span class='ocrx_word' id='word_1_44' title='bbox 1457 280 1557 307; x_wconf 85' lang='eng' dir='ltr'><em>(Y17764)</em></span> 
+     </span>
+     <span class='ocr_line' id='line_1_14' title="bbox 1115 314 1623 342; baseline 0 -6"><span class='ocrx_word' id='word_1_45' title='bbox 1115 314 1258 336; x_wconf 85' lang='eng' dir='ltr'><em>Desulfovibrio</em></span> <span class='ocrx_word' id='word_1_46' title='bbox 1266 315 1379 342; x_wconf 83' lang='eng' dir='ltr'><em>inopinatus</em></span> <span class='ocrx_word' id='word_1_47' title='bbox 1388 314 1440 337; x_wconf 89' lang='eng' dir='ltr'><em>HHQ</em></span> <span class='ocrx_word' id='word_1_48' title='bbox 1449 314 1485 336; x_wconf 73' lang='eng' dir='ltr'><em>20T</em></span> <span class='ocrx_word' id='word_1_49' title='bbox 1494 315 1623 342; x_wconf 85' lang='eng' dir='ltr'><em>(AF177276)</em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_4' title="bbox 953 202 955 257">
+    <p class='ocr_par' dir='ltr' id='par_1_6' title="bbox 953 202 955 257">
+     <span class='ocr_line' id='line_1_15' title="bbox 953 202 955 257; baseline 0 115"><span class='ocrx_word' id='word_1_50' title='bbox 953 202 955 257; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_5' title="bbox 353 324 1107 326">
+    <p class='ocr_par' dir='ltr' id='par_1_7' title="bbox 353 324 1107 326">
+     <span class='ocr_line' id='line_1_16' title="bbox 353 324 1107 326; baseline 0 46"><span class='ocrx_word' id='word_1_51' title='bbox 353 324 1107 326; x_wconf 95' lang='eng' dir='ltr'><em> </em></span> 
+     </span>
+    </p>
+   </div>
+   <div class='ocr_carea' id='block_1_6' title="bbox 61 341 96 358">
+    <p class='ocr_par' dir='ltr' id='par_1_8' title="bbox 61 341 96 358">
+     <span class='ocr_line' id='line_1_17' title="bbox 61 341 96 358; baseline 0 0"><span class='ocrx_word' id='word_1_52' title='bbox 61 341 96 358; x_wconf 94' lang='eng'><em>0.01</em></span> 
+     </span>
+    </p>
+   </div>
+  </div>
+ </body>
+</html>
diff --git a/examples/ijsem-quickscrape.zip b/examples/ijsem-quickscrape.zip
new file mode 100644
index 00000000..42ae7e1f
Binary files /dev/null and b/examples/ijsem-quickscrape.zip differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F1.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F1.small.gif
new file mode 100644
index 00000000..2e154f87
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F1.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F2.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F2.small.gif
new file mode 100644
index 00000000..7abbc7a7
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F2.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F3.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F3.small.gif
new file mode 100644
index 00000000..d5234dd1
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F3.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.html b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.html
new file mode 100644
index 00000000..0647bffc
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.html
@@ -0,0 +1,1754 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Sulfurimonas gotlandica sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline,
+         and an emended description of the genus Sulfurimonas 
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4141" />
+      <meta content="/ijs/63/Pt_11/4141.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Sulfurimonas gotlandica sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline, and an emended description of the genus Sulfurimonas"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.048827-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Matthias Labrenz" name="DC.Contributor" />
+      <meta content="Jana Grote" name="DC.Contributor" />
+      <meta content="Kerstin Mammitzsch" name="DC.Contributor" />
+      <meta content="Henricus T. S. Boschker" name="DC.Contributor" />
+      <meta content="Michael Laue" name="DC.Contributor" />
+      <meta content="Günter Jost" name="DC.Contributor" />
+      <meta content="Sabine Glaubitz" name="DC.Contributor" />
+      <meta content="Klaus Jürgens" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Matthias Labrenz" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Jana Grote" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Kerstin Mammitzsch" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Henricus T. S. Boschker" />
+      <meta name="citation_author_institution"
+            content="2Royal Netherlands Institute of Sea Research (NIOZ), Yerseke, Netherlands" />
+      <meta name="citation_author" content="Michael Laue" />
+      <meta name="citation_author_institution"
+            content="3Arbeitsbereich Medizinische Biologie und Elektronenmikroskopisches Zentrum (EMZ), Universität Rostock, Germany" />
+      <meta name="citation_author" content="Günter Jost" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Sabine Glaubitz" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Klaus Jürgens" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta content="Sulfurimonas gotlandica sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline, and an emended description of the genus Sulfurimonas"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4141" name="citation_firstpage" />
+      <meta content="4148" name="citation_lastpage" />
+      <meta content="63/Pt_11/4141" name="citation_id" />
+      <meta content="63/Pt 11/4141" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4141" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.048827-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4141.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4141.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4141.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4141"
+            name="citation_public_url" />
+      <meta content="23749282" name="citation_pmid" />
+      <meta name="citation_access" content="all" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Proteobacteria" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4136.short" rel="prev" />
+      <link href="/content/63/Pt_11/4149.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d7768454e1">var callbackToken='56361896C937FF6';</script><script type="text/javascript" id="session-d7768454e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4141.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline"><em>Sulfurimonas gotlandica</em> sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline, and an emended
+                  description of the genus <em>Sulfurimonas</em></h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Matthias+Labrenz&amp;sortspec=date&amp;submit=Submit">Matthias Labrenz</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Jana+Grote&amp;sortspec=date&amp;submit=Submit">Jana Grote</a></span><a id="xref-aff-1-2" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-1" class="xref-fn" href="#fn-1">†</a><a id="xref-fn-2-1" class="xref-fn" href="#fn-2">‡</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Kerstin+Mammitzsch&amp;sortspec=date&amp;submit=Submit">Kerstin Mammitzsch</a></span><a id="xref-aff-1-3" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-2" class="xref-fn" href="#fn-1">†</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-4" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Henricus+T.+S.+Boschker&amp;sortspec=date&amp;submit=Submit">Henricus T. S. Boschker</a></span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-5" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Michael+Laue&amp;sortspec=date&amp;submit=Submit">Michael Laue</a></span><a id="xref-aff-3-1" class="xref-aff" href="#aff-3"><sup>3</sup></a><span class="xref-sep">,</span><a id="xref-fn-3-1" class="xref-fn" href="#fn-3">§</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-6" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=G%C3%BCnter+Jost&amp;sortspec=date&amp;submit=Submit">Günter Jost</a></span><a id="xref-aff-1-4" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-7" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Sabine+Glaubitz&amp;sortspec=date&amp;submit=Submit">Sabine Glaubitz</a></span><a id="xref-aff-1-5" class="xref-aff" href="#aff-1"><sup>1</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-8"><span class="name"><a class="name-search"
+                              href="/search?author1=Klaus+J%C3%BCrgens&amp;sortspec=date&amp;submit=Submit">Klaus Jürgens</a></span><a id="xref-aff-1-6" class="xref-aff" href="#aff-1"><sup>1</sup></a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>Royal Netherlands Institute of Sea Research (NIOZ), Yerseke, Netherlands
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-3" name="aff-3"></a><address><sup>3</sup>Arbeitsbereich Medizinische Biologie und Elektronenmikroskopisches Zentrum (EMZ), Universität Rostock, Germany
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> Matthias Labrenz <span class="em-link"><span class="em-addr">matthias.labrenz{at}io-warnemuende.de</span></span></li>
+                  </ol>
+                  <ul class="author-notes">
+                     <li class="fn-present-address" id="fn-2">
+                        <p id="p-2"><a class="rev-xref" href="#xref-fn-2-1">↵</a><span class="fn-label">‡</span> <strong>Present address:</strong> Center for Microbial Oceanography: Research and Education, SOEST, University of Hawaii at Manoa, Honolulu, HI 96822, USA.
+                        </p>
+                     </li>
+                     <li class="fn-present-address" id="fn-3">
+                        <p id="p-3"><a class="rev-xref" href="#xref-fn-3-1">↵</a><span class="fn-label">§</span> <strong>Present address:</strong> Robert Koch Institute, Berlin, Germany.
+                        </p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-6">A psychro- and aerotolerant bacterium was isolated from the sulfidic water of a pelagic redox zone of the central Baltic Sea.
+                     The slightly curved rod- or spiral-shaped cells were motile by one polar flagellum or two bipolar flagella. Growth was chemolithoautotrophic,
+                     with nitrate or nitrite as electron acceptor and either a variety of sulfur species of different oxidation states or hydrogen
+                     as electron donor. Although the bacterium was able to utilize organic substances such as acetate, pyruvate, peptone and yeast
+                     extract for growth, these compounds yielded considerably lower cell numbers than obtained with reduced sulfur or hydrogen;
+                     in addition, bicarbonate supplementation was necessary. The cells also had an absolute requirement for NaCl. Optimal growth
+                     occurred at 15 °C and at pH 6.6–8.0. The predominant fatty acid of this organism was 16 : 1ω7<em>c</em>, with 3-OH 14 : 0, 16 : 0, 16 : 1ω5<em>c</em>+<em>t</em> and 18 : 1ω7<em>c</em> present in smaller amounts. The DNA G+C content was 33.6 mol%. As determined in 16S rRNA gene sequence phylogeny analysis,
+                     the isolate belongs to the genus <span class="named-content genus" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                           href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, within the class <span class="named-content class" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                           href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span>, with 93.7 to 94.2 % similarity to the other species of the genus <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                           href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, <span class="named-content species" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                           href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span>, <span class="named-content species" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas paralvinellae"
+                           href="doi:10.1601/nm.10230"><em>Sulfurimonas paralvinellae</em></a></span> and <span class="named-content species" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                           href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span>. However, the distinct physiological and genotypic differences from these previously described taxa support the description
+                     of a novel species, <em>Sulfurimonas gotlandica</em> sp. nov. The type strain is GD1<sup>T</sup> ( = DSM 19862<sup>T</sup> = JCM 16533<sup>T</sup>). Our results also justify an emended description of the genus <span class="named-content genus" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                           href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>.
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-equal" id="fn-1">
+                        <p id="p-1"><a class="rev-xref" href="#xref-fn-1-1">↵</a><span class="fn-label">†</span> These authors contributed equally to this study.
+                        </p>
+                     </li>
+                     <li class="fn-other" id="fn-4">
+                        <p id="p-4">The GenBank/EMBL/DDBJ accession number for the 16S rRNA gene sequence of strain GD1<sup>T</sup> is AFRZ01000001 (804671..806178), locus_tag SMGD1_rRNA3.
+                        </p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="license" id="license-1">
+                  <p id="p-5">This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted
+                     use, distribution, and reproduction in any medium, provided the original work is properly cited.
+                  </p>
+               </div>
+               <p id="p-7">Deep-sea vents are among the most productive marine systems on Earth. The discovery of these primarily chemoautotrophic environments,
+                  in 1977, has been followed by an appreciation of the remarkable physiological and phylogenetic diversity of their endosymbiotic
+                  and often thermophilic inhabitants, most commonly species of the class <span class="named-content class" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                        href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span>. Moreover, deep-sea vent chemolithoautotrophs are thought to be representatives of the earliest biological communities on
+                  Earth (see the review by <a id="xref-ref-26-1" class="xref-bibr" href="#ref-26">Nakagawa &amp; Takai, 2008</a>). Indeed, many epsilonproteobacteria are globally ubiquitous in oxygen-deficient and sulfide-rich marine and terrestrial
+                  ecosystems, which accommodate their predominantly auto- to mixotrophic lifestyles (<a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Campbell <em>et al.</em>, 2006</a>). A number of studies have verified the significant role of epsilonproteobacteria in biogeochemical cycles, particularly
+                  those which are sulfur-dependent, as is the case in deep-sea hydrothermal fields (<a id="xref-ref-27-1" class="xref-bibr" href="#ref-27">Nakagawa <em>et al.</em>, 2005</a>; <a id="xref-ref-8-2" class="xref-bibr" href="#ref-8">Campbell <em>et al.</em>, 2006</a>), sulfidic cave springs (<a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">Engel <em>et al.</em>, 2004</a>) and autotrophic episymbiotic associations (<a id="xref-ref-35-1" class="xref-bibr" href="#ref-35">Suzuki <em>et al.</em>, 2006</a>). In the suboxic to sulfidic transition zones of aquatic pelagic redox zones, high dark CO<sub>2</sub> fixation rates, mainly due to the activities of epsilonproteobacterial chemolithoautotrophs, have been determined, for instance,
+                  in the Black Sea and the Baltic Sea (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Grote <em>et al.</em>, 2008</a>; <a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Glaubitz <em>et al.</em>, 2010</a>; <a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Jost <em>et al.</em>, 2008</a>).
+               </p>
+               <p id="p-8">The Baltic Sea is among the largest brackish basins of the world, with periodically anoxic conditions in its bottom waters.
+                  In the region known as the Baltic Proper there are a number of such areas, including the Gotland Deep, where at depths below
+                  50–60 m a stable halocline separates the water column into an upper oxygenated layer and underlying oxygen-deficient and anoxic/sulfidic
+                  layers (<a id="xref-ref-24-1" class="xref-bibr" href="#ref-24">Lepland &amp; Stevens, 1998</a>; <a id="xref-ref-28-1" class="xref-bibr" href="#ref-28">Neretin <em>et al.</em>, 2003</a>), in which high dark CO<sub>2</sub> fixation rates have been reported (<a id="xref-ref-20-2" class="xref-bibr" href="#ref-20">Jost <em>et al.</em>, 2010</a>).
+               </p>
+               <p id="p-9">In stimulation experiments (<a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Labrenz <em>et al.</em>, 2005</a>; <a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Brettar <em>et al.</em>, 2006</a>), quantitative 16S rRNA PCR (<a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Labrenz <em>et al.</em>, 2004</a>), catalysed reporter deposition–fluorescence <em>in situ</em> hybridization (CARD-FISH; <a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Grote <em>et al.</em>, 2007</a>) and microautoradiography (MICRO)-CARD-FISH (<a id="xref-ref-14-2" class="xref-bibr" href="#ref-14">Grote <em>et al.</em>, 2008</a>) analyses, as well as 16S rRNA stable isotope probing (RNA-SIP; <a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Glaubitz <em>et al.</em>, 2009</a>), the epsilonproteobacterial ‘Uncultured <span class="named-content family" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup was shown to account for up to 30 % of the total cell numbers in pelagic redox zones of the central
+                  Baltic Sea. The abundance of these bacteria highlights the importance of chemolithoautotrophic denitrification, which was
+                  convincingly demonstrated to be the major N-loss process in water columns with a sulfide–nitrate interface (<a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Brettar &amp; Rheinheimer, 1991</a>; <a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Hannig <em>et al.</em>, 2007</a>; <a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Jensen <em>et al.</em>, 2009</a>), catalysed by the GD17 group as potential key organisms for this process. According to its 16S rRNA phylogeny, the ‘Uncultured
+                  <span class="named-content family" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup belongs to the genus <span class="named-content genus" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span><em>,</em> which comprises mesophilic, facultatively anaerobic, chemolithoautotrophic species originating from deep-sea hydrothermal
+                  and marine sulfidic environments (<a id="xref-ref-36-1" class="xref-bibr" href="#ref-36">Takai <em>et al.</em>, 2006</a>). In previous work (<a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>) we described the isolation of strain Gotland Deep 1 (GD1<sup>T</sup>), a close phylogenetic relative (16S rRNA similarity of 95.7 %) and thus representative of the Baltic <span class="named-content genus" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> ‘Uncultured <span class="named-content family" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup. Selected genomic and physiological data suggested an ecological role for GD1<sup>T</sup>, especially with respect to its sulfide detoxification ability (<a id="xref-ref-15-2" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Here, we expand on previous work by presenting the taxonomic characteristics of GD1<sup>T</sup>. Our results form the basis of an emended description of the genus <span class="named-content genus" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>.
+               </p>
+               <p id="p-10">Strain GD1<sup>T</sup> was isolated from a pelagic redox zone of the Gotland Deep in the central Baltic Sea during a research cruise on board the
+                  RV <em>Alkor</em> in May 2005 (57° 19.2′ N 20° 03′ E). Water was collected in a free-flow bottle attached to a CTD-rosette from a depth of
+                  215 m. The <em>in situ</em> temperature was 6 °C, the salinity 13 practical salinity units (PSU), and the sulfide concentration 11 µM. Directly on board,
+                  100 µM KNO<sub>3</sub> and 100 µM Na<sub>2</sub>S<sub>2</sub>O<sub>3</sub> were added to the water samples, which were then incubated in the dark at 10 °C under anoxic conditions. For further isolation
+                  and cultivation in the laboratory, a modified version of artificial brackish water medium (ABW) (<a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Bruns <em>et al.</em>, 2002</a>) was used, consisting of 95 mM NaCl, 11.2 mM MgCl<sub>2</sub> . 6H<sub>2</sub>O, 2.3 mM CaCl<sub>2</sub> . 2H<sub>2</sub>O, 2.0 mM KCl, 6.4 mM Na<sub>2</sub>SO<sub>4</sub>, 192 µM KBr, 92 µM H<sub>3</sub>BO<sub>3</sub>, 34 µM SrCl<sub>2</sub>, 92 µM NH<sub>4</sub>Cl, 9 µM KH<sub>2</sub>PO<sub>4</sub> and 16 µM NaF, buffered with 10 mM HEPES (pH 7.3). For anaerobic cultivation, the medium was boiled, bubbled with N<sub>2</sub> for 30 min, and then autoclaved under anoxic conditions. Subsequently, anoxic and sterile-filtered 0.1 % (v/v) of the trace
+                  element solution SL10 (<a id="xref-ref-39-1" class="xref-bibr" href="#ref-39">Widdel <em>et al.</em>, 1983</a>), 0.2 % (v/v) of a 10-vitamin solution (<a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Balch <em>et al.</em>, 1979</a>), 0.02 % (v/v) of a selenite–tungstate solution (<a id="xref-ref-38-1" class="xref-bibr" href="#ref-38">Widdel &amp; Bak, 1992</a>), and 2–5 mM NaHCO<sub>3</sub> were added. The standard medium ABW+nitrate+thiosulfate (ABW+NS) was prepared by the variable addition of 10 mM KNO<sub>3</sub> and 10 mM Na<sub>2</sub>S<sub>2</sub>O<sub>3</sub>, with the final concentration depending on the experiment. A pure culture was acquired by the dilution to extinction method
+                  and was cryopreserved at −80 °C in glycerol for long-term storage.
+               </p>
+               <p id="p-11">Morphological, physiological, and metabolic characteristics were, for the most part, analysed as described earlier (<a id="xref-ref-15-3" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). For these analyses, strain GD1<sup>T</sup> was cultivated in triplicate for 7–10 days at 15 °C in the dark. Growth was usually measured by counting 4′,6-diamidino-2-phenylindole
+                  (DAPI) stained cells, observed using epifluorescence microscopy, or by flow cytometric determinations of SYBR-Green I (Molecular
+                  Probes) stained cells (<a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Labrenz <em>et al.</em>, 2007</a>) at the end of the experiment. <span class="named-content species" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> DSM 1251<sup>T</sup> was used as the reference strain in the cultivation experiments.
+               </p>
+               <p id="p-12">Isolate GD1<sup>T</sup> is a motile, Gram-reaction-negative, slightly curved or spirilla-shaped bacterium typically with one polar flagellum (<a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1a, b</a>), but in some cases two flagella at opposite poles (<a id="xref-fig-1-2" class="xref-fig" href="#F1">Fig. 1c</a>). Cell width was rather constant (mean = 0.66 µm, <span class="sc">sd</span> = 0.083 µm, <em>n</em> = 112) whereas cell length, i.e. from pole to pole, was variable (mean = 2.1 µm, <span class="sc">sd</span> = 0.54 µm, <em>n</em> = 112). The cells had a positive chemotactic response to nitrate (<a id="xref-ref-15-4" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Under optimal conditions in ABW+NS medium the cell doubling time of strain GD1<sup>T</sup> was 13 h. Cells in older cultures tended to form aggregates. Growth at temperatures in the range of 4–40 °C was investigated,
+                  with highest cell numbers obtained between 4 and 20 °C and optimal growth at 15 °C (<a id="xref-ref-15-5" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Thus, isolate GD1<sup>T</sup> is the first psychrotolerant species within the genus <span class="named-content genus" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, in which all member species at the time of writing are mesophilic (<a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>).
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4141/F1.expansion.html"><img alt="Fig. 1. " src="4141/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4141/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4141/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4141/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-13" class="first-child">Cell morphology of spirilla-shaped cells of strain GD1<sup>T</sup> cultivated on ABW+NS medium. (a) Fluorescence microscopy of 4′,6-diamidino-2-phenylindole (DAPI) stained cells. (b) Transmission
+                        electron microscopy of a bacterium with one flagellum and (c) of a bacterium with two flagella (indicated by arrows), both
+                        negatively stained with phosphotungstic acid.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4141/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4141/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Differential characteristics between strain GD1<sup>T</sup> and species of the genus <span class="named-content genus" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                              href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span></span>
+                     
+                     <p id="p-14" class="first-child">Taxa: 1, <em>Sulfurimonas gotlandica</em> sp. nov. GD1<sup>T</sup>; 2, <span class="named-content species" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                              href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> DSM 1251<sup>T</sup> (data from this study; <a id="xref-ref-37-1" class="xref-bibr" href="#ref-37">Timmer-ten Hoor, 1975</a>; <a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Brinkhoff <em>et al.</em>, 2005</a>); 3, <span class="named-content species" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas paralvinellae"
+                              href="doi:10.1601/nm.10230"><em>Sulfurimonas paralvinellae</em></a></span> GO25<sup>T</sup> (<a id="xref-ref-36-2" class="xref-bibr" href="#ref-36">Takai <em>et al.</em>, 2006</a>); 4, <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                              href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> OK10<sup>T</sup> (<a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Inagaki <em>et al.</em>, 2003</a>). <span class="sc">nd</span>, Not determined; +, positive; −, negative.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-20">To obtain media with different pH values, the pH of a 20 ml subsample from the anoxic ABW+NS was adjusted to pH 6.0, 6.5,
+                  6.7, 6.9, 7.1, 7.5, 8.0, 8.4 and 9.0 by the addition of the appropriate amount of 0.1 M HCl. For the experimental setup, the
+                  corresponding amount of 1 M HCl was added to the media preparations, which were then inoculated. After 14 days of incubation,
+                  the pH was measured. At an initial pH of 6.5–8.4, it remained constant (±0.02) throughout the experiment whereas below and
+                  above this range it decreased by about 0.18–0.25 pH units. Optimal growth occurred over a wide pH range (6.7–8.0) but no growth
+                  occurred at pH 6.0 and 8.4. The NaCl requirement was determined by cultivation in ABW+NS containing the following salt concentrations
+                  [NaCl (g l<sup>−1</sup>)/MgCl<sub>2</sub> . 6H<sub>2</sub>O (g l<sup>−1</sup>)]: 0/0, 0/0.50, 2.50/0.38, 5.00/0.75, 7.50/1.13, 10.00/1.50, 12.50/1.88, 15.00/2.25, 17.50/2.63 and 20.00/3.00. The isolate
+                  had an absolute requirement for NaCl and grew best with between 10 and 20 g NaCl l<sup>−1</sup>; the upper limit for growth was not further determined. No growth was observed in media without added NaCl, in contrast to
+                  <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> DSM 1251<sup>T</sup>, which grew equally well without NaCl and at all NaCl concentrations tested (<a id="xref-table-wrap-1-2" class="xref-table" href="#T1">Table 1</a>).
+               </p>
+               <p id="p-21">To identify the electron donors sustaining chemoautotrophic growth of isolate GD1<sup>T</sup>, ABW medium containing 5 mM nitrate was supplemented with sulfite (1 mM), sulfide (10 µM, 20 µM, 100 µM) or elemental sulfur
+                  (1 mM). Hydrogen utilization was assessed by bubbling ABW+NS with forming gas (N<sub>2</sub>/H<sub>2</sub>, 95 : 5) for several hours prior to inoculation and cultivation. Strain GD1<sup>T</sup> was able to use all of the tested electron donors as an energy source for growth although growth was inhibited by sulfide
+                  concentrations &gt;20 µM (<a id="xref-ref-15-6" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). This observation is in accordance with <em>in situ</em> activities of chemoautotrophic micro-organisms in pelagic Gotland Deep redox zones, where dark CO<sub>2</sub> fixation rates are significantly reduced at environmental sulfide concentrations &gt;20 µM (<a id="xref-ref-20-3" class="xref-bibr" href="#ref-20">Jost <em>et al.</em>, 2010</a>). As electron acceptors, nitrate (100 µM, 2 mM, 5 mM, 10 mM), nitrite (600 µM, 2 mM) (<a id="xref-ref-15-7" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>), manganese(IV) oxide (200 µM), manganese(III) acetate dihydrate (2.4 mM), iron(III) chloride hexahydrate (5 mM), fumarate
+                  (100 µM) and oxygen (4 % saturation, approx. 12 µmol O<sub>2</sub> l<sup>−1</sup>) were tested in ABW containing 5 mM thiosulfate. For the oxygen experiment, the oxygen content in fully oxygenated ABW+thiosulfate
+                  was measured with an optode (POF-PSt3; PreSens) and the appropriate amount of oxygen was then mixed with anoxic ABW+thiosulfate
+                  to achieve the desired amount of saturation. However, only nitrate and nitrite served as electron acceptors during growth
+                  of the bacterium.
+               </p>
+               <p id="p-22">Although the manganese and iron concentrations tested may have been too high and thereby suppressed cell growth, previous
+                  thiosulfate/manganese stimulation experiments with Baltic Sea water samples containing lower metal concentrations similarly
+                  failed to reveal active manganese-reducing species of the genus <span class="named-content genus" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> (<a id="xref-ref-22-2" class="xref-bibr" href="#ref-22">Labrenz <em>et al.</em>, 2005</a>). <span class="named-content species" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                        href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> is likewise unable to reduce ferrihydrite (<a id="xref-ref-17-2" class="xref-bibr" href="#ref-17">Inagaki <em>et al.</em>, 2003</a>), which further supports the lack of direct participation of strain GD1<sup>T</sup> in the Mn/Fe-shuttle (<a id="xref-ref-28-2" class="xref-bibr" href="#ref-28">Neretin <em>et al.</em>, 2003</a>) of Baltic pelagic redox zones. It also cannot be excluded that strain GD1<sup>T</sup> is able to grow in medium with an oxygen concentration below 4 %, given that the genome of this bacterium includes a gene
+                  encoding a putative cbb<sub>3</sub>-type cytochrome <em>c</em> oxidase with the potential to mediate aerobic respiration (<a id="xref-ref-15-8" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Whether aerobic respiration can occur at very low oxygen concentrations was beyond the scope of our experimental design.
+                  The oxygen sensitivity of strain GD1<sup>T</sup> was examined in detail, using ABW+NS with oxygen saturations of 0.5, 3, 5, 10, 20, 30, 40 and 50 %. Compared to oxygen-free
+                  conditions, oxygen concentrations ≥20 % reduced or inhibited the growth of this strain whereas oxygen concentrations ≤10 %
+                  had no such effect (<a id="xref-ref-15-9" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Thus, the oxygen tolerance of strain GD1<sup>T</sup> is similar to that of aerobic <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                        href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> OK10<sup>T</sup> (<a id="xref-table-wrap-1-3" class="xref-table" href="#T1">Table 1</a>). Based on our current knowledge, we consider strain GD1<sup>T</sup> to be an aerotolerant representative of the genus <span class="named-content genus" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>.
+               </p>
+               <p id="p-23">Chemolithoautotrophic growth was directly confirmed in ABW+NS containing <sup>14</sup>C-bicarbonate followed by a combination of fluorescence <em>in situ</em> hybridization and microautoradiography (MICRO-CARD-FISH) (<a id="xref-ref-15-10" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). As electron donor (in ABW+5 mM KNO<sub>3</sub>) alone or as electron donor and sole carbon source (in NaHCO<sub>3</sub>-free ABW+5 mM KNO<sub>3</sub>) the following compounds were tested: (a) glucose (0.1 mM), (b) a mixture of lactate, malate, fumarate, succinate, glycerine
+                  and glucose (abbreviated as mix 4) (100 µM), (c) yeast extract (0.01 mg l<sup>−1</sup>), (d) pyruvate (100 µM), (e) acetate (100 µM), (f) fumarate (100 µM), (g) alcohol mix (butanol, ethanol, methanol, propanol;
+                  100 µM) (<a id="xref-ref-15-11" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>) and (h) an amino acid mix (0.1 mM) consisting of (g l<sup>−1</sup>): β-alanine 0.466, <span class="sc">l</span>-arginine 0.872, <span class="sc">l</span>-asparagine 0.750, <span class="sc">l</span>-cysteine 0.606, <span class="sc">l</span>-glutamine 0.730, <span class="sc">l</span>-glutamic acid 0.736, glycine 0.376, isoleucine 0.656, <span class="sc">l</span>-leucine 0.656, <span class="sc">l</span>-methionine 0.746, <span class="sc">l</span>-phenylalanine 0.826, <span class="sc">l</span>-serine 0.526, <span class="sc">l</span>-threonine 0.596, <span class="sc">l</span>-valine 0.586, <span class="sc">l</span>-proline 0.576, <span class="sc">l</span>-tryptophan 1.022, <span class="sc">l</span>-histidine 0.776, <span class="sc">l</span>-lysine 0.822, <span class="sc">l</span>-tyrosine 0.906 and <span class="sc">l</span>-aspartic acid 0.666.
+               </p>
+               <p id="p-24">In the presence of 2 mM NaHCO<sub>3</sub>, the growth of isolate GD1<sup>T</sup> was promoted with formate, acetate, yeast extract, pyruvate and the amino acid mix as electron donors. However, maximal cell
+                  numbers were usually more than an order of magnitude lower than those reached with thiosulfate/nitrate-containing medium, as shown in
+                  <a id="xref-fig-2-1" class="xref-fig" href="#F2">Fig. 2(a)</a> for pyruvate, which was also used in radiotracer experiments aimed at confirming the capability of strain GD1<sup>T</sup> to use organics as electron donor. In those experiments, CO<sub>2</sub> production was measured following the addition of 16 kBq [2-<sup>14</sup>C]pyruvate (specific activity 0.6 GBq mmol<sup>−1</sup>) to cultures grown solely on pyruvate or on thiosulfate/pyruvate. After 24 h or 72 h of incubation, CO<sub>2</sub> was degassed by the acidification of cell-free medium and trapped in ethanolamine. In nitrate/pyruvate medium, the growth
+                  of strain GD1<sup>T</sup> was accompanied by elevated CO<sub>2</sub> production (<a id="xref-fig-2-2" class="xref-fig" href="#F2">Fig. 2b</a>). The simultaneous incorporation of [2-<sup>14</sup>C]pyruvate into GD1<sup>T</sup> cells was much less pronounced, but its uptake and contribution to biomass production were clearly determined
+                  in thiosulfate/nitrate/pyruvate medium, where total cell numbers were also higher than those reached in thiosulfate/nitrate
+                  medium (<a id="xref-fig-2-3" class="xref-fig" href="#F2">Fig. 2a</a>), but the difference was not statistically significant (unpublished data). By contrast, in NaHCO<sub>3</sub>-free medium strain GD1<sup>T</sup> was unable to use any of the organics offered simultaneously as electron donor and carbon source (<a id="xref-fig-2-4" class="xref-fig" href="#F2">Fig. 2a</a>). It has long been recognized that even heterotrophic bacteria may require CO<sub>2</sub> for growth (<a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Dehority, 1971</a>), e.g. in anaplerotic reactions (<a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Alonso-Sáez <em>et al.</em>, 2010</a>). Similar findings were reported for <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="Nitrobacter hamburgensis"
+                        href="doi:10.1601/nm.1487"><em>Nitrobacter hamburgensis</em></a></span>, which requires atmospheric CO<sub>2</sub> or the addition of sodium carbonate for mixotrophic growth (in the presence of NO<sub>2</sub><sup>−</sup>) on <span class="sc">d</span>-lactate (<a id="xref-ref-33-1" class="xref-bibr" href="#ref-33">Starkenburg <em>et al.</em>, 2008</a>). The authors of that study suggested that CO<sub>2</sub> fixation served as a reductant sink necessary to maintain cellular redox balance. The physiological background for the growth
+                  of isolate GD1<sup>T</sup> on organics is thus far unclear. In other species of the genus <span class="named-content genus" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, organic substance utilization is variable. For example, in a similar experiment <span class="named-content species" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> was able to use formate, fumarate, yeast extract and the alcohol mix as electron donors (<a id="xref-table-wrap-1-4" class="xref-table" href="#T1">Table 1</a>). The ability of this bacterium to oxidize formate was proposed in a genome analysis, which identified a formate dehydrogenase
+                  complex (<a id="xref-ref-31-1" class="xref-bibr" href="#ref-31">Sievert <em>et al.</em>, 2008</a>). Homologues of genes involved in glycolysis and proteolysis are also present in the genome of strain GD1<sup>T</sup> (<a id="xref-ref-15-12" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>), whereas <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                        href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> (<a id="xref-ref-17-3" class="xref-bibr" href="#ref-17">Inagaki <em>et al.</em>, 2003</a>; but tested without bicarbonate supplementation to the organic medium) and <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas paralvinellae"
+                        href="doi:10.1601/nm.10230"><em>Sulfurimonas paralvinellae</em></a></span> (<a id="xref-ref-36-3" class="xref-bibr" href="#ref-36">Takai <em>et al.</em>, 2006</a>) are unable to grow on organic compounds. In conclusion, although under specific circumstances organic compounds enhance
+                  the growth of some species of the genus <span class="named-content genus" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, members of this genus characteristically grow chemolithoautotrophically.
+               </p>
+               <div id="F2" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4141/F2.expansion.html"><img alt="Fig. 2. " src="4141/F2.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4141/F2.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4141/F2.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4141/F2">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 2. </span> 
+                     
+                     <p id="p-25" class="first-child">Impact of pyruvate on the growth of isolate GD1<sup>T</sup>. Error bars indicate the standard deviation of three independent replicates for each assay. (a) Growth on media with different
+                        substrate combinations: 1, NaHCO<sub>3</sub>, S<sub>2</sub>O<sub>3</sub><sup>2−</sup>, NO<sub>3</sub><sup>−</sup>; 2, NaHCO<sub>3</sub>, S<sub>2</sub>O<sub>3</sub><sup>2−</sup>, NO<sub>3</sub><sup>−</sup>, pyruvate; 3, NaHCO<sub>3</sub>, pyruvate; 4, pyruvate; 5, ABW without further supplements. The relative enrichment factor describes the increase of cell
+                        numbers after 7 days of incubation compared to the initial cell numbers after inoculation at day 0 (6.1×10<sup>5</sup> ml<sup>−1</sup>). (b) <sup>14</sup>CO<sub>2</sub> production and [<sup>14</sup>C]pyruvate incorporation after 24 h and 72 h of incubation. Media: 1, NaHCO<sub>3</sub>, S<sub>2</sub>O<sub>3</sub><sup>2−</sup>, NO<sub>3</sub><sup>−</sup>, [<sup>14</sup>C]pyruvate; 2, NaHCO<sub>3</sub>, NO<sub>3</sub><sup>−</sup>, [<sup>14</sup>C]pyruvate. P, pyruvate incorporation; CO<sub>2</sub>, CO<sub>2</sub> production.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-26">Total fatty acids and phospholipid-derived fatty acids were extracted as described by Sasser (1990) and <a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">Boschker (2004)</a>, respectively, and analysed by gas chromatography with a flame-ionization detector on a non-polar HP-5ms column (Agilent).
+                  The dominant cellular fatty acid of strain GD1<sup>T</sup> was 16 : 1ω7<em>c</em>, with 3-OH 14 : 0, 16 : 0, 16 : 1ω5<em>c</em>+<em>t</em>, and 18 : 1ω7<em>c</em> detected in lower amounts. This fatty acid profile is comparable to those of other species of the genus <span class="named-content genus" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> but most similar to that of <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> (<a id="xref-table-wrap-1-5" class="xref-table" href="#T1">Table 1</a>). This may reflect the fact that strain GD1<sup>T</sup> and <span class="named-content species" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> were cultivated on ABW+NS under identical conditions. However, a high percentage of C16 : 0 and one or both of the monounsaturated
+                  C16 and C18 fatty acids has also been described in other members of the class <span class="named-content class" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                        href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span>, such as <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="Nitratifractor salsuginis"
+                        href="doi:10.1601/nm.9373"><em>Nitratifractor salsuginis</em></a></span> and <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="Sulfurovum lithotrophicum"
+                        href="doi:10.1601/nm.8874"><em>Sulfurovum lithotrophicum</em></a></span> (<a id="xref-ref-34-1" class="xref-bibr" href="#ref-34">Suzuki <em>et al.</em>, 2005</a>). Accordingly, this combination may be a general characteristic of these epsilonproteobacteria.
+               </p>
+               <p id="p-27">The DNA guanine-plus-cytosine (G+C) content of strain GD1<sup>T</sup> was determined to be 33.6 mol%, as calculated by analysis of the whole genome (<a id="xref-ref-15-13" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>).
+               </p>
+               <p id="p-28">To establish the closest relatives of strain GD1<sup>T</sup> based on 16S rRNA sequencing, preliminary searches in the EMBL Data Library were performed with the program <span class="sc">fasta</span> (<a id="xref-ref-29-1" class="xref-bibr" href="#ref-29">Pearson &amp; Lipman, 1988</a>). Closely related sequences were retrieved from GenBank and aligned and analysed with the newly determined sequence, within
+                  the program <span class="sc">arb</span> (<a id="xref-ref-25-1" class="xref-bibr" href="#ref-25">Ludwig <em>et al.</em>, 2004</a>). Sequences for analysis were reduced to unambiguously alignable positions using group-specific filters. For phylogenetic
+                  analyses, three different trees were calculated using the neighbour-joining, parsimony and maximum-likelihood (Phyml) algorithms
+                  based on nearly full-length 16S rRNA sequences (approx. 1400 bp). For neighbour-joining, the Jukes–Cantor correction was applied.
+                  Shorter sequences were gradually inserted into the reconstructed tree without changing the topology. Sequence searches of
+                  the EMBL database (latest: 2013-05-14) revealed that our isolate is related to the epsilon class of the phylum <span class="named-content phylum" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="Proteobacteria"
+                        href="doi:10.1601/nm.808"><em>Proteobacteria</em></a></span> (data not shown). In a pairwise analysis, it displayed highest (93.7–94.2 %) 16S rRNA gene sequence similarity to species
+                  of the genus <span class="named-content genus" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> and to the Baltic ‘Uncultured <span class="named-content family" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup (95.7 %). Lower levels of relatedness (≤91 % sequence similarity) were determined for the other examined
+                  species belonging to the epsilon class of the phylum <span class="named-content phylum" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="Proteobacteria"
+                        href="doi:10.1601/nm.808"><em>Proteobacteria</em></a></span>.
+               </p>
+               <p id="p-29">An unrooted tree reconstructed using the neighbour-joining method showed the phylogenetic position of the novel bacterium,
+                  strain GD1<sup>T</sup>, amongst the members of the class <span class="named-content class" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                        href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span> (<a id="xref-fig-3-1" class="xref-fig" href="#F3">Fig. 3</a>). Treeing analyses confirmed it to be a member of the genus <span class="named-content genus" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, forming a stable cluster with the ‘Uncultured <span class="named-content family" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup. This cluster is specifically detected by the SUL90 16S rRNA gene probe, originally developed to
+                  be 100 % complementary to the G138eps1/GD17 target site (<a id="xref-ref-13-2" class="xref-bibr" href="#ref-13">Grote <em>et al.</em>, 2007</a>).
+               </p>
+               <div id="F3" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4141/F3.expansion.html"><img alt="Fig. 3. " src="4141/F3.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4141/F3.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4141/F3.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4141/F3">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 3. </span> 
+                     
+                     <p id="p-30" class="first-child">Unrooted tree showing phylogenetic relationships of isolate GD1<sup>T</sup> and closely related members of the class <span class="named-content class" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                              href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span>. The tree was reconstructed using the neighbour-joining method and was based on a comparison of approximately 1400 nt. Solid
+                        squares indicate that the corresponding nodes (or groups) were recovered in neighbour-joining, maximum-parsimony and maximum-likelihood
+                        methods. Branching points supported by two algorithms are marked by an open square. The following strains were used as an
+                        outgroup (not shown): <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name"
+                              title="Antarctobacter heliothermus"
+                              href="doi:10.1601/nm.1057"><em>Antarctobacter heliothermus</em></a></span> EL-219<sup>T</sup>, <span class="named-content species" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Sagittula stellata"
+                              href="doi:10.1601/nm.1149"><em>Sagittula stellata</em></a></span> E-37<sup>T</sup>, <span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="Roseovarius tolerans"
+                              href="doi:10.1601/nm.1140"><em>Roseovarius tolerans</em></a></span> EL-172<sup>T</sup>, <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="Roseovarius nubinhibens"
+                              href="doi:10.1601/nm.1141"><em>Roseovarius nubinhibens</em></a></span> ISM<sup>T</sup> and <span class="named-content species" id="named-content-50"><a class="namesforlife" rel="namesforlife-name" title="Roseovarius mucosus"
+                              href="doi:10.1601/nm.9734"><em>Roseovarius mucosus</em></a></span> DFL-24<sup>T</sup>. Bar, 1 substitution per 10 nt.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-31">There is no precise correlation between percentage 16S rRNA sequence divergence and species delineation, but it is generally
+                  recognized that divergence values ≥3 % are significant (<a id="xref-ref-32-1" class="xref-bibr" href="#ref-32">Stackebrandt &amp; Goebel, 1994</a>). However, it is pertinent to note that the phylogenetic separateness of strain GD1<sup>T</sup> is strongly supported by phenotypic considerations. For instance, this novel bacterium is distinguishable from other species
+                  of the genus <span class="named-content genus" id="named-content-51"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> by its psychrotolerance and energy metabolism (<a id="xref-table-wrap-1-6" class="xref-table" href="#T1">Table 1</a>). Additional characteristics useful in differentiating Baltic isolate GD1<sup>T</sup> from related organisms are shown in <a id="xref-table-wrap-1-7" class="xref-table" href="#T1">Table 1</a>. Based on phenotypic and genetic evidence, we propose the classification of strain GD1<sup>T</sup> as a representative of a novel species of the genus <span class="named-content genus" id="named-content-52"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>: <em>Sulfurimonas gotlandica</em> sp. nov.
+               </p>
+               <div class="section" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  
+                  <div id="sec-2" class="subsection">
+                     
+                     <h3>Emended description of the genus <span class="named-content genus" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                              href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span></h3>
+                     
+                     <p id="p-32">The description is based on that by <a id="xref-ref-36-4" class="xref-bibr" href="#ref-36">Takai <em>et al.</em> (2006)</a>. Cells are Gram-negative and morphologically variable. Straight to slightly short rods, elongated rods and spiral in different
+                        growth phases and under different growth conditions. Psychrotolerant to mesophilic and aerotolerant to facultatively anaerobic.
+                        Do not always require NaCl for growth. Optimal growth occurs chemolithoautotrophically with sulfide, S<sup>0</sup>, thiosulfate and H<sub>2</sub> as electron donors, and with nitrate, nitrite and O<sub>2</sub> as electron acceptors, using CO<sub>2</sub> as a carbon source. Supplementation of bicarbonate can enable growth on organic substances, but yields much lower cell numbers
+                        compared to growth on reduced sulfur or hydrogen. Potential ecological niches are deep-sea hydrothermal environments and benthic
+                        or pelagic marine to brackish transition zones from oxic to anoxic/sulfidic environments. The type species is <span class="named-content species" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                              href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> (<a id="xref-ref-17-4" class="xref-bibr" href="#ref-17">Inagaki <em>et al.</em> 2003</a>).
+                     </p>
+                     
+                  </div>
+                  <div id="sec-3" class="subsection">
+                     
+                     <h3>Description of <em>Sulfurimonas gotlandica</em> sp. nov.
+                     </h3>
+                     
+                     <p id="p-33"><em>Sulfurimonas</em> <em>gotlandica</em> (got.lan′di.ca. N.L. fem. adj. <em>gotlandica</em> pertaining to the Gotland Deep, the basin in the central Baltic Sea from which the organism was first isolated).
+                     </p>
+                     
+                     <p id="p-34">Gram-negative, slightly curved or spirilla-shaped cells. Motile by one polar flagellum or two flagella at opposite poles.
+                        Cells exhibit a positive chemotactic response to nitrate. Cell sizes are 0.66±0.083×2.1±0.54 µm. Cells have a tendency to
+                        aggregate at older stages. Psychro- and aerotolerant. The temperature range for growth is 4–20 °C. Optimal growth occurs at
+                        15 °C and pH 6.7–8.0. The cells have an absolute requirement for NaCl. Chemolithoautotrophic growth occurs with H<sub>2</sub>, HS<sup>−</sup>, S<sup>0</sup> and thiosulfate. Supplementation of bicarbonate can enable growth on formate, acetate, yeast extract, pyruvate or amino acid
+                        mix, but yields much lower cell numbers compared with growth on reduced sulfur or hydrogen. Sulfide concentrations of more
+                        than 20 µM inhibit, but up to 10 % of oxygen in the medium does not influence growth. Dominant cellular fatty acid is 16 : 1ω7<em>c</em>, with 14 : 0, 16 : 0, 16 : 1ω5<em>c</em>+<em>t</em>, and 18 : 1ω7<em>c</em> present in smaller amounts.
+                     </p>
+                     
+                     <p id="p-35">The type strain is GD1<sup>T</sup> ( = DSM 19862<sup>T</sup> = JCM 16533<sup>T</sup>), isolated from water of a pelagic redox zone of the central Baltic Sea. The G+C content of the type strain is 33.6 mol%.
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-36">We thank the captain and the crew of the RV <em>Alkor</em>. We gratefully acknowledge the skilful technical assistance of Bärbel Buuk. Michael Hannig helped during the isolation procedure.
+                     We thank the Deutsche Forschungsgemeinschaft (DFG) for grants LA 1466/4-1 and LA 1466/4-2.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.1"
+                             data-doi="10.1038/ismej.2010.69">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alonso-Sáez</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Galand</span>,  <span class="cit-name-given-names">P. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Casamayor</span>,  <span class="cit-name-given-names">E. O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pedrós-Alió</span>,  <span class="cit-name-given-names">C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bertilsson</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">High bicarbonate assimilation in the dark by Arctic bacteria</span>. <abbr class="cit-jnl-abbrev">ISME J</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">1581</span>–<span class="cit-lpage">1590</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/ismej.2010.69</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20555365</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/ismej.2010.69&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20555365&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=High%20bicarbonate%20assimilation%20in%20the%20dark%20by%20Arctic%20bacteria&amp;author=L.%20Alonso-S%C3%A1ez&amp;author=P.%20E.%20Galand&amp;author=E.%20O.%20Casamayor&amp;author=C.%20Pedr%C3%B3s-Ali%C3%B3&amp;author=S.%20Bertilsson&amp;publication_year=2010&amp;journal=ISME%20J&amp;volume=4&amp;pages=1581-1590&amp;doi=10.1038%2Fismej.2010.69&amp;pmid=20555365">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.2"
+                             data-doi="10.1080/713851165">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Balch</span>,  <span class="cit-name-given-names">W. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fox</span>,  <span class="cit-name-given-names">G. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Magrum</span>,  <span class="cit-name-given-names">L. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Woese</span>,  <span class="cit-name-given-names">C. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wolfe</span>,  <span class="cit-name-given-names">R. S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1979</span><strong>).</strong> <span class="cit-article-title">Methanogens: reevaluation of a unique biological group</span>. <abbr class="cit-jnl-abbrev">Microbiol Rev</abbr> <span class="cit-vol">43</span>, <span class="cit-fpage">260</span>–<span class="cit-lpage">296</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>390357</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=mmbr&amp;resid=43/2/260"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4141.3">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Kowalchuk</span>,  <span class="cit-name-given-names">G. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">de Bruijn</span>,  <span class="cit-name-given-names">F. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Head</span>,  <span class="cit-name-given-names">I. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Akkermans</span>,  <span class="cit-name-given-names">A. D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">van Elsas</span>,  <span class="cit-name-given-names">J. D.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Boschker</span>,  <span class="cit-name-given-names">H. T. S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Linking microbial community structure and functioning: stable isotope (13C) labeling in combination with PLFA analysis</span>. <em>In</em> <span class="cit-source">Molecular Microbial Ecology Manual II</span>, pp. <span class="cit-fpage">1673</span>–<span class="cit-lpage">1688</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Kowalchuk</span>,  <span class="cit-name-given-names">G. A.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">de Bruijn</span>,  <span class="cit-name-given-names">F. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Head</span>,  <span class="cit-name-given-names">I. M.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Akkermans</span>,  <span class="cit-name-given-names">A. D.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">van Elsas</span>,  <span class="cit-name-given-names">J. D.</span></span>
+                                 . <span class="cit-publ-loc">Dordrecht</span>: <span class="cit-publ-name">Kluwer Academic Publishers</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Linking%20microbial%20community%20structure%20and%20functioning%3A%20stable%20isotope%20%2813C%29%20labeling%20in%20combination%20with%20PLFA%20analysis&amp;author=H.%20T.%20S.%20Boschker&amp;publication_year=2004&amp;citation_inbook_title=Molecular%20Microbial%20Ecology%20Manual%20II">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.4"
+                             data-doi="10.3354/meps077157">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brettar</span>,  <span class="cit-name-given-names">I.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rheinheimer</span>,  <span class="cit-name-given-names">G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1991</span><strong>).</strong> <span class="cit-article-title">Denitrification in the central Baltic: evidence for H<sub>2</sub>S-oxidation as motor of denitrification at the oxic-anoxic interface</span>. <abbr class="cit-jnl-abbrev">Mar Ecol Prog Ser</abbr> <span class="cit-vol">77</span>, <span class="cit-fpage">157</span>–<span class="cit-lpage">169</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.3354/meps077157</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.3354/meps077157&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Denitrification%20in%20the%20central%20Baltic%3A%20evidence%20for%20H2S-oxidation%20as%20motor%20of%20denitrification%20at%20the%20oxic-anoxic%20interface&amp;author=I.%20Brettar&amp;author=G.%20Rheinheimer&amp;publication_year=1991&amp;journal=Mar%20Ecol%20Prog%20Ser&amp;volume=77&amp;pages=157-169&amp;doi=10.3354%2Fmeps077157">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.5"
+                             data-doi="10.1128/AEM.72.2.1364-1372.2006">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brettar</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Flavier</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bötel</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuosa</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Christen</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Höfle</span>,  <span class="cit-name-given-names">M. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">Identification of a <em>Thiomicrospira denitrificans</em>-like epsilonproteobacterium as a catalyst for autotrophic denitrification in the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">72</span>, <span class="cit-fpage">1364</span>–<span class="cit-lpage">1372</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.72.2.1364-1372.2006</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16461688</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=72/2/1364"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4141.6">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Staley</span>,  <span class="cit-name-given-names">J. T.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuever</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Muyzer</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jannasch</span>,  <span class="cit-name-given-names">H. W.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Genus VI. Thiomicrospira</span>. <em>In</em> <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, part B, pp. <span class="cit-fpage">193</span>–<span class="cit-lpage">199</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Staley</span>,  <span class="cit-name-given-names">J. T.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20VI.%20Thiomicrospira&amp;author=T.%20Brinkhoff&amp;author=J.%20Kuever&amp;author=G.%20Muyzer&amp;author=H.%20W.%20Jannasch&amp;publication_year=2005&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.7"
+                             data-doi="10.1128/AEM.68.8.3978-3987.2002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bruns</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cypionka</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Overmann</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title">Cyclic AMP and acyl homoserine lactones increase the cultivation efficiency of heterotrophic bacteria from the central Baltic
+                                    Sea</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">68</span>, <span class="cit-fpage">3978</span>–<span class="cit-lpage">3987</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.68.8.3978-3987.2002</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>12147499</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=68/8/3978"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.8"
+                             data-doi="10.1038/nrmicro1414">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Campbell</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Engel</span>,  <span class="cit-name-given-names">A. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Porter</span>,  <span class="cit-name-given-names">M. L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">The versatile epsilon-proteobacteria: key players in sulphidic habitats</span>. <abbr class="cit-jnl-abbrev">Nat Rev Microbiol</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">458</span>–<span class="cit-lpage">468</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/nrmicro1414</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16652138</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/nrmicro1414&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=16652138&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20versatile%20epsilon-proteobacteria%3A%20key%20players%20in%20sulphidic%20habitats&amp;author=B.%20J.%20Campbell&amp;author=A.%20S.%20Engel&amp;author=M.%20L.%20Porter&amp;author=K.%20Takai&amp;publication_year=2006&amp;journal=Nat%20Rev%20Microbiol&amp;volume=4&amp;pages=458-468&amp;doi=10.1038%2Fnrmicro1414&amp;pmid=16652138">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.9">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dehority</span>,  <span class="cit-name-given-names">B. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1971</span><strong>).</strong> <span class="cit-article-title">Carbon dioxide requirement of various species of rumen bacteria</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">105</span>, <span class="cit-fpage">70</span>–<span class="cit-lpage">76</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>5541030</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=105/1/70"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.10"
+                             data-doi="10.1016/j.femsec.2004.07.004">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Engel</span>,  <span class="cit-name-given-names">A. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Porter</span>,  <span class="cit-name-given-names">M. L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stern</span>,  <span class="cit-name-given-names">L. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Quinlan</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bennett</span>,  <span class="cit-name-given-names">P. C.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Bacterial diversity and ecosystem function of filamentous microbial mats from aphotic (cave) sulfidic springs dominated by
+                                    chemolithoautotrophic “<em>Epsilonproteobacteria</em>”</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Ecol</abbr> <span class="cit-vol">51</span>, <span class="cit-fpage">31</span>–<span class="cit-lpage">53</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.femsec.2004.07.004</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16329854</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.femsec.2004.07.004&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=16329854&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Bacterial%20diversity%20and%20ecosystem%20function%20of%20filamentous%20microbial%20mats%20from%20aphotic%20%28cave%29%20sulfidic%20springs%20dominated%20by%20chemolithoautotrophic%20%E2%80%9CEpsilonproteobacteria%E2%80%9D&amp;author=A.%20S.%20Engel&amp;author=M.%20L.%20Porter&amp;author=L.%20A.%20Stern&amp;author=S.%20Quinlan&amp;author=P.%20C.%20Bennett&amp;publication_year=2004&amp;journal=FEMS%20Microbiol%20Ecol&amp;volume=51&amp;pages=31-53&amp;doi=10.1016%2Fj.femsec.2004.07.004&amp;pmid=16329854">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.11"
+                             data-doi="10.1111/j.1462-2920.2008.01770.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Glaubitz</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lueders</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Abraham</span>,  <span class="cit-name-given-names">W.-R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title"><sup>13</sup>C-isotope analyses reveal that chemolithoautotrophic <em>Gamma</em>- and <em>Epsilonproteobacteria</em> feed a microbial food web in a pelagic redoxcline of the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Environ Microbiol</abbr> <span class="cit-vol">11</span>, <span class="cit-fpage">326</span>–<span class="cit-lpage">337</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1462-2920.2008.01770.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18793316</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1462-2920.2008.01770.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=18793316&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=13C-isotope%20analyses%20reveal%20that%20chemolithoautotrophic%20Gamma-%20and%20Epsilonproteobacteria%20feed%20a%20microbial%20food%20web%20in%20a%20pelagic%20redoxcline%20of%20the%20central%20Baltic%20Sea&amp;author=S.%20Glaubitz&amp;author=T.%20Lueders&amp;author=W.-R.%20Abraham&amp;author=G.%20Jost&amp;author=K.%20J%C3%BCrgens&amp;author=M.%20Labrenz&amp;publication_year=2009&amp;journal=Environ%20Microbiol&amp;volume=11&amp;pages=326-337&amp;doi=10.1111%2Fj.1462-2920.2008.01770.x&amp;pmid=18793316">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.12"
+                             data-doi="10.1111/j.1574-6941.2010.00944.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Glaubitz</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Diversity of active chemolithoautotrophic prokaryotes in the sulfidic zone of a Black Sea pelagic redoxcline as determined
+                                    by rRNA-based stable isotope probing</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Ecol</abbr> <span class="cit-vol">74</span>, <span class="cit-fpage">32</span>–<span class="cit-lpage">41</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6941.2010.00944.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20649907</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=femsec&amp;resid=74/1/32"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.13"
+                             data-doi="10.1128/AEM.00466-07">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grote</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pfeiffer</span>,  <span class="cit-name-given-names">B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Quantitative distributions of <em>Epsilonproteobacteria</em> and a <em>Sulfurimonas</em> subgroup in pelagic redoxclines of the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">73</span>, <span class="cit-fpage">7155</span>–<span class="cit-lpage">7161</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.00466-07</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17921285</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=73/22/7155"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.14"
+                             data-doi="10.1128/AEM.01186-08">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grote</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Herndl</span>,  <span class="cit-name-given-names">G. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><em>Epsilonproteobacteria</em> represent the major portion of chemoautotrophic bacteria in sulfidic waters of pelagic redoxclines of the Baltic and Black
+                                    Seas</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">74</span>, <span class="cit-fpage">7546</span>–<span class="cit-lpage">7551</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.01186-08</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18952879</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=74/24/7546"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.15"
+                             data-doi="10.1073/pnas.1111262109">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grote</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schott</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bruckner</span>,  <span class="cit-name-given-names">C. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Glöckner</span>,  <span class="cit-name-given-names">F. O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Teeling</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Genome and physiology of a model Epsilonproteobacterium responsible for sulfide detoxification in marine oxygen depletion
+                                    zones</span>. <abbr class="cit-jnl-abbrev">Proc Natl Acad Sci U S A</abbr> <span class="cit-vol">109</span>, <span class="cit-fpage">506</span>–<span class="cit-lpage">510</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1073/pnas.1111262109</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22203982</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=pnas&amp;resid=109/2/506"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.16"
+                             data-doi="10.4319/lo.2007.52.4.1336">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hannig</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lavik</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuypers</span>,  <span class="cit-name-given-names">M. M. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Woebken</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens-Habbena</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Shift from denitrification to anammox after inflow events in the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Limnol Oceanogr</abbr> <span class="cit-vol">52</span>, <span class="cit-fpage">1336</span>–<span class="cit-lpage">1345</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.4319/lo.2007.52.4.1336</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.4319/lo.2007.52.4.1336&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Shift%20from%20denitrification%20to%20anammox%20after%20inflow%20events%20in%20the%20central%20Baltic%20Sea&amp;author=M.%20Hannig&amp;author=G.%20Lavik&amp;author=M.%20M.%20M.%20Kuypers&amp;author=D.%20Woebken&amp;author=W.%20Martens-Habbena&amp;author=K.%20J%C3%BCrgens&amp;publication_year=2007&amp;journal=Limnol%20Oceanogr&amp;volume=52&amp;pages=1336-1345&amp;doi=10.4319%2Flo.2007.52.4.1336">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.17"
+                             data-doi="10.1099/ijs.0.02682-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Inagaki</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kobayashi</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nealson</span>,  <span class="cit-name-given-names">K. H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Horikoshi</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title"><em>Sulfurimonas autotrophica</em> gen. nov., sp. nov., a novel sulfur-oxidizing ϵ-proteobacterium isolated from hydrothermal sediments in the Mid-Okinawa Trough</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">53</span>, <span class="cit-fpage">1801</span>–<span class="cit-lpage">1805</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.02682-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14657107</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=53/6/1801"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.18"
+                             data-doi="10.1016/j.marchem.2009.01.002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jensen</span>,  <span class="cit-name-given-names">M. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Petersen</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dalsgaard</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thamdrup</span>,  <span class="cit-name-given-names">B.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Pathways, rates, and regulation of N<sub>2</sub> production in the chemocline of an anoxic basin, Mariager Fjord, Denmark</span>. <abbr class="cit-jnl-abbrev">Mar Chem</abbr> <span class="cit-vol">113</span>, <span class="cit-fpage">102</span>–<span class="cit-lpage">113</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.marchem.2009.01.002</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.marchem.2009.01.002&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Pathways%2C%20rates%2C%20and%20regulation%20of%20N2%20production%20in%20the%20chemocline%20of%20an%20anoxic%20basin%2C%20Mariager%20Fjord%2C%20Denmark&amp;author=M.%20M.%20Jensen&amp;author=J.%20Petersen&amp;author=T.%20Dalsgaard&amp;author=B.%20Thamdrup&amp;publication_year=2009&amp;journal=Mar%20Chem&amp;volume=113&amp;pages=102-113&amp;doi=10.1016%2Fj.marchem.2009.01.002">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-journal no-rev-xref" id="cit-63.Pt_11.4141.19"
+                             data-doi="10.4319/lo.2008.53.1.0014">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zubkov</span>,  <span class="cit-name-given-names">M. V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yakushev</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">High abundance and dark CO<sub>2</sub> fixation of chemolithoautotrophic prokaryotes in anoxic waters of the Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Limnol Oceanogr</abbr> <span class="cit-vol">53</span>, <span class="cit-fpage">14</span>–<span class="cit-lpage">22</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.4319/lo.2008.53.1.0014</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.4319/lo.2008.53.1.0014&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=High%20abundance%20and%20dark%20CO2%20fixation%20of%20chemolithoautotrophic%20prokaryotes%20in%20anoxic%20waters%20of%20the%20Baltic%20Sea&amp;author=G.%20Jost&amp;author=M.%20V.%20Zubkov&amp;author=E.%20Yakushev&amp;author=M.%20Labrenz&amp;author=K.%20J%C3%BCrgens&amp;publication_year=2008&amp;journal=Limnol%20Oceanogr&amp;volume=53&amp;pages=14-22&amp;doi=10.4319%2Flo.2008.53.1.0014">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.20"
+                             data-doi="10.1111/j.1574-6941.2009.00798.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens-Habbena</span>,  <span class="cit-name-given-names">W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pollehne</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schnetger</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Anaerobic sulfur oxidation in the absence of nitrate dominates microbial chemoautotrophy beneath the pelagic chemocline of
+                                    the eastern Gotland Basin, Baltic Sea</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Ecol</abbr> <span class="cit-vol">71</span>, <span class="cit-fpage">226</span>–<span class="cit-lpage">236</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6941.2009.00798.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19925634</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1574-6941.2009.00798.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=19925634&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Anaerobic%20sulfur%20oxidation%20in%20the%20absence%20of%20nitrate%20dominates%20microbial%20chemoautotrophy%20beneath%20the%20pelagic%20chemocline%20of%20the%20eastern%20Gotland%20Basin%2C%20Baltic%20Sea&amp;author=G.%20Jost&amp;author=W.%20Martens-Habbena&amp;author=F.%20Pollehne&amp;author=B.%20Schnetger&amp;author=M.%20Labrenz&amp;publication_year=2010&amp;journal=FEMS%20Microbiol%20Ecol&amp;volume=71&amp;pages=226-236&amp;doi=10.1111%2Fj.1574-6941.2009.00798.x&amp;pmid=19925634">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.21"
+                             data-doi="10.1128/AEM.70.8.4971-4979.2004">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brettar</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Christen</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Flavier</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bötel</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Höfle</span>,  <span class="cit-name-given-names">M. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Development and application of a real-time PCR approach for quantification of uncultured bacteria in the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">70</span>, <span class="cit-fpage">4971</span>–<span class="cit-lpage">4979</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.70.8.4971-4979.2004</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15294837</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=70/8/4971"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.22"
+                             data-doi="10.1128/AEM.71.11.6664-6672.2005">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pohl</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Beckmann</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens-Habbena</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Impact of different <em>in vitro</em> electron donor/acceptor conditions on potential chemolithoautotrophic communities from marine pelagic redoxclines</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">71</span>, <span class="cit-fpage">6664</span>–<span class="cit-lpage">6672</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.71.11.6664-6672.2005</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16269695</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=71/11/6664"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.23"
+                             data-doi="10.3354/ame046177">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Distribution of abundant prokaryotic organisms in the water column of the central Baltic Sea with an oxic-anoxic interface</span>. <abbr class="cit-jnl-abbrev">Aquat Microb Ecol</abbr> <span class="cit-vol">46</span>, <span class="cit-fpage">177</span>–<span class="cit-lpage">190</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.3354/ame046177</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.3354/ame046177&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Distribution%20of%20abundant%20prokaryotic%20organisms%20in%20the%20water%20column%20of%20the%20central%20Baltic%20Sea%20with%20an%20oxic-anoxic%20interface&amp;author=M.%20Labrenz&amp;author=G.%20Jost&amp;author=K.%20J%C3%BCrgens&amp;publication_year=2007&amp;journal=Aquat%20Microb%20Ecol&amp;volume=46&amp;pages=177-190&amp;doi=10.3354%2Fame046177">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-24-1" title="View reference  in text"
+                           id="ref-24">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.24"
+                             data-doi="10.1016/S0025-3227(98)00046-2">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lepland</span>,  <span class="cit-name-given-names">A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stevens</span>,  <span class="cit-name-given-names">R. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1998</span><strong>).</strong> <span class="cit-article-title">Manganese authigenesis in the Landsort Deep, Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Mar Geol</abbr> <span class="cit-vol">151</span>, <span class="cit-fpage">1</span>–<span class="cit-lpage">25</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0025-3227(98)00046-2</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0025-3227(98)00046-2&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Manganese%20authigenesis%20in%20the%20Landsort%20Deep%2C%20Baltic%20Sea&amp;author=A.%20Lepland&amp;author=R.%20L.%20Stevens&amp;publication_year=1998&amp;journal=Mar%20Geol&amp;volume=151&amp;pages=1-25&amp;doi=10.1016%2FS0025-3227%2898%2900046-2">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-25-1" title="View reference  in text"
+                           id="ref-25">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.25"
+                             data-doi="10.1093/nar/gkh293">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ludwig</span>,  <span class="cit-name-given-names">W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Strunk</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Westram</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Richter</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Meier</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yadhukumar</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Buchner</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lai</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Steppi</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title"><span class="sc">arb</span>: a software environment for sequence data</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">32</span>, <span class="cit-fpage">1363</span>–<span class="cit-lpage">1371</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkh293</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14985472</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=32/4/1363"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-26-1" title="View reference  in text"
+                           id="ref-26">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.26"
+                             data-doi="10.1111/j.1574-6941.2008.00502.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nakagawa</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Deep-sea vent chemoautotrophs: diversity, biochemistry and ecological significance</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Ecol</abbr> <span class="cit-vol">65</span>, <span class="cit-fpage">1</span>–<span class="cit-lpage">14</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6941.2008.00502.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18503548</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=femsec&amp;resid=65/1/1"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-27-1" title="View reference  in text"
+                           id="ref-27">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.27"
+                             data-doi="10.1111/j.1462-2920.2005.00856.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nakagawa</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Inagaki</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hirayama</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nunoura</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Horikoshi</span>,  <span class="cit-name-given-names">K.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sako</span>,  <span class="cit-name-given-names">Y.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Distribution, phylogenetic diversity and physiological characteristics of epsilon-<em>Proteobacteria</em> in a deep-sea hydrothermal field</span>. <abbr class="cit-jnl-abbrev">Environ Microbiol</abbr> <span class="cit-vol">7</span>, <span class="cit-fpage">1619</span>–<span class="cit-lpage">1632</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1462-2920.2005.00856.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16156735</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1462-2920.2005.00856.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=16156735&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Distribution%2C%20phylogenetic%20diversity%20and%20physiological%20characteristics%20of%20epsilon-Proteobacteria%20in%20a%20deep-sea%20hydrothermal%20field&amp;author=S.%20Nakagawa&amp;author=K.%20Takai&amp;author=F.%20Inagaki&amp;author=H.%20Hirayama&amp;author=T.%20Nunoura&amp;author=K.%20Horikoshi&amp;author=Y.%20Sako&amp;publication_year=2005&amp;journal=Environ%20Microbiol&amp;volume=7&amp;pages=1619-1632&amp;doi=10.1111%2Fj.1462-2920.2005.00856.x&amp;pmid=16156735">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-28-1" title="View reference  in text"
+                           id="ref-28">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.28"
+                             data-doi="10.1016/S0304-4203(03)00048-3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Neretin</span>,  <span class="cit-name-given-names">L. N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pohl</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Leipe</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pollehne</span>,  <span class="cit-name-given-names">F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title">Manganese cycling in the Gotland Deep, Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Mar Chem</abbr> <span class="cit-vol">82</span>, <span class="cit-fpage">125</span>–<span class="cit-lpage">143</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0304-4203(03)00048-3</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0304-4203(03)00048-3&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Manganese%20cycling%20in%20the%20Gotland%20Deep%2C%20Baltic%20Sea&amp;author=L.%20N.%20Neretin&amp;author=C.%20Pohl&amp;author=G.%20Jost&amp;author=T.%20Leipe&amp;author=F.%20Pollehne&amp;publication_year=2003&amp;journal=Mar%20Chem&amp;volume=82&amp;pages=125-143&amp;doi=10.1016%2FS0304-4203%2803%2900048-3">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-29-1" title="View reference  in text"
+                           id="ref-29">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.29"
+                             data-doi="10.1073/pnas.85.8.2444">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pearson</span>,  <span class="cit-name-given-names">W. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lipman</span>,  <span class="cit-name-given-names">D. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1988</span><strong>).</strong> <span class="cit-article-title">Improved tools for biological sequence comparison</span>. <abbr class="cit-jnl-abbrev">Proc Natl Acad Sci U S A</abbr> <span class="cit-vol">85</span>, <span class="cit-fpage">2444</span>–<span class="cit-lpage">2448</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1073/pnas.85.8.2444</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>3162770</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=pnas&amp;resid=85/8/2444"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-book no-rev-xref" id="cit-63.Pt_11.4141.30">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sasser</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1990</span><strong>).</strong> <span class="cit-source">Identification of bacteria by gas chromatography of cellular fatty acids</span>, MIDI Technical Note 101. <span class="cit-publ-loc">Newark, DE</span>: <span class="cit-publ-name">Microbial ID</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Identification%20of%20bacteria%20by%20gas%20chromatography%20of%20cellular%20fatty%20acids&amp;author=M.%20Sasser&amp;publication_year=1990">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-31-1" title="View reference  in text"
+                           id="ref-31">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.31"
+                             data-doi="10.1128/AEM.01844-07">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sievert</span>,  <span class="cit-name-given-names">S. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Scott</span>,  <span class="cit-name-given-names">K. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Klotz</span>,  <span class="cit-name-given-names">M. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chain</span>,  <span class="cit-name-given-names">P. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hauser</span>,  <span class="cit-name-given-names">L. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hemp</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hügler</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Land</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lapidus</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Genome of the epsilonproteobacterial chemolithoautotroph <em>Sulfurimonas denitrificans</em></span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">74</span>, <span class="cit-fpage">1145</span>–<span class="cit-lpage">1156</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.01844-07</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18065616</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=74/4/1145"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-32-1" title="View reference  in text"
+                           id="ref-32">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.32"
+                             data-doi="10.1099/00207713-44-4-846">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Goebel</span>,  <span class="cit-name-given-names">B. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Taxonomic Note: A place for DNA-DNA reassociation and 16S rRNA sequence analysis in the present species definition in Bacteriology</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">44</span>, <span class="cit-fpage">846</span>–<span class="cit-lpage">849</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-44-4-846</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=44/4/846"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-33-1" title="View reference  in text"
+                           id="ref-33">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.33"
+                             data-doi="10.1099/mic.0.2008/018085-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Starkenburg</span>,  <span class="cit-name-given-names">S. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Arp</span>,  <span class="cit-name-given-names">D. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bottomley</span>,  <span class="cit-name-given-names">P. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><span class="sc">d</span>-Lactate metabolism and the obligate requirement for CO<sub>2</sub> during growth on nitrite by the facultative lithoautotroph <em>Nitrobacter hamburgensis</em></span>. <abbr class="cit-jnl-abbrev">Microbiology</abbr> <span class="cit-vol">154</span>, <span class="cit-fpage">2473</span>–<span class="cit-lpage">2481</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/mic.0.2008/018085-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18667580</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=mic&amp;resid=154/8/2473"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-34-1" title="View reference  in text"
+                           id="ref-34">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.34"
+                             data-doi="10.1128/AEM.71.9.5440-5450.2005">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sasaki</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nogi</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miwa</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nealson</span>,  <span class="cit-name-given-names">K. H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Horikoshi</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Novel chemoautotrophic endosymbiosis between a member of the <em>Epsilonproteobacteria</em> and the hydrothermal-vent gastropod <em>Alviniconcha</em> aff. <em>hessleri</em> (Gastropoda: Provannidae) from the Indian Ocean</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">71</span>, <span class="cit-fpage">5440</span>–<span class="cit-lpage">5450</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.71.9.5440-5450.2005</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16151136</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=71/9/5440"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-35-1" title="View reference  in text"
+                           id="ref-35">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.35"
+                             data-doi="10.1128/AEM.72.2.1388-1393.2006">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kojima</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sasaki</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Utsumi</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Watanabe</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Urakawa</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tsuchida</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nunoura</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">Host-symbiont relationships in hydrothermal vent gastropods of the genus <em>Alviniconcha</em> from the Southwest Pacific</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">72</span>, <span class="cit-fpage">1388</span>–<span class="cit-lpage">1393</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.72.2.1388-1393.2006</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16461691</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=72/2/1388"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-36-1" title="View reference  in text"
+                           id="ref-36">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.36"
+                             data-doi="10.1099/ijs.0.64255-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nakagawa</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miyazaki</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Inagaki</span>,  <span class="cit-name-given-names">F.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Horikoshi</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title"><em>Sulfurimonas paralvinellae</em> sp. nov., a novel mesophilic, hydrogen- and sulfur-oxidizing chemolithoautotroph within the <em>Epsilonproteobacteria</em> isolated from a deep-sea hydrothermal vent polychaete nest, reclassification of <em>Thiomicrospira denitrificans</em> as <em>Sulfurimonas denitrificans</em> comb. nov. and emended description of the genus <em>Sulfurimonas</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">56</span>, <span class="cit-fpage">1725</span>–<span class="cit-lpage">1733</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.64255-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16901999</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=56/8/1725"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-37-1" title="View reference  in text"
+                           id="ref-37">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.37"
+                             data-doi="10.1016/0077-7579(75)90008-3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Timmer-ten Hoor</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1975</span><strong>).</strong> <span class="cit-article-title">A new type of thiosulphate oxidizing, nitrate reducing microorganism: <em>Thiomicrospira denitrificans</em> sp. nov.</span> <abbr class="cit-jnl-abbrev">Neth J Sea Res</abbr> <span class="cit-vol">9</span>, <span class="cit-fpage">344</span>–<span class="cit-lpage">350</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/0077-7579(75)90008-3</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/0077-7579(75)90008-3&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20new%20type%20of%20thiosulphate%20oxidizing%2C%20nitrate%20reducing%20microorganism%3A%20Thiomicrospira%20denitrificans%20sp.%20nov.&amp;author=A.%20Timmer-ten%20Hoor&amp;publication_year=1975&amp;journal=Neth%20J%20Sea%20Res&amp;volume=9&amp;pages=344-350&amp;doi=10.1016%2F0077-7579%2875%2990008-3">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-38-1" title="View reference  in text"
+                           id="ref-38">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4141.38">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Balows</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Trüper</span>,  <span class="cit-name-given-names">H. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Dworkin</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Harder</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K.-H.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Widdel</span>,  <span class="cit-name-given-names">F.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bak</span>,  <span class="cit-name-given-names">F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1992</span><strong>).</strong> <span class="cit-article-title">Chapter 183. Gram-negative mesophilic sulfate-reducing bacteria</span>. In <span class="cit-source">The Prokaryotes</span>. <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. IV</span>, pp. <span class="cit-fpage">3352</span>–<span class="cit-lpage">3378</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Balows</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Trüper</span>,  <span class="cit-name-given-names">H. G.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Dworkin</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Harder</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K.-H.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Chapter%20183.%20Gram-negative%20mesophilic%20sulfate-reducing%20bacteria&amp;author=F.%20Widdel&amp;author=F.%20Bak&amp;publication_year=1992&amp;citation_inbook_title=The%20Prokaryotes">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-39-1" title="View reference  in text"
+                           id="ref-39">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.39"
+                             data-doi="10.1007/BF00407804">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Widdel</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kohring</span>,  <span class="cit-name-given-names">G. W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mayer</span>,  <span class="cit-name-given-names">F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1983</span><strong>).</strong> <span class="cit-article-title">Studies on dissimilatory sulfate-reducing bacteria that decompose fatty acids. III. Characterization of the filamentous gliding
+                                    <em>Desulfonema limicola</em> gen. nov. sp. nov., and <em>Desulfonema magnum</em> sp. nov.</span> <abbr class="cit-jnl-abbrev">Arch Microbiol</abbr> <span class="cit-vol">134</span>, <span class="cit-fpage">286</span>–<span class="cit-lpage">294</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/BF00407804</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/BF00407804&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7283636&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Studies%20on%20dissimilatory%20sulfate-reducing%20bacteria%20that%20decompose%20fatty%20acids.%20III.%20Characterization%20of%20the%20filamentous%20gliding%20Desulfonema%20limicola%20gen.%20nov.%20sp.%20nov.%2C%20and%20Desulfonema%20magnum%20sp.%20nov.&amp;author=F.%20Widdel&amp;author=G.%20W.%20Kohring&amp;author=F.%20Mayer&amp;publication_year=1983&amp;journal=Arch%20Microbiol&amp;volume=134&amp;pages=286-294&amp;doi=10.1007%2FBF00407804">Google Scholar</a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4136.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4149.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="open-access-note">
+               <span class="open-access-note">OPEN ACCESS ARTICLE</span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    <span class="slug-metadata-note ahead-of-print">
+                                 	
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">June 7, 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.048827-0" class="slug-doi">10.1099/ijs.0.048827-0
+                                    </span>
+                                 </span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4141-4148
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li><span class="creative-commons-article">Free via Creative Commons: <span>CC</span></span></li>
+                        <li><span class="ccv cc-version-by/2.5/"></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4141.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4141.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/powerpoint/63/Pt_11/4141">PPT Slides of All Figures</a></li>
+                        <li class="cb-versions">
+                           <div><span id="pap-all-versions-label">All Versions of this Article:</span><ol class="version-list">
+                                 <li><a href="/content/early/2013/06/04/ijs.0.048827-0">ijs.0.048827-0v1</a></li>
+                                 <li class="current-li"><span>63/Pt_11/4141</span> <span class="current-version">most recent</span></li>
+                              </ol>
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings">
+                              <li>New Taxa
+                                 <ul class="subject-sub-headings last-child">
+                                    <li><a class="tocsection-search"
+                                          href="/search?tocsectionid=Proteobacteria&amp;sortspec=date&amp;submit=Submit">Proteobacteria</a></li>
+                                 </ul>
+                              </li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4141&amp;current-view-path=/content/63/Pt_11/4141.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4141&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4141.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4141&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4141.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.048827-0&amp;citation=Labrenz%20et%20al.%2063%20%28Pt%2011%29:%204141&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4141&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=23749282&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4141">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" alt="Permissions" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4141.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4141#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4141" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4141&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4141.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ALabrenz%20author%3AM.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Labrenz, M.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AJ%C3%BCrgens%20author%3AK.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Jürgens, K.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4141.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=23749282&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Labrenz%20M&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Labrenz, M.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=J%C3%BCrgens%20K&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Jürgens, K.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/23749282"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4141.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4141#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.pdf
new file mode 100644
index 00000000..07da41b7
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/results.json b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/results.json
new file mode 100644
index 00000000..50ce3e4f
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/results.json
@@ -0,0 +1,96 @@
+{
+  "publisher": {
+    "value": [
+      "Society for General Microbiology"
+    ]
+  },
+  "journal": {
+    "value": [
+      "International Journal of Systematic and Evolutionary\n                Microbiology"
+    ]
+  },
+  "title": {
+    "value": [
+      "Sulfurimonas gotlandica sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline, and an emended description of the genus Sulfurimonas"
+    ]
+  },
+  "authors": {
+    "value": [
+      "Matthias Labrenz",
+      "Jana Grote",
+      "Kerstin Mammitzsch",
+      "Henricus T. S. Boschker",
+      "Michael Laue",
+      "Günter Jost",
+      "Sabine Glaubitz",
+      "Klaus Jürgens"
+    ]
+  },
+  "date": {
+    "value": [
+      "11/01/2013"
+    ]
+  },
+  "doi": {
+    "value": [
+      "10.1099/ijs.0.048827-0"
+    ]
+  },
+  "volume": {
+    "value": [
+      "63"
+    ]
+  },
+  "issue": {
+    "value": [
+      "Pt 11"
+    ]
+  },
+  "firstpage": {
+    "value": [
+      "4141"
+    ]
+  },
+  "abstract": {
+    "value": [
+      "\n                  \n                      Next Section\n                  Abstract\n                  \n                  A psychro- and aerotolerant bacterium was isolated from the sulfidic water of a pelagic redox zone of the central Baltic Sea.\n                     The slightly curved rod- or spiral-shaped cells were motile by one polar flagellum or two bipolar flagella. Growth was chemolithoautotrophic,\n                     with nitrate or nitrite as electron acceptor and either a variety of sulfur species of different oxidation states or hydrogen\n                     as electron donor. Although the bacterium was able to utilize organic substances such as acetate, pyruvate, peptone and yeast\n                     extract for growth, these compounds yielded considerably lower cell numbers than obtained with reduced sulfur or hydrogen;\n                     in addition, bicarbonate supplementation was necessary. The cells also had an absolute requirement for NaCl. Optimal growth\n                     occurred at 15 °C and at pH 6.6–8.0. The predominant fatty acid of this organism was 16 : 1ω7c, with 3-OH 14 : 0, 16 : 0, 16 : 1ω5c+t and 18 : 1ω7c present in smaller amounts. The DNA G+C content was 33.6 mol%. As determined in 16S rRNA gene sequence phylogeny analysis,\n                     the isolate belongs to the genus Sulfurimonas, within the class Epsilonproteobacteria, with 93.7 to 94.2 % similarity to the other species of the genus Sulfurimonas, Sulfurimonas autotrophica, Sulfurimonas paralvinellae and Sulfurimonas denitrificans. However, the distinct physiological and genotypic differences from these previously described taxa support the description\n                     of a novel species, Sulfurimonas gotlandica sp. nov. The type strain is GD1T ( = DSM 19862T = JCM 16533T). Our results also justify an emended description of the genus Sulfurimonas.\n                  \n                  \n               "
+    ]
+  },
+  "fulltext_html": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4141.full"
+    ]
+  },
+  "fulltext_pdf": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4141.full.pdf"
+    ]
+  },
+  "supplementary_material": {
+    "value": []
+  },
+  "figure": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4141/F1.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4141/F2.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4141/F3.small.gif"
+    ]
+  },
+  "figure_caption": {
+    "value": [
+      "Fig. 1.  \n                     \n                     Cell morphology of spirilla-shaped cells of strain GD1T cultivated on ABW+NS medium. (a) Fluorescence microscopy of 4′,6′-diamidino-2-phenylindol (DAPI) stained cells. (b) Transmission\n                        electron microscopy of a bacterium with one flagellum and (c) of a bacterium with two flagella (indicated by arrows), both\n                        negatively stained with phosphotungstic acid.\n                     \n                     \n                     \n                  ",
+      "Fig. 2.  \n                     \n                     Impact of pyruvate on the growth of isolate GD1T. Error bars indicate the standard deviation of three independent replicates for each assay. (a) Growth on media with different\n                        substrate combinations: 1, NaHCO3, S2O32-, NO3−; 2, NaHCO3, S2O32-, NO3−, pyruvate; 3, NaHCO3, pyruvate; 4, pyruvate; 5, ABW without further supplements. The relative enrichment factor describes the increase of cell\n                        numbers after 7 days of incubation compared to the initial cell numbers after inoculation at day 0 (6.1×105 ml−1). (b) 14CO2 production and [14C]pyruvate incorporation after 24 h and 72 h of incubation. Media: 1, NaHCO3, S2O32-, NO3−, [14C]pyruvate; 2, NaHCO3, NO3−, [14C]pyruvate. P, pyruvate incorporation; CO2, CO2 production.\n                     \n                     \n                     \n                  ",
+      "Fig. 3.  \n                     \n                     Unrooted tree showing phylogenetic relationships of isolate GD1T and closely related members of the class Epsilonproteobacteria. The tree was reconstructed using the neighbour-joining method and was based on a comparison of approximately 1400 nt. Solid\n                        squares indicate that the corresponding nodes (or groups) were recovered in neighbour-joining, maximum-parsimony and maximum-likelihood\n                        methods. Branching points supported by two algorithms are marked by an open square. The following strains were used as an\n                        outgroup (not shown): Antarctobacter heliothermus EL-219T, Sagittula stellata E-37T, Roseovarius tolerans EL-172T, Roseovarius nubinhibens ISMT and Roseovarius mucosus DFL-24T. Bar, 1 substitution per 10 nt.\n                     \n                     \n                     \n                  "
+    ]
+  },
+  "license": {
+    "value": [
+      "\n                  This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted\n                     use, distribution, and reproduction in any medium, provided the original work is properly cited.\n                  \n               "
+    ]
+  },
+  "copyright": {
+    "value": [
+      "Copyright ©\n                     \t\t2015 International Union of Microbiological Societies\n                     \t\n                  "
+    ]
+  }
+}
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/DC1 b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/DC1
new file mode 100644
index 00000000..2266e827
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/DC1
@@ -0,0 +1,358 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Supplementary material </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/ijs.0.052902-0/DC1" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-data-supp.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-data-supp.css" /><script type="text/javascript" id="session-d6526224e1">var callbackToken='5632987E8596775';</script><script type="text/javascript" id="session-d6526224e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-data-supp.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-data-supp">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4174%2Fsuppl%2FDC1">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <h1 class="data-supp-article-title"><span class="named-content genus" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                     href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> <em>siccitolerans</em> sp. nov., a highly desiccation-tolerant, xeroprotectant-producing strain isolated from dry soil
+            </h1>
+            <div><span class="highwire-journal-article-marker-start"></span><div class="auto-clean"><span style="font-family: Verdana,Arial,Helvetica,sans-serif;  font-size: 83.33%">
+                     
+                     
+                     <h2>Supplementary material</h2>
+                     
+                     <p><strong>Files in this Data Supplement:</strong></p>
+                     
+                     <ul>
+                        <li><a href="/content/suppl/2013/11/05/ijs.0.052902-0.DC1/ijs052902.pdf">Supplementary material</a> 
+                           		
+                           
+                        </li>
+                     </ul>
+                     </span>
+                  
+                  
+               </div><span class="highwire-journal-article-marker-end"></span></div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              	<span class="slug-metadata-note ahead-of-print">
+                                 
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">June 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.052902-0" class="slug-doi">10.1099/ijs.0.052902-0</span>
+                                 </span>
+                              
+                              
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date">
+                                    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4174-4180
+                                    </span>
+                                 </cite>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4174.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4174.full" rel="view-full-text">Full Text</a><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4174.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a></li>
+                        <li><span class="variant-indicator">» <span>Supplementary material</span></span></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/F1.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/F1.small.gif
new file mode 100644
index 00000000..b5bfe2e6
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/F1.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.html b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.html
new file mode 100644
index 00000000..98780b0c
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.html
@@ -0,0 +1,1690 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Arthrobacter siccitolerans sp. nov., a highly desiccation-tolerant, xeroprotectant-producing strain isolated from dry soil
+         
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4174" />
+      <meta content="/ijs/63/Pt_11/4174.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Arthrobacter siccitolerans sp. nov., a highly desiccation-tolerant, xeroprotectant-producing strain isolated from dry soil"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.052902-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="L. SantaCruz-Calvo" name="DC.Contributor" />
+      <meta content="J. González-López" name="DC.Contributor" />
+      <meta content="M. Manzanera" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="L. SantaCruz-Calvo" />
+      <meta name="citation_author_institution"
+            content="Institute for Water Research, and Department of Microbiology, University of Granada, Granada, Spain" />
+      <meta name="citation_author" content="J. González-López" />
+      <meta name="citation_author_institution"
+            content="Institute for Water Research, and Department of Microbiology, University of Granada, Granada, Spain" />
+      <meta name="citation_author" content="M. Manzanera" />
+      <meta name="citation_author_institution"
+            content="Institute for Water Research, and Department of Microbiology, University of Granada, Granada, Spain" />
+      <meta content="Arthrobacter siccitolerans sp. nov., a highly desiccation-tolerant, xeroprotectant-producing strain isolated from dry soil"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4174" name="citation_firstpage" />
+      <meta content="4180" name="citation_lastpage" />
+      <meta content="63/Pt_11/4174" name="citation_id" />
+      <meta content="63/Pt 11/4174" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4174" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.052902-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4174.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4174.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4174.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4174"
+            name="citation_public_url" />
+      <meta content="23771623" name="citation_pmid" />
+      <meta name="citation_access" content="all" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Actinobacteria" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4167.short" rel="prev" />
+      <link href="/content/63/Pt_11/4181.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d6526715e1">var callbackToken='5632987E8596775';</script><script type="text/javascript" id="session-d6526715e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4174.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline"><span class="named-content genus" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> <em>siccitolerans</em> sp. nov., a highly desiccation-tolerant, xeroprotectant-producing strain isolated from dry soil
+               </h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=L.+SantaCruz-Calvo&amp;sortspec=date&amp;submit=Submit">L. SantaCruz-Calvo</a></span>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=J.+Gonz%C3%A1lez-L%C3%B3pez&amp;sortspec=date&amp;submit=Submit">J. González-López</a></span> and 
+                     </li>
+                     <li class="last" id="contrib-3"><span class="name"><a class="name-search"
+                              href="/search?author1=M.+Manzanera&amp;sortspec=date&amp;submit=Submit">M. Manzanera</a></span></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address>Institute for Water Research, and Department of Microbiology, University of Granada, Granada, Spain</address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> M. Manzanera <span class="em-link"><span class="em-addr">manzanera{at}ugr.es</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-3">A novel desiccation-tolerant, xeroprotectant-producing bacterium, designated strain 4J27<sup>T</sup>, was isolated from a <em>Nerium oleander</em> rhizosphere subjected to seasonal drought in Granada, Spain. Phylogenetic analysis based on 16S rRNA gene sequencing placed
+                     the isolate within the genus <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                           href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span>, its closest relative being <span class="named-content species" id="named-content-4"><a class="namesforlife" rel="namesforlife-name"
+                           title="Arthrobacter phenanthrenivorans"
+                           href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> Shep3 DSM 18606<sup>T</sup>, with which it showed 99.23 % 16S rRNA gene sequence similarity. DNA–DNA hybridization measurements showed less than 25 %
+                     relatedness between strain 4J27<sup>T</sup> and <span class="named-content species" id="named-content-5"><a class="namesforlife" rel="namesforlife-name"
+                           title="Arthrobacter phenanthrenivorans"
+                           href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup>. The DNA base composition of strain 4J27<sup>T</sup> was 65.3 mol%. The main fatty acids were anteiso C<sub>15 : 0</sub>, anteiso C<sub>17 : 0</sub>, C<sub>16 : 0</sub> and iso C<sub>16 : 0</sub> and the major menaquinone was MK-9 (H<sub>2</sub>). The peptidoglycan type was A3α with an <span class="sc">l</span>-Lys–<span class="sc">l</span>-Ser–<span class="sc">l</span>-Thr–<span class="sc">l</span>-Ala interpeptide bridge. The bacterium tested positive for catalase activity and negative for oxidase activity. Phylogenetic,
+                     chemotaxonomic and phenotypic analyses indicated that the desiccation-tolerant strain 4J27<sup>T</sup> represents a novel species within the genus <span class="named-content genus" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                           href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span>, for which the name <span class="named-content genus" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                           href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> <em>siccitolerans</em> is proposed. The type strain is 4J27<sup>T</sup> ( = CECT 8257<sup>T</sup> = LMG 27359<sup>T</sup>).
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-supplementary-material" id="fn-1">
+                        <p id="p-1">A supplementary figure and a supplementary table are available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="license" id="license-1">
+                  <p id="p-2">This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted
+                     use, distribution, and reproduction in any medium, provided the original work is properly cited.
+                  </p>
+               </div>
+               <p id="p-5">The genus <span class="named-content genus" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span>, first defined by <a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Conn &amp; Dimmick (1947)</a>, belongs to the class <span class="named-content class" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Actinobacteria"
+                        href="doi:10.1601/nm.5712"><em>Actinobacteria</em></a></span> and includes Gram-stain-positive coryneform bacteria with aerobic metabolism and little or no acid production from glucose.
+                  Species of the genus <span class="named-content genus" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> contain lysine in the peptidoglycan and have a DNA G+C content ranging from 59 mol% to 66 mol% (<a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Keddie <em>et al.</em>, 1986</a>; <a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Jones &amp; Keddie, 1992</a>). These bacteria typically take the shape of rods in younger cultures and cocci in older cultures (<a id="xref-ref-17-2" class="xref-bibr" href="#ref-17">Keddie <em>et al.</em>, 1986</a>), depending on their growth rate and nutritional conditions (Germida &amp; Cassida, 1980). The transition to this coccoid-like
+                  state has been shown to require manganese (Germida &amp; Cassida, 1980). The small coccoid-like state has been described as being
+                  the most stable form. Due to their pleomorphic and heterogeneous appearance, strains of species of the genus <span class="named-content genus" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> were originally grouped with the Corynebacteria (<a id="xref-ref-17-3" class="xref-bibr" href="#ref-17">Keddie <em>et al.</em>, 1986</a>).
+               </p>
+               <p id="p-6">In response to changing extracellular osmolarity such as desiccation or increased salinity some micro-organisms accumulate
+                  small organic compounds (<a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">Brown, 1976</a>; <a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Arakawa&amp; Timasheff, 1982</a>). These compatible solutes act as protectants, which under laboratory conditions can also stabilize enzymes, DNA, cell membranes
+                  and even whole cells against different kinds of stress, such as freezing, drying and heating (<a id="xref-ref-3-2" class="xref-bibr" href="#ref-3">Brown, 1976</a>; <a id="xref-ref-47-1" class="xref-bibr" href="#ref-47">Yancey <em>et al.</em>, 1982</a>; <a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Knapp <em>et al.</em>, 1999</a>; <a id="xref-ref-26-1" class="xref-bibr" href="#ref-26">Manzanera <em>et al.</em> 2002</a>, <a id="xref-ref-31-1" class="xref-bibr" href="#ref-31">Narváez-Reinaldo <em>et al.</em>, 2010</a>, <a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Julca <em>et al.</em>, 2012</a>). Our group has previously reported a new method for the isolation of desiccation-tolerant micro-organisms from dry soil
+                  using organic solvents as selective agents (<a id="xref-ref-27-1" class="xref-bibr" href="#ref-27">Manzanera <em>et al.</em>, 2004a</a>; <a id="xref-ref-31-2" class="xref-bibr" href="#ref-31">Narváez-Reinaldo <em>et al.</em>, 2010</a>). Strain 4J27<sup>T</sup> displayed remarkably high tolerance to desiccation and produced excellent xeroprotectants for the dry stabilization of proteins
+                  (lipase enzymes) and whole prokaryotic cells (<span class="named-content species" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Escherichia coli"
+                        href="doi:10.1601/nm.3093"><em>Escherichia coli</em></a></span> MC4100) compared with those when trehalose was used (<a id="xref-ref-28-1" class="xref-bibr" href="#ref-28">Manzanera <em>et al.</em>, 2004b</a>; <a id="xref-ref-31-3" class="xref-bibr" href="#ref-31">Narváez-Reinaldo <em>et al.</em>, 2010</a>). Among the 10 different xeroprotectants tested, the best results were observed with S4J27-D (composed of trehalose, glutamine
+                  and glucose), a synthetic mixture derived from strain 4J27<sup>T</sup> (<a id="xref-ref-31-4" class="xref-bibr" href="#ref-31">Narváez-Reinaldo <em>et al.</em>, 2010</a>).
+               </p>
+               <p id="p-7">Here we describe the morphological, biochemical and phylogenetic characteristics of this desiccation-tolerant strain (4J27<sup>T</sup>), isolated from dry soil and with a remarkable potential for the dry stabilization of some biomaterials. On the basis of
+                  the phylogenetic analysis of the 16S rRNA gene sequence together with physiological, chemotaxonomic and DNA–DNA hybridization
+                  analyses we demonstrate that strain 4J27<sup>T</sup> represents a novel species of the genus <span class="named-content genus" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span>.
+               </p>
+               <p id="p-8">Strain 4J27<sup>T</sup> was grown at 30 °C (±3 °C) in tryptone soya agar (TSA) plates and in tryptone soya broth (TSB) or M9 minimal medium (M6030;
+                  Sigma). <span class="named-content species" id="named-content-14"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup> was included in the study as reference.
+               </p>
+               <p id="p-9">Strain 4J27<sup>T</sup>, the object of this study, had already been assigned to the genus <span class="named-content genus" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> by partial analysis of its 16S rRNA gene sequence (GenBank accession number <a href="/external-ref?link_type=GEN&amp;access_num=GU815139">GU815139</a>; <a id="xref-ref-31-5" class="xref-bibr" href="#ref-31">Narváez-Reinaldo <em>et al.</em>, 2010</a>), which was compared with those in the EzTaxon-e server (<a href="http://eztaxon-e.ezbiocloud.net/">http://eztaxon-e.ezbiocloud.net/</a>, <a id="xref-ref-19-1" class="xref-bibr" href="#ref-19">Kim <em>et al.</em>, 2012</a>). The nearly complete sequence of the 16S rRNA gene of strain 4J27<sup>T</sup> (approximately 1500 bp) was aligned with the sequences of closely related species of the genus <span class="named-content genus" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> by using the <span class="sc">clustal</span> <span class="sc">x</span> 2 program (<a id="xref-ref-24-1" class="xref-bibr" href="#ref-24">Larkin <em>et al.</em>, 2007</a>). A phylogenetic tree was inferred using the neighbour-joining (<a id="xref-ref-35-1" class="xref-bibr" href="#ref-35">Saitou &amp; Nei, 1987</a>) and maximum-likelihood (<a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Guindon &amp; Gascuel, 2003</a>) methods with the <span class="sc">mega</span> 5.0 software package (<a id="xref-ref-41-1" class="xref-bibr" href="#ref-41">Tamura <em>et al.</em>, 2011</a>). Bootstrap analysis was based on 1000 resamplings (<a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Felsenstein, 1985</a>). The distances were calculated according to Kimura’s two-parameter model (<a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Kimura, 1980</a>). The resulting neighbour-joining tree obtained with Kimura’s two-parameter model is shown in <a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1</a> and the maximum-likelihood tree is shown in Fig. S1, available in IJSEM Online.
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4174/F1.expansion.html"><img alt="Fig. 1. " src="4174/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4174/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4174/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4174/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-10" class="first-child">Neighbour-joining phylogenetic tree based on 16S rRNA sequence comparisons of strain 4J27<sup>T</sup> and its 24 closest relatives. <span class="named-content species" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Streptomyces albus"
+                              href="doi:10.1601/nm.11066"><em>Streptomyces albus</em></a></span> AS 4.164<sup>T</sup> was used as the outgroup. The numbers at bifurcations indicate how many times each species coincided in this position as
+                        percentages and only values &gt; 50% are shown. Bar, 0.01 changes per nucleotide position.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-11">The sequence corresponding to the 16S rRNA gene of strain 4J27<sup>T</sup> showed 99.23 % similarity to that of <span class="named-content species" id="named-content-18"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup>. Phylogenetic analysis showed that strain 4J27<sup>T</sup> clearly belongs to the genus <span class="named-content genus" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span><em>,</em> and its closest relative was <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup>.
+               </p>
+               <p id="p-12">DNA–DNA hybridization was carried out at the Deutsche Sammlung von Mikroorganismen und Zellkulturen (DSMZ; Braunschweig, Germany).
+                  Cells of <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup> and strain 4J27<sup>T</sup> were disrupted by using a French pressure cell (Thermo Spectronic) and the DNA of each strain in the crude lysate was purified
+                  by chromatography on hydroxyapatite as described by <a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Cashion <em>et al.</em> (1977)</a>. DNA–DNA hybridization was conducted as described by <a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">De Ley <em>et al.</em> (1970)</a> with the modifications described by <a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Huss <em>et al.</em> (1983)</a> using a model Cary 100 Bio UV/VIS-spectrophotometer equipped with a Peltier-thermostat-regulated 6×6 multicell charger and
+                  a temperature controller with <em>in situ</em> temperature probe (Varian). DNA–DNA hybridization of strain 4J27<sup>T</sup> with <span class="named-content species" id="named-content-22"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup> resulted in a DNA–DNA relatedness value of 22.3 % (22.1 %), the value in parentheses being the result of measurements in
+                  duplicate. On the basis of DNA–DNA reciprocal hybridization, strain 4J27<sup>T</sup> did not belong to the species <span class="named-content species" id="named-content-23"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> according to the recommendations of a threshold value of 70 % DNA–DNA relatedness for the definition of bacterial species
+                  (<a id="xref-ref-44-1" class="xref-bibr" href="#ref-44">Wayne <em>et al.</em>, 1987</a>). Therefore strain 4J27<sup>T</sup> probably represents a novel species of the genus <span class="named-content genus" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span>.
+               </p>
+               <p id="p-13">The G+C (mol%) content of the genomic DNA of strain 4J27<sup>T</sup> was analysed at the DSMZ. The dG and dT ratio was calculated according to the method of <a id="xref-ref-29-1" class="xref-bibr" href="#ref-29">Mesbah <em>et al.</em> (1989)</a>. Species of the genus <span class="named-content genus" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> have previously been described as Gram-stain-positive actinobacteria with high GC content (<a id="xref-ref-17-4" class="xref-bibr" href="#ref-17">Keddie <em>et al.</em>, 1986</a>; <a id="xref-ref-14-2" class="xref-bibr" href="#ref-14">Jones &amp; Keddie, 1992</a>), which typically have a DNA G+C content in the range of 59–66 mol% (<a id="xref-ref-17-5" class="xref-bibr" href="#ref-17">Keddie <em>et al.</em>, 1986</a>). The DNA G+C content of strain 4J27<sup>T</sup> was 65.3 mol%, which was within the range shown by all members of the genus <span class="named-content genus" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> and considered to have a high GC content (<a id="xref-ref-17-6" class="xref-bibr" href="#ref-17">Keddie <em>et al.</em>, 1986</a>).
+               </p>
+               <p id="p-14">Chemotaxonomic analyses were carried out by the Identification Service of the DSMZ. Peptidoglycans were isolated from strain
+                  4J27<sup>T</sup> and their structures analysed (<a id="xref-ref-38-1" class="xref-bibr" href="#ref-38">Schleifer &amp; Kandler, 1972</a>). After derivatization according to the method of <a id="xref-ref-25-1" class="xref-bibr" href="#ref-25">MacKenzie (1987)</a> the approximate molar amino-acid ratio was determined by gas chromatography. Free amino groups within the peptidoglycan
+                  were detected by labelling with 1-fluoro-2,4-dinitrobenzene (<a id="xref-ref-37-1" class="xref-bibr" href="#ref-37">Schleifer, 1985</a>). The peptidoglycan of strain 4J27<sup>T</sup> was composed of Ala, Ser, Thr, Glu and Lys at a molar ratio of 2.8 : 1.2 : 1.0 : 1.0 : 1.5. Two-dimensional TLC of the partial
+                  hydrolysate (4 M HCl, 100 °C, 45 min) of the peptidoglycan revealed the presence of the peptides <span class="sc">l</span>-Ala–<span class="sc">d</span>-Glu, <span class="sc">l</span>-Lys–<span class="sc">d</span>-Ala, <span class="sc">l</span>-Lys–<span class="sc">l</span>-Ser, <span class="sc">l</span>-Lys–<span class="sc">l</span>-Ser–<span class="sc">l</span>-Thr, <span class="sc">d</span>-Ala–<span class="sc">l</span>-Lys–<span class="sc">l</span>-Ser–<span class="sc">l</span>-Thr, <span class="sc">l</span>-Ser–<span class="sc">l</span>-Thr and <span class="sc">l</span>-Ala–<span class="sc">d</span>-Ala. On the basis of these results it was concluded that strain 4J27<sup>T</sup> contains a type A3α peptidoglycan (<a id="xref-ref-38-2" class="xref-bibr" href="#ref-38">Schleifer &amp; Kandler, 1972</a>) with an <span class="sc">l</span>-Lys–<span class="sc">l</span>-Ser–<span class="sc">l</span>-Thr–<span class="sc">l</span>-Ala interpeptide bridge (A11.23 DSMZ-Catalogue of strains, 7th edition, 2001), which is found in the more closely related
+                  members of the genus <span class="named-content genus" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span>, according to the neighbour-joining phylogenetic tree, such as <span class="named-content species" id="named-content-28"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter chlorophenolicus"
+                        href="doi:10.1601/nm.5845"><em>Arthrobacter chlorophenolicus</em></a></span>, <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter oxydans"
+                        href="doi:10.1601/nm.5863"><em>Arthrobacter oxydans</em></a></span>, <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter polychromogenes"
+                        href="doi:10.1601/nm.5866"><em>Arthrobacter polychromogenes</em></a></span>, <span class="named-content species" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter sulfonivorans"
+                        href="doi:10.1601/nm.5875"><em>Arthrobacter sulfonivorans</em></a></span>, <span class="named-content species" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter equi"
+                        href="doi:10.1601/nm.22523"><em>Arthrobacter equi</em></a></span>, <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter niigatensis"
+                        href="doi:10.1601/nm.14163"><em>Arthrobacter niigatensis</em></a></span>, <span class="named-content species" id="named-content-34"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span>, <span class="named-content species" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter defluvii"
+                        href="doi:10.1601/nm.13218"><em>Arthrobacter defluvii</em></a></span>, <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter roseus"
+                        href="doi:10.1601/nm.5872"><em>Arthrobacter roseus</em></a></span> and <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter scleromae"
+                        href="doi:10.1601/nm.9649"><em>Arthrobacter scleromae</em></a></span> (<a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Borodina <em>et al.</em>, 2002</a>; <a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Kodama <em>et al.</em>, 1992</a>; <a id="xref-ref-45-1" class="xref-bibr" href="#ref-45">Westerberg <em>et al.</em>, 2000</a>; <a id="xref-ref-34-1" class="xref-bibr" href="#ref-34">Reddy <em>et al.</em>, 2002</a>; <a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Huang <em>et al.</em>, 2005</a>; <a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Kim <em>et al.</em>, 2008</a>; <a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Ding <em>et al.</em>, 2009</a>; <a id="xref-ref-48-1" class="xref-bibr" href="#ref-48">Yassin <em>et al.</em>, 2011</a>). Strains containing a type A3α peptidoglycan make up a rather uniform group, although they do show a considerable number
+                  of different types of interpeptide bridge. Most of these strains belong to the genus <span class="named-content genus" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> and are distinguished by strictly aerobic growth and a complete life cycle (<a id="xref-ref-5-2" class="xref-bibr" href="#ref-5">Conn &amp; Dimmick, 1947</a>; <a id="xref-ref-38-3" class="xref-bibr" href="#ref-38">Schleifer &amp; Kandler, 1972</a>).
+               </p>
+               <p id="p-15">Fatty-acid methyl esters were obtained from 40 mg cells of strain 4J27<sup>T</sup> scraped from Petri dishes by saponification, methylation and extraction using the methods of <a id="xref-ref-30-1" class="xref-bibr" href="#ref-30">Miller (1982)</a> and <a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Kuykendall <em>et al.</em> (1988)</a> with minor modifications. The fatty-acid methyl-ester mixtures were separated using the Sherlock Microbial Identification
+                  System (MIS) (MIDI, Microbial ID). The main cellular fatty acids of the highly desiccation-tolerant strain 4J27<sup>T</sup> were, from highest to lowest, anteiso-C<sub>15 : 0</sub>, 41.20 %; anteiso-C<sub>17 : 0</sub>, 30.86 %; C<sub>16 : 0</sub>, 10.21 %; iso-C<sub>16 : 0</sub>, 6.61 %; iso-C<sub>15 : 0</sub>, 4.40 %; C<sub>18 : 0</sub>, 2.38 %; iso-C<sub>17 : 0</sub>, 1.79 %; iso-C<sub>14 : 0</sub>, 0.83 %; C<sub>14 : 0</sub>, 0.75 %; anteiso-C<sub>19 : 0</sub>, 0.61 % and iso-C<sub>18 : 0</sub>, 0.36 %. The fatty-acid composition of strain 4J27<sup>T</sup> was consistent with that of the genus <span class="named-content genus" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span>, with branched-chain fatty acid, anteiso-pentadecanoic acid (anteiso-C<sub>15 : 0</sub>) predominating (<a id="xref-ref-45-2" class="xref-bibr" href="#ref-45">Westerberg <em>et al.</em>, 2000</a>).
+               </p>
+               <p id="p-16">Respiratory quinones were analysed as described by <a id="xref-ref-42-1" class="xref-bibr" href="#ref-42">Tindall (1990a</a>; b), using TLC and UV mass spectroscopy, and found menaquinone to be the sole quinone component. Analyses of the electron-transport
+                  system (isoprenoid quinones) for strain 4J27<sup>T</sup> resulted in detection of MK9 (II-H<sub>2</sub>) 68 %; MK9 21 % and MK8 (II-H<sub>2</sub>) 11 %.
+               </p>
+               <p id="p-17">To analyse the whole cell sugars of strain 4J27<sup>T</sup>, cells were hydrolysed in 0.5 M H<sub>2</sub>SO<sub>4</sub> for 2 h at 100 °C. Sulfuric acid was removed by 20 % <em>N,N</em>-dioctylmethylamine in chloroform according to the method of <a id="xref-ref-46-1" class="xref-bibr" href="#ref-46">Whiton <em>et al.</em> (1985)</a>. Sugars in the hydrolysate were analysed by TLC on cellulose plates according to the methods of <a id="xref-ref-40-1" class="xref-bibr" href="#ref-40">Staneck &amp; Roberts (1974)</a>. The whole-cell sugars of the isolated strain were galactose, glucose, mannose, ribose and rhamnose.
+               </p>
+               <p id="p-18">Mobility was tested by stab-inoculating mannitol-mobility semi-solid agar (413782; Ultimed). This semi-solid agar medium enabled
+                  us to analyse the nitrate reductase activity (capacity to reduce nitrate to nitrite) and catabolism of mannitol by using Griess–Ilosvay
+                  A and B reagents. Oxidase activity was determined using 1 % w/v <em>N</em>,<em>N</em>,<em>N</em>′,<em>N</em>′-tetramethyl-<em>p</em>-phenylenediamine and catalase activity was determined by the production of bubbles from 3 % v/v H<sub>2</sub>O<sub>2</sub>. Cells of strain 4J27<sup>T</sup> were identified as catalase-positive, oxidase-negative, nitrate reductase-negative and mannitol-positive. <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup>.
+               </p>
+               <p id="p-19">To characterize the growth of strain 4J27<sup>T</sup> at different temperatures, pH values and salinities, cultures were incubated at 150 r.p.m. in Luria–Bertani (LB) rich medium
+                  (L3152; Sigma). Cell growth was monitored at different temperatures (5, 10, 15, 20, 25, 30, 35, 40, 45 and 50 °C), pH (3,
+                  5, 7, 9, 12 and 13) and NaCl concentrations (0, 0.2, 0.4, 0.6, 0.8, 1 and 1.2 M) by measuring the OD<sub>600</sub> in triplicate at 0, 12 and 24 h using a UV-160A spectrophotometer (Shimadzu). Strain 4J27<sup>T</sup> grew best at 30 °C in LB medium. It was able to grow at 37 °C and 15 °C but not at 40 °C or 10 °C. The pH range for growth
+                  was between 5 and 9 with optimum growth at pH 7. Strain 4J27<sup>T</sup> grew in NaCl concentrations ranging from 0 to 0.8 M but grew best at 0.2 M. This differed clearly from the most closely related
+                  species, <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup>, which was able to grow at 4 °C but not at pH 5.
+               </p>
+               <p id="p-20">The following API kits were used for testing: API Coryne, API 20NE and API 20E (bioMérieux). Each test was interpreted according
+                  to the manufacturer’s instructions. Biolog tests were performed to investigate which compounds the strains in question could
+                  use for respiration. A GP2 MicroPlate (Cat. No 1014; Biolog), containing 95 different carbon compounds, was used to test for
+                  substrate oxidation. The chemistry of these plates is based on tetrazolium reduction, in response to metabolic processes such
+                  as fermentation and oxidation. Tetrazolium reduction produced formazan in a variety of colours from dark blue to deep red
+                  to orange, depending upon the original tetrazolium salt used as the substrate for the reaction. MicroPlates were inoculated
+                  and interpreted according to the manufacturer’s instructions. The results were recorded after 12 h based on <em>A</em><sub>585</sub>. Antibiotic susceptibility testing was performed using the disc-diffusion method in which the antibiotic diffuses away from
+                  the disc in two dimensions, forming a concentration gradient that inhibits the growth of bacteria and causes an inhibition
+                  zone (Piddock, 1990). The results were interpreted according to the criteria established for staphylococci in 1997 by the
+                  National Committee for Clinical Laboratory Standards (2000). At the concentrations assayed, the inhibition zone caused by
+                  streptomycin was 157 mm, rifampicin 347 mm, chloramphenicol 340 mm, kanamycin 150 mm and tetracycline 157 mm and thus it could
+                  be concluded that strain 4J27<sup>T</sup> was susceptible to all the antibiotics tested. The phenotypic differences between strain 4J27<sup>T</sup> and closely related species are summarized in <a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a> and the physiological differences between strain 4J27<sup>T</sup> and its closest relative species <span class="named-content species" id="named-content-42"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup> are summarized in Table S1.
+               </p>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4174/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4174/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Differential characteristics between strain 4J27<sup>T</sup> and the type strains of the most closely related species of the genus <span class="named-content genus" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                              href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span></span>
+                     
+                     <p id="p-21" class="first-child">Strains: 1, 4J27<sup>T</sup>; 2, <span class="named-content species" id="named-content-44"><a class="namesforlife" rel="namesforlife-name"
+                              title="Arthrobacter phenanthrenivorans"
+                              href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup>; 3, <span class="named-content species" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter niigatensis"
+                              href="doi:10.1601/nm.14163"><em>Arthrobacter niigatensis</em></a></span> IAM 15382<sup>T</sup>; 4, <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter defluvii"
+                              href="doi:10.1601/nm.13218"><em>Arthrobacter defluvii</em></a></span> DSM 18782<sup>T</sup>; 5, <span class="named-content species" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter equi"
+                              href="doi:10.1601/nm.22523"><em>Arthrobacter equi</em></a></span> DSM 23395<sup>T</sup>; 6, <span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name"
+                              title="Arthrobacter chlorophenolicus"
+                              href="doi:10.1601/nm.5845"><em>Arthrobacter chlorophenolicus</em></a></span> DSM 12829<sup>T</sup>; 7, <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name"
+                              title="Arthrobacter polychromogenes"
+                              href="doi:10.1601/nm.5866"><em>Arthrobacter polychromogenes</em></a></span> DSM 20136<sup>T</sup>; 8, <span class="named-content species" id="named-content-50"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter oxydans"
+                              href="doi:10.1601/nm.5863"><em>Arthrobacter oxydans</em></a></span> DSM 20119<sup>T</sup>; 9, <span class="named-content species" id="named-content-51"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter scleromae"
+                              href="doi:10.1601/nm.9649"><em>Arthrobacter scleromae</em></a></span> JCM 12642<sup>T</sup>. Data of the reference species were taken from <a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Kallimanis <em>et al.</em> (2009)</a>, <a id="xref-ref-7-2" class="xref-bibr" href="#ref-7">Ding <em>et al.</em> (2009)</a>, <a id="xref-ref-18-2" class="xref-bibr" href="#ref-18">Kim <em>et al.</em> (2008)</a>, <a id="xref-ref-48-2" class="xref-bibr" href="#ref-48">Yassin <em>et al.</em> (2011)</a>, <a id="xref-ref-45-3" class="xref-bibr" href="#ref-45">Westerberg <em>et al.</em> (2000)</a>, Schippers-Lammertse <em>et al.</em> (2009), <a id="xref-ref-39-1" class="xref-bibr" href="#ref-39">Sguros (1955)</a>, <a id="xref-ref-12-2" class="xref-bibr" href="#ref-12">Huang <em>et al.</em> (2005)</a> and the present study. +, Positive; −, negative; <span class="sc">nd</span>, not determined; CFA, cellular fatty acid.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-23">The degree of tolerance to desiccation shown by strain 4J27<sup>T</sup> was compared with that of the previously described desiccation-tolerant bacteria <span class="named-content species" id="named-content-52"><a class="namesforlife" rel="namesforlife-name"
+                        title="Acinetobacter calcoaceticus"
+                        href="doi:10.1601/nm.2766"><em>Acinetobacter calcoaceticus</em></a></span> PADD68 (<a id="xref-ref-31-6" class="xref-bibr" href="#ref-31">Narváez-Reinaldo <em>et al.</em>, 2010</a>), the desiccation-sensitive strain <span class="named-content species" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="Pseudomonas putida"
+                        href="doi:10.1601/nm.2674"><em>Pseudomonas putida</em></a></span> KT2440 (<a id="xref-ref-26-2" class="xref-bibr" href="#ref-26">Manzanera <em>et al.</em>, 2002</a>) and the closely related <span class="named-content species" id="named-content-54"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup>. A colony of a pure culture grown for 48 h of each strain, containing 10<sup>7</sup> to 10<sup>9</sup> cells, was suspended in 1 ml M9 minimal medium. Aliquots (100 µl) were placed on sterile Petri dishes and dried under a current
+                  of sterile air for 24 h. The cells were then suspended in 1 ml sterile saline buffer, and serial dilutions of the cell suspension
+                  were plated on TSA plates before and after drying. All such procedures were conducted at room temperature. The survival rate
+                  was calculated in terms of c.f.u. ml<sup>−1</sup> after drying compared with c.f.u. ml<sup>−1</sup> before drying, expressed as a percentage. The assays were performed in triplicate according to the protocol of <a id="xref-ref-26-3" class="xref-bibr" href="#ref-26">Manzanera <em>et al.</em>, 2002</a>. Strain 4J27<sup>T</sup> showed the highest values of desiccation tolerance (31.58 %±6.9 %), which were significantly different from those of the
+                  positive control, <span class="named-content species" id="named-content-55"><a class="namesforlife" rel="namesforlife-name"
+                        title="Acinetobacter calcoaceticus"
+                        href="doi:10.1601/nm.2766"><em>Acinetobacter calcoaceticus</em></a></span> PADD68 (3.23 %±0.2 %) and more so from the closely related strain, <span class="named-content species" id="named-content-56"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup> (1.5 %±0.41 %). As expected, the desiccation tolerance of the negative control, <span class="named-content species" id="named-content-57"><a class="namesforlife" rel="namesforlife-name" title="P. putida"
+                        href="doi:10.1601/nm.2674"><em>P. putida</em></a></span> KT2440<sup>T</sup>, was below detectable levels. Therefore the closely related species <span class="named-content species" id="named-content-58"><a class="namesforlife" rel="namesforlife-name"
+                        title="Arthrobacter phenanthrenivorans"
+                        href="doi:10.1601/nm.13221"><em>Arthrobacter phenanthrenivorans</em></a></span> DSM 18606<sup>T</sup> is considered to be desiccation-sensitive, due to its low degree of desiccation tolerance, in contrast to the novel strain,
+                  which is considered to be a desiccation-tolerant strain.
+               </p>
+               <p id="p-24">On the basis of phylogenetic analysis of its 16S rRNA gene sequence, together with physiological, chemotaxonomic and DNA–DNA
+                  hybridization analyses, strain 4J27<sup>T</sup> is considered to represent a novel species of the genus <span class="named-content genus" id="named-content-59"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span>, for which the name <span class="named-content genus" id="named-content-60"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                        href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> <em>siccitolerans</em> is proposed.
+               </p>
+               <div class="section" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  
+                  <div id="sec-2" class="subsection">
+                     
+                     <h3>Description of <span class="named-content genus" id="named-content-61"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                              href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> <em>siccitolerans</em> sp. nov.
+                     </h3>
+                     
+                     <p id="p-25"><span class="named-content genus" id="named-content-62"><a class="namesforlife" rel="namesforlife-name" title="Arthrobacter"
+                              href="doi:10.1601/nm.5839"><em>Arthrobacter</em></a></span> <em>siccitolerans</em> (sic.ci.to′le.rans. L. adj. <em>siccus</em> dry, L. part. adj. <em>tolerans</em> tolerating; N.L. part. adj. <em>siccitolerans</em> dry-tolerating).
+                     </p>
+                     
+                     <p id="p-26">Cells are non-motile, non-spore-forming, Gram-positive, aerobic and rod-to-coccus-shaped. Colonies on TSA are convex, circular,
+                        cream, opaque and usually 1–2 mm in diameter within 2 days at 30 °C. Catalase-positive, oxidase-negative and nitrate-reductase-negative
+                        (no capacity to reduce nitrate to nitrite). Grows at temperatures from 15 to 35 °C, pH 5–9 and with 0–0.8 M NaCl in LB medium.
+                        The peptidoglycan type is A3α (<a id="xref-ref-38-4" class="xref-bibr" href="#ref-38">Schleifer &amp; Kandler, 1972</a>), with an <span class="sc">l</span>-Lys–<span class="sc">l</span>-Ser–<span class="sc">l</span>-Thr–<span class="sc">l</span>-Ala interpeptide bridge. The major cellular fatty acids are anteiso C<sub>15 : 0</sub>, anteiso C<sub>17 : 0</sub>, C<sub>16 : 0</sub> and iso C<sub>16 : 0</sub>. The major menaquinone is MK9-(II-H<sub>2</sub>). The whole-cell sugars of the strain are galactose, glucose, mannose, ribose and rhamnose. It reduces nitrites to nitrogen.
+                        Indole and acetoin (Voges–Proskauer) production are positive. According to the results from the API CORYNE, API 20NE and API
+                        20E strips, the following enzyme activities are detected: pyrazinamidase, β-glucuronidase, β-galactosidase, α-glucosidase,
+                        β-glucosidase (aesculin), β-galactosidase (<em>p</em>-nitrophenyl-β-<span class="sc">d</span>-galactopyranosidase). Assimilation of glucose, arabinose, mannose, mannitol, N-acetyl-glucosamine, maltose, potassium gluconate,
+                        malate, trisodium citrate, inositol, sorbitol, rhamnose, sucrose, melibiose, amygdalin and arabinose are positive. The following
+                        enzyme activities are not present: β-galactosidase (<em>o</em>-nitro-phenyl-β-<span class="sc">d</span>-galactopyranoside), arginine dihydrolase, lysine decarboxylase, ornithine decarboxylase, urease, tryptophan desaminase, gelatinase,
+                        pyrrolidonyl arylamidase, alkaline phosphatase and <em>N</em>-acetyl-β-glucosaminidase. Production of H<sub>2</sub>S is negative and citrate is not used. In the Biolog GP2 MicroPlates the following substrates were used for respiration:
+                        dextrin, inulin, <span class="sc">l</span>-arabinose, <em>N</em>-acetyl-<span class="sc">d</span>-glucosamine, <em>N</em>-acetyl-<span class="sc">d</span>-mannosamine, <span class="sc">d</span>-arbutin, cellobiose, <span class="sc">d</span>-fructose, <span class="sc">d</span>-galactose, <span class="sc">d</span>-galacturonic acid, α-<span class="sc">d</span>-glucose, gentiobiose, lactamide, <span class="sc">l</span>-lactic acid, lactulose, maltose, maltotriose, <span class="sc">d</span>-mannitol, <span class="sc">d</span>-mannose, melezitose, melibiose, 3-methyl glucose, α-methyl <span class="sc">d</span>-mannoside, palatinose, <span class="sc">d</span>-psicose, <span class="sc">d</span>-raffinose, <span class="sc">l</span>-rhamnose, <span class="sc">d</span>-ribose, salicin, <span class="sc">d</span>-sorbitol, sucrose, trehalose, turanose, xylitol, <span class="sc">d</span>-xylose, acetic acid, α-hydroxybutyric acid, β-hydroxybutyric acid, <em>p</em>-hydroxyphenylacetic acid, α-ketovaleric acid, <span class="sc">l</span>-malic acid, pyruvic acid, <span class="sc">l</span>-alaninamide, <span class="sc">l</span>-alanyl glycine, glycyl-<span class="sc">l</span>-glutamic acid, putrescine, glycerol, adenosine, 2′-deoxy adenosine, inosine, thymidine, uridine, thymidine-5′ monophosphate,
+                        glucose-1-phosphate and <span class="sc">d</span>-<span class="sc">l</span>-α-glycerol phosphate. The following compounds were not used for respiration: α-cyclodextrin, β-cyclodextrin, glycogen, mannan,
+                        Tween 40, Tween 80, amygdalin, <span class="sc">d</span>-arabitol, <span class="sc">d</span>-fructose, <span class="sc">l</span>-fucose, <span class="sc">d</span>-gluconic acid, <em>myo</em>-inositol, α-<span class="sc">d</span>-lactose, α-methyl-<span class="sc">d</span>-galactoside, β-methyl-<span class="sc">d</span>-galactoside, α-methyl-<span class="sc">d</span>-glucoside, β-methyl-<span class="sc">d</span>-glucoside, palatinose, propionic acid, <span class="sc">l</span>-alanine, <span class="sc">l</span>-asparagine, <span class="sc">l</span>-glutamic acid, <span class="sc">l</span>-pyroglutamic acid and <span class="sc">l</span>-serine, sedoheptulose, stachyose, <span class="sc">d</span>-tagatose, γ-hydroxybutyric acid, α-ketoglutaric acid, <span class="sc">d</span>-lactic acid methyl ester, <span class="sc">d</span>-malic acid, methyl pyruvate, mono-methyl succinate, succinamic acid, succinic acid, <span class="sc">d</span>-alanine, <em>N</em>-acetyl-<span class="sc">l</span>-glutamic acid, 2,3-butanediol, adenosine-5′-monophosphate, uridine-5′-monophosphate, fructose-6-phosphate and glucose-6-phosphate.
+                        Susceptible to all the antibiotics tested: streptomycin, rifampicin, chloramphenicol, kanamycin and tetracycline.
+                     </p>
+                     
+                     <p id="p-27">The type strain, 4J27<sup>T</sup> ( = CECT 8257<sup>T</sup> = LMG 27359<sup>T</sup>), was isolated from a <em>Nerium oleander</em> rhizosphere subjected to seasonal drought in Granada, Spain. The DNA G+C content of strain 4J27<sup>T</sup> is 65.3 mol%.
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-28">We thank María de la Encarnación Olimpia Velázquez Pérez of the University of Salamanca for her useful discussions. This research
+                     was funded by the Spanish Ministry of Science and Innovation under the aegis of research project P07-RNM-02588 and the Andalusian
+                     Regional Government under the aegis of research project CTM2009-09270. M. M. received a Ramón y Cajal research grant from
+                     the Ministry of Science and Innovation as well as support from European Regional Development Funds (EU). The authors also
+                     thank J. Trout of the University of Granada Scientific Translation Service for revising their English text.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.1"
+                             data-doi="10.1021/bi00268a033">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Arakawa</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Timasheff</span>,  <span class="cit-name-given-names">S. N.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1982</span><strong>).</strong> <span class="cit-article-title">Stabilization of protein structure by sugars</span>. <abbr class="cit-jnl-abbrev">Biochemistry</abbr> <span class="cit-vol">21</span>, <span class="cit-fpage">6536</span>–<span class="cit-lpage">6544</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1021/bi00268a033</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>7150574</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1021/bi00268a033&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7150574&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Stabilization%20of%20protein%20structure%20by%20sugars&amp;author=T.%20Arakawa&amp;author=S.%20N.%20Timasheff&amp;publication_year=1982&amp;journal=Biochemistry&amp;volume=21&amp;pages=6536-6544&amp;doi=10.1021%2Fbi00268a033&amp;pmid=7150574">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.2"
+                             data-doi="10.1007/s00203-001-0373-3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Borodina</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kelly</span>,  <span class="cit-name-given-names">D. P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schumann</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rainey</span>,  <span class="cit-name-given-names">F. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ward-Rainey</span>,  <span class="cit-name-given-names">N. L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">A. P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title">Enzymes of dimethylsulfone metabolism and the phylogenetic characterization of the facultative methylotrophs <em>Arthrobacter sulfonivorans</em> sp. nov., <em>Arthrobacter methylotrophus</em> sp. nov., and <em>Hyphomicrobium sulfonivorans</em> sp. nov.</span> <abbr class="cit-jnl-abbrev">Arch Microbiol</abbr> <span class="cit-vol">177</span>, <span class="cit-fpage">173</span>–<span class="cit-lpage">183</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s00203-001-0373-3</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>11807567</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s00203-001-0373-3&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=11807567&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Enzymes%20of%20dimethylsulfone%20metabolism%20and%20the%20phylogenetic%20characterization%20of%20the%20facultative%20methylotrophs%20Arthrobacter%20sulfonivorans%20sp.%20nov.%2C%20Arthrobacter%20methylotrophus%20sp.%20nov.%2C%20and%20Hyphomicrobium%20sulfonivorans%20sp.%20nov.&amp;author=E.%20Borodina&amp;author=D.%20P.%20Kelly&amp;author=P.%20Schumann&amp;author=F.%20A.%20Rainey&amp;author=N.%20L.%20Ward-Rainey&amp;author=A.%20P.%20Wood&amp;publication_year=2002&amp;journal=Arch%20Microbiol&amp;volume=177&amp;pages=173-183&amp;doi=10.1007%2Fs00203-001-0373-3&amp;pmid=11807567">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brown</span>,  <span class="cit-name-given-names">A. D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1976</span><strong>).</strong> <span class="cit-article-title">Microbial water stress</span>. <abbr class="cit-jnl-abbrev">Bacteriol Rev</abbr> <span class="cit-vol">40</span>, <span class="cit-fpage">803</span>–<span class="cit-lpage">846</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>1008746</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=mmbr&amp;resid=40/4/803"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.4"
+                             data-doi="10.1016/0003-2697(77)90720-5">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cashion</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Holder-Franklin</span>,  <span class="cit-name-given-names">M. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McCully</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Franklin</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1977</span><strong>).</strong> <span class="cit-article-title">A rapid method for the base ratio determination of bacterial DNA</span>. <abbr class="cit-jnl-abbrev">Anal Biochem</abbr> <span class="cit-vol">81</span>, <span class="cit-fpage">461</span>–<span class="cit-lpage">466</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/0003-2697(77)90720-5</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>907108</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/0003-2697(77)90720-5&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=907108&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20rapid%20method%20for%20the%20base%20ratio%20determination%20of%20bacterial%20DNA&amp;author=P.%20Cashion&amp;author=M.%20A.%20Holder-Franklin&amp;author=J.%20McCully&amp;author=M.%20Franklin&amp;publication_year=1977&amp;journal=Anal%20Biochem&amp;volume=81&amp;pages=461-466&amp;doi=10.1016%2F0003-2697%2877%2990720-5&amp;pmid=907108">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.5">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Conn</span>,  <span class="cit-name-given-names">H. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dimmick</span>,  <span class="cit-name-given-names">I.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1947</span><strong>).</strong> <span class="cit-article-title">Soil bacteria similar in morphology to <em>Mycobacterium</em> and <em>Corynebacterium</em></span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">54</span>, <span class="cit-fpage">291</span>–<span class="cit-lpage">303</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16561362</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=jb&amp;resid=54/3/291-b"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.6"
+                             data-doi="10.1111/j.1432-1033.1970.tb00830.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">De Ley</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cattoir</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reynaerts</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1970</span><strong>).</strong> <span class="cit-article-title">The quantitative measurement of DNA hybridization from renaturation rates</span>. <abbr class="cit-jnl-abbrev">Eur J Biochem</abbr> <span class="cit-vol">12</span>, <span class="cit-fpage">133</span>–<span class="cit-lpage">142</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1432-1033.1970.tb00830.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4984993</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1432-1033.1970.tb00830.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=4984993&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20quantitative%20measurement%20of%20DNA%20hybridization%20from%20renaturation%20rates&amp;author=J.%20De%20Ley&amp;author=H.%20Cattoir&amp;author=A.%20Reynaerts&amp;publication_year=1970&amp;journal=Eur%20J%20Biochem&amp;volume=12&amp;pages=133-142&amp;doi=10.1111%2Fj.1432-1033.1970.tb00830.x&amp;pmid=4984993">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.7"
+                             data-doi="10.1099/ijs.0.65301-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ding</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hirose</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yokota</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Four novel <em>Arthrobacter</em> species isolated from filtration substrate</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">59</span>, <span class="cit-fpage">856</span>–<span class="cit-lpage">862</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.65301-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19329620</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=59/4/856"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-book no-rev-xref" id="cit-63.Pt_11.4174.8">
+                           <div class="cit-metadata"><cite><span class="cit-auth cit-collab">DSMZ</span> <strong>(</strong><span class="cit-pub-date">2001</span><strong>).</strong> <span class="cit-article-title">Catalogue of Strains, 7th edn</span>, p. <span class="cit-fpage">617</span>. <span class="cit-publ-loc">Braunschweig</span>: <span class="cit-publ-name">DSMZ</span>. <a href="http://www.dsmz.de/fileadmin/Bereiche/Microbiology/Dateien/Key_to_Murein2.pdf">http://www.dsmz.de/fileadmin/Bereiche/Microbiology/Dateien/Key_to_Murein2.pdf</a></cite></div>
+                           <div class="cit-extra"></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.9"
+                             data-doi="10.2307/2408678">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Felsenstein</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1985</span><strong>).</strong> <span class="cit-article-title">Confidence limits on phylogenies: an approach using the bootstrap</span>. <abbr class="cit-jnl-abbrev">Evolution</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">783</span>–<span class="cit-lpage">791</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.2307/2408678</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.2307/2408678&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7288891&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Confidence%20limits%20on%20phylogenies%3A%20an%20approach%20using%20the%20bootstrap&amp;author=J.%20Felsenstein&amp;publication_year=1985&amp;journal=Evolution&amp;volume=39&amp;pages=783-791&amp;doi=10.2307%2F2408678">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-journal no-rev-xref" id="cit-63.Pt_11.4174.10">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Germida</span>,  <span class="cit-name-given-names">J. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Casida</span>,  <span class="cit-name-given-names">L. E.</span>  <span class="cit-name-suffix">Jr</span>.</span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1980</span><strong>).</strong> <span class="cit-article-title">Myceloid growth of <em>Arthrobacter globiformis</em> and other <em>Arthrobacter</em> species</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">144</span>, <span class="cit-fpage">1152</span>–<span class="cit-lpage">1158</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>6254945</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=144/3/1152"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.11"
+                             data-doi="10.1080/10635150390235520">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Guindon</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gascuel</span>,  <span class="cit-name-given-names">O.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title">A simple, fast, and accurate algorithm to estimate large phylogenies by maximum likelihood</span>. <abbr class="cit-jnl-abbrev">Syst Biol</abbr> <span class="cit-vol">52</span>, <span class="cit-fpage">696</span>–<span class="cit-lpage">704</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1080/10635150390235520</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14530136</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=sysbio&amp;resid=52/5/696"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.12"
+                             data-doi="10.1128/JCM.43.3.1451-1455.2005">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Huang</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zhao</span>,  <span class="cit-name-given-names">N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">He</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wang</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Liu</span>,  <span class="cit-name-given-names">Z.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">You</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Guan</span>,  <span class="cit-name-given-names">F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title"><em>Arthrobacter scleromae</em> sp. nov. isolated from human clinical specimens</span>. <abbr class="cit-jnl-abbrev">J Clin Microbiol</abbr> <span class="cit-vol">43</span>, <span class="cit-fpage">1451</span>–<span class="cit-lpage">1455</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JCM.43.3.1451-1455.2005</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15750131</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jcm&amp;resid=43/3/1451"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.13"
+                             data-doi="10.1016/S0723-2020(83)80048-4">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Huss</span>,  <span class="cit-name-given-names">V. A. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Festl</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K. H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1983</span><strong>).</strong> <span class="cit-article-title">Studies on the spectrophotometric determination of DNA hybridization from renaturation rates</span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">184</span>–<span class="cit-lpage">192</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0723-2020(83)80048-4</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23194591</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0723-2020(83)80048-4&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23194591&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Studies%20on%20the%20spectrophotometric%20determination%20of%20DNA%20hybridization%20from%20renaturation%20rates&amp;author=V.%20A.%20R.%20Huss&amp;author=H.%20Festl&amp;author=K.%20H.%20Schleifer&amp;publication_year=1983&amp;journal=Syst%20Appl%20Microbiol&amp;volume=4&amp;pages=184-192&amp;doi=10.1016%2FS0723-2020%2883%2980048-4&amp;pmid=23194591">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4174.14">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Balows</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Truper</span>,  <span class="cit-name-given-names">H. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Dworkin</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Harder</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K. H.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jones</span>,  <span class="cit-name-given-names">D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Keddie</span>,  <span class="cit-name-given-names">R. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1992</span><strong>).</strong> <span class="cit-article-title">The genus <em>Arthrobacter</em></span>. In <span class="cit-source">The Prokaryotes: a Handbook on the Biology of Bacteria: Ecophysiology, Isolation, Identification, Applications</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1283</span>–<span class="cit-lpage">1299</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Balows</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Truper</span>,  <span class="cit-name-given-names">H. G.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Dworkin</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Harder</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K. H.</span></span>
+                                 . <span class="cit-publ-loc">NY</span>: <span class="cit-publ-name">Springer</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20genus%20Arthrobacter&amp;author=D.%20Jones&amp;author=R.%20M.%20Keddie&amp;publication_year=1992&amp;citation_inbook_title=The%20Prokaryotes%3A%20a%20Handbook%20on%20the%20Biology%20of%20Bacteria%3A%20Ecophysiology%2C%20Isolation%2C%20Identification%2C%20Applications">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.15"
+                             data-doi="10.1016/j.biotechadv.2012.07.002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Julca</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alaminos</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">González-López</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Manzanera</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Xeroprotectants for the stabilization of biomaterials</span>. <abbr class="cit-jnl-abbrev">Biotechnol Adv</abbr> <span class="cit-vol">30</span>, <span class="cit-fpage">1641</span>–<span class="cit-lpage">1654</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.biotechadv.2012.07.002</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22814234</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.biotechadv.2012.07.002&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=22814234&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Xeroprotectants%20for%20the%20stabilization%20of%20biomaterials&amp;author=I.%20Julca&amp;author=M.%20Alaminos&amp;author=J.%20Gonz%C3%A1lez-L%C3%B3pez&amp;author=M.%20Manzanera&amp;publication_year=2012&amp;journal=Biotechnol%20Adv&amp;volume=30&amp;pages=1641-1654&amp;doi=10.1016%2Fj.biotechadv.2012.07.002&amp;pmid=22814234">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.16"
+                             data-doi="10.1099/ijs.0.000984-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kallimanis</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kavakiotis</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Perisynakis</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Spröer</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pukall</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Drainas</span>,  <span class="cit-name-given-names">C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Koukkou</span>,  <span class="cit-name-given-names">A. I.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title"><em>Arthrobacter phenanthrenivorans</em> sp. nov., to accommodate the phenanthrene-degrading bacterium <em>Arthrobacter</em> sp. strain Sphe3</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">59</span>, <span class="cit-fpage">275</span>–<span class="cit-lpage">279</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.000984-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19196765</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=59/2/275"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4174.17">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Sneath</span>,  <span class="cit-name-given-names"> P. H. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Mair</span>,  <span class="cit-name-given-names">N. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Sharpe</span>,  <span class="cit-name-given-names">M. E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Keddie</span>,  <span class="cit-name-given-names">R. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Collins</span>,  <span class="cit-name-given-names">M. D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jones</span>,  <span class="cit-name-given-names">D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1986</span><strong>).</strong> <span class="cit-article-title">Genus <em>Arthrobacter</em> Conn and Dimmick 1947, 300AL</span>. In <span class="cit-source">Bergey's Manual of Systematic Bacteriology</span>, pp. <span class="cit-fpage">1288</span>–<span class="cit-lpage">1301</span>. Edited by
+                                 <span class="cit-ed"><span class="cit-name-surname">Sneath</span>,  <span class="cit-name-given-names"> P. H. A.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Mair</span>,  <span class="cit-name-given-names">N. S.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Sharpe</span>,  <span class="cit-name-given-names">M. E.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span>
+                                 . <span class="cit-publ-loc">Baltimore</span>: <span class="cit-publ-name">Williams &amp; Wilkins</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20Arthrobacter%20Conn%20and%20Dimmick%201947%2C%20300AL&amp;author=R.%20M.%20Keddie&amp;author=M.%20D.%20Collins&amp;author=D.%20Jones&amp;publication_year=1986&amp;citation_inbook_title=Bergey%27s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.18"
+                             data-doi="10.1099/ijs.0.65550-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">K. K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">K. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Oh</span>,  <span class="cit-name-given-names">H. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">M. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Eom</span>,  <span class="cit-name-given-names">M. K.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">J. S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><em>Arthrobacter defluvii</em> sp. nov., 4-chlorophenol-degrading bacteria isolated from sewage</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">58</span>, <span class="cit-fpage">1916</span>–<span class="cit-lpage">1921</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.65550-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18676480</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=58/8/1916"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-19-1" title="View reference  in text"
+                           id="ref-19">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.19"
+                             data-doi="10.1099/ijs.0.038075-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">O. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cho</span>,  <span class="cit-name-given-names">Y. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yoon</span>,  <span class="cit-name-given-names">S. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Na</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Park</span>,  <span class="cit-name-given-names">S. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jeon</span>,  <span class="cit-name-given-names">Y. S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">J. H.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Introducing EzTaxon-e: a prokaryotic 16S rRNA gene sequence database with phylotypes that represent uncultured species</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">62</span>, <span class="cit-fpage">716</span>–<span class="cit-lpage">721</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.038075-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22140171</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=62/Pt_3/716"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.20"
+                             data-doi="10.1007/BF01731581">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kimura</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1980</span><strong>).</strong> <span class="cit-article-title">A simple method for estimating evolutionary rates of base substitutions through comparative studies of nucleotide sequences</span>. <abbr class="cit-jnl-abbrev">J Mol Evol</abbr> <span class="cit-vol">16</span>, <span class="cit-fpage">111</span>–<span class="cit-lpage">120</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/BF01731581</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>7463489</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/BF01731581&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7463489&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20simple%20method%20for%20estimating%20evolutionary%20rates%20of%20base%20substitutions%20through%20comparative%20studies%20of%20nucleotide%20sequences&amp;author=M.%20Kimura&amp;publication_year=1980&amp;journal=J%20Mol%20Evol&amp;volume=16&amp;pages=111-120&amp;doi=10.1007%2FBF01731581&amp;pmid=7463489">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.21"
+                             data-doi="10.1007/s007920050116">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Knapp</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ladenstein</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Galinski</span>,  <span class="cit-name-given-names">E. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1999</span><strong>).</strong> <span class="cit-article-title">Extrinsic protein stabilization by the naturally occurring osmolytes β-hydroxyectoine and betaine</span>. <abbr class="cit-jnl-abbrev">Extremophiles</abbr> <span class="cit-vol">3</span>, <span class="cit-fpage">191</span>–<span class="cit-lpage">198</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s007920050116</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>10484175</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s007920050116&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=10484175&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Extrinsic%20protein%20stabilization%20by%20the%20naturally%20occurring%20osmolytes%20%CE%B2-hydroxyectoine%20and%20betaine&amp;author=S.%20Knapp&amp;author=R.%20Ladenstein&amp;author=E.%20A.%20Galinski&amp;publication_year=1999&amp;journal=Extremophiles&amp;volume=3&amp;pages=191-198&amp;doi=10.1007%2Fs007920050116&amp;pmid=10484175">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.22"
+                             data-doi="10.1099/00207713-42-2-234">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kodama</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yamamoto</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Amano</span>,  <span class="cit-name-given-names">N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Amachi</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1992</span><strong>).</strong> <span class="cit-article-title">Reclassification of two strains of <em>Arthrobacter oxydans</em> and proposal of <em>Arthrobacter nicotinovorans</em> sp. nov.</span> <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">42</span>, <span class="cit-fpage">234</span>–<span class="cit-lpage">239</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-42-2-234</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>1581183</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=42/2/234"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.23"
+                             data-doi="10.1099/00207713-38-4-358">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuykendall</span>,  <span class="cit-name-given-names">L. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Roy</span>,  <span class="cit-name-given-names">M. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">O'Neill</span>,  <span class="cit-name-given-names">J. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Devine</span>,  <span class="cit-name-given-names">T. E.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1988</span><strong>).</strong> <span class="cit-article-title">Fatty acids, antibiotic resistance, and deoxyribonucleic acid homology groups of <em>Bradorhizobium japonicum</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">38</span>, <span class="cit-fpage">358</span>–<span class="cit-lpage">361</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-38-4-358</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=38/4/358"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-24-1" title="View reference  in text"
+                           id="ref-24">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.24"
+                             data-doi="10.1093/bioinformatics/btm404">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Larkin</span>,  <span class="cit-name-given-names">M. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Blackshields</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brown</span>,  <span class="cit-name-given-names">N. P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chenna</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McGettigan</span>,  <span class="cit-name-given-names">P. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McWilliam</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Valentin</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wallace</span>,  <span class="cit-name-given-names">I. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wilm</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title"><span class="sc">clustal</span> <span class="sc">w</span> and <span class="sc">clustal</span>_<span class="sc">x</span> version 2.0</span>. <abbr class="cit-jnl-abbrev">Bioinformatics</abbr> <span class="cit-vol">23</span>, <span class="cit-fpage">2947</span>–<span class="cit-lpage">2948</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/bioinformatics/btm404</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17846036</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=bioinfo&amp;resid=23/21/2947"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-25-1" title="View reference  in text"
+                           id="ref-25">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.25">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">MacKenzie</span>,  <span class="cit-name-given-names">S. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1987</span><strong>).</strong> <span class="cit-article-title">Gas chromatographic analysis of amino acids as the N-heptafluorobutyryl isobutyl esters</span>. <abbr class="cit-jnl-abbrev">J Assoc Anal Chem</abbr> <span class="cit-vol">70</span>, <span class="cit-fpage">151</span>–<span class="cit-lpage">160</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>1008746</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=1008746&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Gas%20chromatographic%20analysis%20of%20amino%20acids%20as%20the%20N-heptafluorobutyryl%20isobutyl%20esters&amp;author=S.%20L.%20MacKenzie&amp;publication_year=1987&amp;journal=J%20Assoc%20Anal%20Chem&amp;volume=70&amp;pages=151-160&amp;pmid=1008746">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-26-1" title="View reference  in text"
+                           id="ref-26">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.26"
+                             data-doi="10.1128/AEM.68.9.4328-4333.2002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Manzanera</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">García de Castro</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tøndervik</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rayner-Brandes</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Strøm</span>,  <span class="cit-name-given-names">A. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tunnacliffe</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title">Hydroxyectoine is superior to trehalose for anhydrobiotic engineering of <em>Pseudomonas putida</em> KT2440</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">68</span>, <span class="cit-fpage">4328</span>–<span class="cit-lpage">4333</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.68.9.4328-4333.2002</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>12200283</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=68/9/4328"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-27-1" title="View reference  in text"
+                           id="ref-27">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.27"
+                             data-doi="10.1128/AEM.70.5.3143-3145.2004">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Manzanera</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Vilchez</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tunnacliffe</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004a</span><strong>).</strong> <span class="cit-article-title">Plastic encapsulation of stabilized <em>Escherichia coli</em> and <em>Pseudomonas putida</em></span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">70</span>, <span class="cit-fpage">3143</span>–<span class="cit-lpage">3145</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.70.5.3143-3145.2004</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15128579</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=70/5/3143"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-28-1" title="View reference  in text"
+                           id="ref-28">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.28"
+                             data-doi="10.1111/j.1574-6968.2004.tb09502.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Manzanera</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Vilchez</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tunnacliffe</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004b</span><strong>).</strong> <span class="cit-article-title">High survival and stability rates of <em>Escherichia coli</em> dried in hydroxyectoine</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Lett</abbr> <span class="cit-vol">233</span>, <span class="cit-fpage">347</span>–<span class="cit-lpage">352</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6968.2004.tb09502.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15063506</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1574-6968.2004.tb09502.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=15063506&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=High%20survival%20and%20stability%20rates%20of%20Escherichia%20coli%20dried%20in%20hydroxyectoine&amp;author=M.%20Manzanera&amp;author=S.%20Vilchez&amp;author=A.%20Tunnacliffe&amp;publication_year=2004b&amp;journal=FEMS%20Microbiol%20Lett&amp;volume=233&amp;pages=347-352&amp;doi=10.1111%2Fj.1574-6968.2004.tb09502.x&amp;pmid=15063506">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-29-1" title="View reference  in text"
+                           id="ref-29">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.29"
+                             data-doi="10.1099/00207713-39-2-159">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mesbah</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Premachandran</span>,  <span class="cit-name-given-names">U.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Whitman</span>,  <span class="cit-name-given-names">W.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989</span><strong>).</strong> <span class="cit-article-title">Precise measurement of the G+C content of deoxyribonucleic acid by high performance liquid chromatography</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">159</span>–<span class="cit-lpage">167</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-39-2-159</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=39/2/159"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-30-1" title="View reference  in text"
+                           id="ref-30">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.30">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miller</span>,  <span class="cit-name-given-names">L. T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1982</span><strong>).</strong> <span class="cit-article-title">Single derivatization method for routine analysis of bacterial whole-cell fatty acid methyl esters including hydroxy acids</span>. <abbr class="cit-jnl-abbrev">J Clin Microbiol</abbr> <span class="cit-vol">16</span>, <span class="cit-fpage">584</span>–<span class="cit-lpage">586</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>7130373</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jcm&amp;resid=16/3/584"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-31-1" title="View reference  in text"
+                           id="ref-31">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.31"
+                             data-doi="10.1128/AEM.00855-10">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Narváez-Reinaldo</span>,  <span class="cit-name-given-names">J. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Barba</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">González-López</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tunnacliffe</span>,  <span class="cit-name-given-names">A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Manzanera</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Rapid method for isolation of desiccation-tolerant strains and xeroprotectants</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">76</span>, <span class="cit-fpage">5254</span>–<span class="cit-lpage">5262</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.00855-10</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20562279</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=76/15/5254"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-book no-rev-xref" id="cit-63.Pt_11.4174.32">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth cit-collab">National Committee for Clinical Laboratory Standards</span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1997</span><strong>).</strong> <span class="cit-source">Minimum inhibitory concentration (MIC) interpretive standards (g/ml) for organisms other than <em>Haemophilus</em> spp., <em>Neisseria gonorrhoeae</em>, and <em>Streptococcus</em> spp. NCCLS document M7–A4</span>. <span class="cit-publ-loc">Wayne, PA</span>: <span class="cit-publ-name">National Committee for Clinical Laboratory Standards</span>.</cite></div>
+                           <div class="cit-extra"></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-journal no-rev-xref" id="cit-63.Pt_11.4174.33"
+                             data-doi="10.1111/j.1365-2672.1990.tb02880.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Piddock</span>,  <span class="cit-name-given-names">L. J. V.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1990</span><strong>).</strong> <span class="cit-article-title">Techniques used for the determination of antimicrobial resistance and sensitivity in bacteria</span>. <abbr class="cit-jnl-abbrev">J Appl Bacteriol</abbr> <span class="cit-vol">68</span>, <span class="cit-fpage">307</span>–<span class="cit-lpage">318</span>.<span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1365-2672.1990.tb02880.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>2190965</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1365-2672.1990.tb02880.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=2190965&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Techniques%20used%20for%20the%20determination%20of%20antimicrobial%20resistance%20and%20sensitivity%20in%20bacteria&amp;author=L.%20J.%20V.%20Piddock&amp;publication_year=1990&amp;journal=J%20Appl%20Bacteriol&amp;volume=68&amp;pages=307-318&amp;doi=10.1111%2Fj.1365-2672.1990.tb02880.x&amp;pmid=2190965">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-34-1" title="View reference  in text"
+                           id="ref-34">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.34"
+                             data-doi="10.1099/ijs.0.02131-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reddy</span>,  <span class="cit-name-given-names">G. S. N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Prakash</span>,  <span class="cit-name-given-names">J. S. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Matsumoto</span>,  <span class="cit-name-given-names">G. I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Shivaji</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title"><em>Arthrobacter roseus</em> sp. nov., a psychrophilic bacterium isolated from an Antarctic cyanobacterial mat sample</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">52</span>, <span class="cit-fpage">1017</span>–<span class="cit-lpage">1021</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.02131-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>12054218</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=52/3/1017"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-35-1" title="View reference  in text"
+                           id="ref-35">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.35"
+                             data-doi="10.1099/ijs.0.01472-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Saitou</span>,  <span class="cit-name-given-names">N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nei</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1987</span><strong>).</strong> <span class="cit-article-title">The neighbor-joining method: a new method for reconstructing phylogenetic trees</span>. <abbr class="cit-jnl-abbrev">Mol Biol Evol</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">406</span>–<span class="cit-lpage">425</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>3447015</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=molbiolevol&amp;resid=4/4/406"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-journal no-rev-xref" id="cit-63.Pt_11.4174.36"
+                             data-doi="10.1007/BF02046033">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schippers-Lammertse</span>,  <span class="cit-name-given-names">A. F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Muijsers</span>,  <span class="cit-name-given-names">A. O.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Klatser-Oedekerk</span>,  <span class="cit-name-given-names">K. B.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1963</span><strong>).</strong> <span class="cit-article-title"><em>Arthrobacter polychromogenes</em> nov. spec., its pigments, and a bacteriophage of this species</span>. <abbr class="cit-jnl-abbrev">Antonie van Leeuwenhoek</abbr> <span class="cit-vol">29</span>, <span class="cit-fpage">1</span>–<span class="cit-lpage">15</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/BF02046033</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/BF02046033&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Arthrobacter%20polychromogenes%20nov.%20spec.%2C%20its%20pigments%2C%20and%20a%20bacteriophage%20of%20this%20species&amp;author=A.%20F.%20Schippers-Lammertse&amp;author=A.%20O.%20Muijsers&amp;author=K.%20B.%20Klatser-Oedekerk&amp;publication_year=1963&amp;journal=Antonie%20van%20Leeuwenhoek&amp;volume=29&amp;pages=1-15&amp;doi=10.1007%2FBF02046033">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-37-1" title="View reference  in text"
+                           id="ref-37">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.37"
+                             data-doi="10.1016/S0580-9517(08)70474-4">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K. H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1985</span><strong>).</strong> <span class="cit-article-title">Analysis of the chemical composition and primary structure of murein</span>. <abbr class="cit-jnl-abbrev">Methods Microbiol</abbr> <span class="cit-vol">18</span>, <span class="cit-fpage">123</span>–<span class="cit-lpage">156</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0580-9517(08)70474-4</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0580-9517(08)70474-4&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=17911292&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Analysis%20of%20the%20chemical%20composition%20and%20primary%20structure%20of%20murein&amp;author=K.%20H.%20Schleifer&amp;publication_year=1985&amp;journal=Methods%20Microbiol&amp;volume=18&amp;pages=123-156&amp;doi=10.1016%2FS0580-9517%2808%2970474-4">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-38-1" title="View reference  in text"
+                           id="ref-38">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.38"
+                             data-doi="10.1016/S0580-9517(08)70474-4">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K. H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kandler</span>,  <span class="cit-name-given-names">O.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1972</span><strong>).</strong> <span class="cit-article-title">Peptidoglycan types of bacterial cell walls and their taxonomic implications</span>. <abbr class="cit-jnl-abbrev">Bacteriol Rev</abbr> <span class="cit-vol">36</span>, <span class="cit-fpage">407</span>–<span class="cit-lpage">477</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4568761</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=mmbr&amp;resid=36/4/407"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-39-1" title="View reference  in text"
+                           id="ref-39">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.39">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sguros</span>,  <span class="cit-name-given-names">P. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1955</span><strong>).</strong> <span class="cit-article-title">Microbial transformations of the tobacco alkaloids. I. Cultural and morphological characteristics of a nicotinophile</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">69</span>, <span class="cit-fpage">28</span>–<span class="cit-lpage">37</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>13233163</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=jb&amp;resid=69/1/28"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-40-1" title="View reference  in text"
+                           id="ref-40">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.40"
+                             data-doi="10.1093/molbev/msm092">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Staneck</span>,  <span class="cit-name-given-names">J. L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Roberts</span>,  <span class="cit-name-given-names">G. D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1974</span><strong>).</strong> <span class="cit-article-title">Simplified approach to identification of aerobic actinomycetes by thin-layer chromatography</span>. <abbr class="cit-jnl-abbrev">Appl Microbiol</abbr> <span class="cit-vol">28</span>, <span class="cit-fpage">226</span>–<span class="cit-lpage">231</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4605116</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1093/molbev/msm092&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=4605116&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Simplified%20approach%20to%20identification%20of%20aerobic%20actinomycetes%20by%20thin-layer%20chromatography&amp;author=J.%20L.%20Staneck&amp;author=G.%20D.%20Roberts&amp;publication_year=1974&amp;journal=Appl%20Microbiol&amp;volume=28&amp;pages=226-231&amp;pmid=4605116">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-41-1" title="View reference  in text"
+                           id="ref-41">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.41"
+                             data-doi="10.1093/molbev/msr121">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tamura</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Peterson</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Peterson</span>,  <span class="cit-name-given-names">N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stecher</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nei</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kumar</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title"><span class="sc">mega</span>5: molecular evolutionary genetics analysis using maximum likelihood, evolutionary distance, and maximum parsimony methods</span>. <abbr class="cit-jnl-abbrev">Mol Biol Evol</abbr> <span class="cit-vol">28</span>, <span class="cit-fpage">2731</span>–<span class="cit-lpage">2739</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/molbev/msr121</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21546353</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=molbiolevol&amp;resid=28/10/2731"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-42-1" title="View reference  in text"
+                           id="ref-42">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.42"
+                             data-doi="10.1016/S0723-2020(11)80158-X">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1990a</span><strong>).</strong> <span class="cit-article-title">A comparative study of the lipid composition of <em>Halobacterium saccharovorum</em> from various sources</span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">13</span>, <span class="cit-fpage">128</span>–<span class="cit-lpage">130</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0723-2020(11)80158-X</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0723-2020(11)80158-X&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20comparative%20study%20of%20the%20lipid%20composition%20of%20Halobacterium%20saccharovorum%20from%20various%20sources&amp;author=B.%20J.%20Tindall&amp;publication_year=1990a&amp;journal=Syst%20Appl%20Microbiol&amp;volume=13&amp;pages=128-130&amp;doi=10.1016%2FS0723-2020%2811%2980158-X">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-journal no-rev-xref" id="cit-63.Pt_11.4174.43"
+                             data-doi="10.1111/j.1574-6968.1990.tb03996.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1990b</span><strong>).</strong> <span class="cit-article-title">Lipid composition of <em>Halobacterium lacusprofundi</em></span><em>.</em> <abbr class="cit-jnl-abbrev">FEMS Microbiol Lett</abbr> <span class="cit-vol">66</span>, <span class="cit-fpage">199</span>–<span class="cit-lpage">202</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6968.1990.tb03996.x</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=femsle&amp;resid=66/1-3/199"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-44-1" title="View reference  in text"
+                           id="ref-44">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.44"
+                             data-doi="10.1099/00207713-37-4-463">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wayne</span>,  <span class="cit-name-given-names">L. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Colwell</span>,  <span class="cit-name-given-names">R. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grimont</span>,  <span class="cit-name-given-names">P. A. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kandler</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krichevsky</span>,  <span class="cit-name-given-names">M. I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">L. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">W. E. C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">1987</span><strong>).</strong> <span class="cit-article-title">International Committee on Systematic Bacteriology. Report of the ad hoc committee on reconciliation of approaches to bacterial
+                                    systematics</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">37</span>, <span class="cit-fpage">463</span>–<span class="cit-lpage">464</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-37-4-463</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=37/4/463"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-45-1" title="View reference  in text"
+                           id="ref-45">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.45"
+                             data-doi="10.1099/00207713-50-6-2083">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Westerberg</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Elväng</span>,  <span class="cit-name-given-names">A. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jansson</span>,  <span class="cit-name-given-names">J. K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2000</span><strong>).</strong> <span class="cit-article-title"><em>Arthrobacter chlorophenolicus</em> sp. nov., a new species capable of degrading high concentrations of 4-chlorophenol</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">50</span>, <span class="cit-fpage">2083</span>–<span class="cit-lpage">2092</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-50-6-2083</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>11155983</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=50/6/2083"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-46-1" title="View reference  in text"
+                           id="ref-46">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.46"
+                             data-doi="10.1016/S0021-9673(01)95474-3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Whiton</span>,  <span class="cit-name-given-names">R. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lau</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Morgan</span>,  <span class="cit-name-given-names">S. L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gilbart</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fox</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1985</span><strong>).</strong> <span class="cit-article-title">Modifications in the alditol acetate method for analysis of muramic acid and other neutral and amino sugars by capillary gas
+                                    chromatography-mass spectrometry with selected ion monitoring</span>. <abbr class="cit-jnl-abbrev">J Chromatogr A</abbr> <span class="cit-vol">347</span>, <span class="cit-fpage">109</span>–<span class="cit-lpage">120</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0021-9673(01)95474-3</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4086626</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0021-9673(01)95474-3&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=4086626&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Modifications%20in%20the%20alditol%20acetate%20method%20for%20analysis%20of%20muramic%20acid%20and%20other%20neutral%20and%20amino%20sugars%20by%20capillary%20gas%20chromatography-mass%20spectrometry%20with%20selected%20ion%20monitoring&amp;author=R.%20S.%20Whiton&amp;author=P.%20Lau&amp;author=S.%20L.%20Morgan&amp;author=J.%20Gilbart&amp;author=A.%20Fox&amp;publication_year=1985&amp;journal=J%20Chromatogr%20A&amp;volume=347&amp;pages=109-120&amp;doi=10.1016%2FS0021-9673%2801%2995474-3&amp;pmid=4086626">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-47-1" title="View reference  in text"
+                           id="ref-47">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.47"
+                             data-doi="10.1126/science.7112124">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yancey</span>,  <span class="cit-name-given-names">P. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Clark</span>,  <span class="cit-name-given-names">M. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hand</span>,  <span class="cit-name-given-names">S. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bowlus</span>,  <span class="cit-name-given-names">R. D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Somero</span>,  <span class="cit-name-given-names">G. N.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1982</span><strong>).</strong> <span class="cit-article-title">Living with water stress: evolution of osmolyte systems</span>. <abbr class="cit-jnl-abbrev">Science</abbr> <span class="cit-vol">217</span>, <span class="cit-fpage">1214</span>–<span class="cit-lpage">1222</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1126/science.7112124</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>7112124</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=sci&amp;resid=217/4566/1214"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-48-1" title="View reference  in text"
+                           id="ref-48">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4174.48"
+                             data-doi="10.1099/ijs.0.026690-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yassin</span>,  <span class="cit-name-given-names">A. F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Spröer</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Siering</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hupfer</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schumann</span>,  <span class="cit-name-given-names">P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title"><em>Arthrobacter equi</em> sp. nov., isolated from veterinary clinical material</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">61</span>, <span class="cit-fpage">2089</span>–<span class="cit-lpage">2094</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.026690-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20870884</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=61/9/2089"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4167.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4181.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="open-access-note">
+               <span class="open-access-note">OPEN ACCESS ARTICLE</span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    <span class="slug-metadata-note ahead-of-print">
+                                 	
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">June 14, 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.052902-0" class="slug-doi">10.1099/ijs.0.052902-0
+                                    </span>
+                                 </span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4174-4180
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li><span class="creative-commons-article">Free via Creative Commons: <span>CC</span></span></li>
+                        <li><span class="ccv cc-version-by/2.5/"></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4174.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4174.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_11/4174/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_11/4174">PPT Slides of All Figures</a></li>
+                        <li class="cb-versions">
+                           <div><span id="pap-all-versions-label">All Versions of this Article:</span><ol class="version-list">
+                                 <li><a href="/content/early/2013/06/10/ijs.0.052902-0">ijs.0.052902-0v1</a></li>
+                                 <li class="current-li"><span>63/Pt_11/4174</span> <span class="current-version">most recent</span></li>
+                              </ol>
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings">
+                              <li>New Taxa
+                                 <ul class="subject-sub-headings last-child">
+                                    <li><a class="tocsection-search"
+                                          href="/search?tocsectionid=Actinobacteria&amp;sortspec=date&amp;submit=Submit">Actinobacteria</a></li>
+                                 </ul>
+                              </li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4174&amp;current-view-path=/content/63/Pt_11/4174.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4174&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4174.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4174&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4174.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.052902-0&amp;citation=SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29:%204174&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4174&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=23771623&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4174">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4174.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4174#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4174" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4174&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4174.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ASantaCruz-Calvo%20author%3AL.%22"
+                              class="cb-art-gs-auth author-link">Articles by  SantaCruz-Calvo, L.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AManzanera%20author%3AM.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Manzanera, M.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4174.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=23771623&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=SantaCruz-Calvo%20L&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  SantaCruz-Calvo, L.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Manzanera%20M&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Manzanera, M.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/23771623"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4174.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4174#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4174&amp;title=Arthrobacter%20siccitolerans%20sp.%20nov.%2C%20a%20highly%20desiccation-tolerant%2C%20xeroprotectant-producing%20strain%20isolated%20from%20dry%20soil+--+SantaCruz-Calvo%20et%20al.%2063%20%28Pt%2011%29%3A%204174+--+IJSEM&amp;doi=10.1099/ijs.0.052902-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.pdf
new file mode 100644
index 00000000..030ee9d7
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/results.json b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/results.json
new file mode 100644
index 00000000..ecb2065b
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/results.json
@@ -0,0 +1,89 @@
+{
+  "publisher": {
+    "value": [
+      "Society for General Microbiology"
+    ]
+  },
+  "journal": {
+    "value": [
+      "International Journal of Systematic and Evolutionary\n                Microbiology"
+    ]
+  },
+  "title": {
+    "value": [
+      "Arthrobacter siccitolerans sp. nov., a highly desiccation-tolerant, xeroprotectant-producing strain isolated from dry soil"
+    ]
+  },
+  "authors": {
+    "value": [
+      "L. SantaCruz-Calvo",
+      "J. González-López",
+      "M. Manzanera"
+    ]
+  },
+  "date": {
+    "value": [
+      "11/01/2013"
+    ]
+  },
+  "doi": {
+    "value": [
+      "10.1099/ijs.0.052902-0"
+    ]
+  },
+  "volume": {
+    "value": [
+      "63"
+    ]
+  },
+  "issue": {
+    "value": [
+      "Pt 11"
+    ]
+  },
+  "firstpage": {
+    "value": [
+      "4174"
+    ]
+  },
+  "abstract": {
+    "value": [
+      "\n                  \n                      Next Section\n                  Abstract\n                  \n                  A novel desiccation-tolerant, xeroprotectant-producing bacterium, designated strain 4J27T, was isolated from a Nerium oleander rhizosphere subjected to seasonal drought in Granada, Spain. Phylogenetic analysis based on 16S rRNA gene sequencing placed\n                     the isolate within the genus Arthrobacter, its closest relative being Arthrobacter phenanthrenivorans Shep3 DSM 18606T, with which it showed 99.23 % 16S rRNA gene sequence similarity. DNA–DNA hybridization measurements showed less than 25 %\n                     relatedness between strain 4J27T and Arthrobacter phenanthrenivorans DSM 18606T. The DNA base composition of strain 4J27T was 65.3 mol%. The main fatty acids were anteiso C15 : 0, anteiso C17 : 0, C16 : 0 and iso C16 : 0 and the major menaquinone was MK-9 (H2). The peptidoglycan type was A3α with an l-Lys–l-Ser–l-Thr–l-Ala interpeptide bridge. The bacterium tested positive for catalase activity and negative for oxidase activity. Phylogenetic,\n                     chemotaxonomic and phenotypic analyses indicated that the desiccation-tolerant strain 4J27T represents a novel species within the genus Arthrobacter, for which the name Arthrobacter siccitolerans is proposed. The type strain is 4J27T ( = CECT 8257T = LMG 27359T).\n                  \n                  \n               "
+    ]
+  },
+  "fulltext_html": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4174.full"
+    ]
+  },
+  "fulltext_pdf": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4174.full.pdf"
+    ]
+  },
+  "supplementary_material": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4174/suppl/DC1"
+    ]
+  },
+  "figure": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4174/F1.small.gif"
+    ]
+  },
+  "figure_caption": {
+    "value": [
+      "Fig. 1.  \n                     \n                     Neighbour-joining phylogenetic tree based on 16S rRNA sequence comparisons of strain 4J27T and its 24 closest relatives. Streptomyces albus AS 4.164T was used as the outgroup. The numbers at bifurcations indicate how many times each species coincided in this position as\n                        percentages and only values > 50% are shown. Bar, 0.01 changes per nucleotide position.\n                     \n                     \n                     \n                  "
+    ]
+  },
+  "license": {
+    "value": [
+      "\n                  This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted\n                     use, distribution, and reproduction in any medium, provided the original work is properly cited.\n                  \n               "
+    ]
+  },
+  "copyright": {
+    "value": [
+      "Copyright ©\n                     \t\t2015 International Union of Microbiological Societies\n                     \t\n                  "
+    ]
+  }
+}
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/DC1 b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/DC1
new file mode 100644
index 00000000..a8f9850b
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/DC1
@@ -0,0 +1,357 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Supplementary material </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/ijs.0.052647-0/DC1" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-data-supp.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-data-supp.css" /><script type="text/javascript" id="session-d7801268e1">var callbackToken='5632E7F846A4E52';</script><script type="text/javascript" id="session-d7801268e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-data-supp.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-data-supp">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4218%2Fsuppl%2FDC1">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <h1 class="data-supp-article-title"><em>Prevotella jejuni</em> sp. nov., isolated from the small intestine of a child with coeliac disease
+            </h1>
+            <div><span class="highwire-journal-article-marker-start"></span><div class="auto-clean"><span style="font-family: Verdana,Arial,Helvetica,sans-serif;  font-size: 83.33%">
+                     
+                     
+                     <h2>Supplementary material</h2>
+                     
+                     <p><strong>Files in this Data Supplement:</strong></p>
+                     
+                     <ul>
+                        <li><a href="/content/suppl/2013/11/04/ijs.0.052647-0.DC1/ijs052647_forPAP.pdf">Supplementary material</a> 
+                           		
+                           
+                        </li>
+                     </ul>
+                     </span>
+                  
+                  
+               </div><span class="highwire-journal-article-marker-end"></span></div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              	<span class="slug-metadata-note ahead-of-print">
+                                 
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">June 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.052647-0" class="slug-doi">10.1099/ijs.0.052647-0</span>
+                                 </span>
+                              
+                              
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date">
+                                    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4218-4223
+                                    </span>
+                                 </cite>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4218.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4218.full" rel="view-full-text">Full Text</a><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4218.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a></li>
+                        <li><span class="variant-indicator">» <span>Supplementary material</span></span></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F1.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F1.small.gif
new file mode 100644
index 00000000..6f3a61dc
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F1.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F2.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F2.small.gif
new file mode 100644
index 00000000..700987a0
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F2.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.html b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.html
new file mode 100644
index 00000000..5f681458
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.html
@@ -0,0 +1,1390 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Prevotella jejuni sp. nov., isolated from the small intestine of a child with coeliac disease </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4218" />
+      <meta content="/ijs/63/Pt_11/4218.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Prevotella jejuni sp. nov., isolated from the small intestine of a child with coeliac disease"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.052647-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Maria E. Hedberg" name="DC.Contributor" />
+      <meta content="Anne Israelsson" name="DC.Contributor" />
+      <meta content="Edward R. B. Moore" name="DC.Contributor" />
+      <meta content="Liselott Svensson-Stadler" name="DC.Contributor" />
+      <meta content="Sun Nyunt Wai" name="DC.Contributor" />
+      <meta content="Grzegorz Pietz" name="DC.Contributor" />
+      <meta content="Olof Sandström" name="DC.Contributor" />
+      <meta content="Olle Hernell" name="DC.Contributor" />
+      <meta content="Marie-Louise Hammarström" name="DC.Contributor" />
+      <meta content="Sten Hammarström" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Maria E. Hedberg" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Anne Israelsson" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Edward R. B. Moore" />
+      <meta name="citation_author_institution"
+            content="2CCUG – Culture Collection University of Gothenburg, Department of Clinical Bacteriology, Sahlgrenska University Hospital, SE-41345 Göteborg, Sweden" />
+      <meta name="citation_author_institution"
+            content="3Department of Infectious Diseases, Sahlgrenska Academy of the University of Gothenburg, SE-40530 Göteborg, Sweden" />
+      <meta name="citation_author" content="Liselott Svensson-Stadler" />
+      <meta name="citation_author_institution"
+            content="2CCUG – Culture Collection University of Gothenburg, Department of Clinical Bacteriology, Sahlgrenska University Hospital, SE-41345 Göteborg, Sweden" />
+      <meta name="citation_author" content="Sun Nyunt Wai" />
+      <meta name="citation_author_institution"
+            content="4Department of Molecular Biology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Grzegorz Pietz" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Olof Sandström" />
+      <meta name="citation_author_institution"
+            content="5Department of Clinical Sciences, Pediatrics, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Olle Hernell" />
+      <meta name="citation_author_institution"
+            content="5Department of Clinical Sciences, Pediatrics, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Marie-Louise Hammarström" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Sten Hammarström" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta content="Prevotella jejuni sp. nov., isolated from the small intestine of a child with coeliac disease"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4218" name="citation_firstpage" />
+      <meta content="4223" name="citation_lastpage" />
+      <meta content="63/Pt_11/4218" name="citation_id" />
+      <meta content="63/Pt 11/4218" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4218" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.052647-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4218.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4218.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4218.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4218"
+            name="citation_public_url" />
+      <meta content="23793857" name="citation_pmid" />
+      <meta name="citation_access" content="all" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Bacteroidetes" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4207.short" rel="prev" />
+      <link href="/content/63/Pt_11/4224.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d7796104e1">var callbackToken='5632E7F846A4E52';</script><script type="text/javascript" id="session-d7796104e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search-go" id="header-qs-search-go-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4218.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline"><em>Prevotella jejuni</em> sp. nov., isolated from the small intestine of a child with coeliac disease
+               </h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Maria+E.+Hedberg&amp;sortspec=date&amp;submit=Submit">Maria E. Hedberg</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Anne+Israelsson&amp;sortspec=date&amp;submit=Submit">Anne Israelsson</a></span><a id="xref-aff-1-2" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Edward+R.+B.+Moore&amp;sortspec=date&amp;submit=Submit">Edward R. B. Moore</a></span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a><span class="xref-sep">,</span><a id="xref-aff-3-1" class="xref-aff" href="#aff-3"><sup>3</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-4" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Liselott+Svensson-Stadler&amp;sortspec=date&amp;submit=Submit">Liselott Svensson-Stadler</a></span><a id="xref-aff-2-2" class="xref-aff" href="#aff-2"><sup>2</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-5" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Sun+Nyunt+Wai&amp;sortspec=date&amp;submit=Submit">Sun Nyunt Wai</a></span><a id="xref-aff-4-1" class="xref-aff" href="#aff-4"><sup>4</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-6" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Grzegorz+Pietz&amp;sortspec=date&amp;submit=Submit">Grzegorz Pietz</a></span><a id="xref-aff-1-3" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-7" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Olof+Sandstr%C3%B6m&amp;sortspec=date&amp;submit=Submit">Olof Sandström</a></span><a id="xref-aff-5-1" class="xref-aff" href="#aff-5"><sup>5</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-8" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Olle+Hernell&amp;sortspec=date&amp;submit=Submit">Olle Hernell</a></span><a id="xref-aff-5-2" class="xref-aff" href="#aff-5"><sup>5</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-9" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Marie-Louise+Hammarstr%C3%B6m&amp;sortspec=date&amp;submit=Submit">Marie-Louise Hammarström</a></span><a id="xref-aff-1-4" class="xref-aff" href="#aff-1"><sup>1</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-10"><span class="name"><a class="name-search"
+                              href="/search?author1=Sten+Hammarstr%C3%B6m&amp;sortspec=date&amp;submit=Submit">Sten Hammarström</a></span><a id="xref-aff-1-5" class="xref-aff" href="#aff-1"><sup>1</sup></a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>CCUG – Culture Collection University of Gothenburg, Department of Clinical Bacteriology, Sahlgrenska University Hospital,
+                           SE-41345 Göteborg, Sweden
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-3" name="aff-3"></a><address><sup>3</sup>Department of Infectious Diseases, Sahlgrenska Academy of the University of Gothenburg, SE-40530 Göteborg, Sweden
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-4" name="aff-4"></a><address><sup>4</sup>Department of Molecular Biology, Umeå University, SE-90187 Umeå, Sweden
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-5" name="aff-5"></a><address><sup>5</sup>Department of Clinical Sciences, Pediatrics, Umeå University, SE-90187 Umeå, Sweden
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> Maria E. Hedberg <span class="em-link"><span class="em-addr">maria.hedberg{at}climi.umu.se</span></span> Sten Hammarström <span class="em-link"><span class="em-addr">sten.hammarstrom{at}climi.umu.se</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-4">Five obligately anaerobic, Gram-stain-negative, saccharolytic and proteolytic, non-spore-forming bacilli (strains CD3 : 27,
+                     CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32 and CD3 : 34) are described. All five strains were isolated from the small intestine of a female child
+                     with coeliac disease. Cells of the five strains were short rods or coccoid cells with longer filamentous forms seen sporadically.
+                     The organisms produced acetic acid and succinic acid as major metabolic end products. Phylogenetic analysis based on comparative
+                     16S rRNA gene sequence analysis revealed close relationships between CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33, between CD3 : 32 and <span class="named-content species" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Prevotella histicola"
+                           href="doi:10.1601/nm.13539"><em>Prevotella histicola</em></a></span> CCUG 55407<sup>T</sup>, and between CD3 : 34 and <span class="named-content species" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Prevotella melaninogenica"
+                           href="doi:10.1601/nm.8043"><em>Prevotella melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>. Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 were clearly different from all recognized species within the genus <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                           href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> and related most closely to but distinct from <span class="named-content species" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                           href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span>. Based on 16S rRNA, RNA polymerase β-subunit (<em>rpoB</em>) and 60 kDa chaperonin protein subunit (<em>cpn60</em>) gene sequencing, and phenotypic, chemical and biochemical properties, strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 are considered to represent a novel species within the genus <span class="named-content genus" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                           href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span>, for which the name <em>Prevotella jejuni</em> sp. nov. is proposed. Strain CD3 : 28<sup>T</sup> ( = CCUG 60371<sup>T</sup> = DSM 26989<sup>T</sup>) is the type strain of the proposed novel species. All five strains were able to form homologous aggregates, in which tube-like
+                     structures were connecting individual bacterial cells. The five strains were able to bind to human intestinal carcinoma cell
+                     lines at 37 °C.
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-other" id="fn-1">
+                        <p id="p-1">The GenBank/EMBL/DDBJ accession number for the 16S rRNA gene sequence of strain CD3 : 28<sup>T</sup> is JQ778983.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-2">
+                        <p id="p-2">One supplementary figure and three supplementary tables are available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="license" id="license-1">
+                  <p id="p-3">This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted
+                     use, distribution, and reproduction in any medium, provided the original work is properly cited.
+                  </p>
+               </div>
+               <p id="p-12">Coeliac disease (CD) is an immune-mediated enteropathy with a multifactorial aetiology. Early childhood infections have been
+                  shown to be a risk factor for CD (<a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Myléus <em>et al.</em>, 2012</a>). Also, the jejunal microbiota is considered to play a role in the pathogenesis of CD (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Olivares <em>et al.</em>, 2013</a>). This is supported by epidemiological data from Sweden showing that childhood CD has features of an infectious disease with
+                  a peak incidence between 1985 and 1996 in children younger than 2 years of age, a period referred to as ‘the Swedish CD epidemic’
+                  (<a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">Ivarsson <em>et al.</em>, 2000</a>). A similar increase in incidence was seen later, during 2001–2004 (<a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Olsson <em>et al.</em>, 2008</a>; Namatovu, F. <em>et</em> <em>al.</em>, unpublished data). After both peaks, incidence returned to normal. We have shown that CD patients born during ‘the Swedish
+                  CD epidemic’ had a significant enrichment of mucosa-associated rod-shaped bacteria of the order <span class="named-content order" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Clostridiales"
+                        href="doi:10.1601/nm.3876"><em>Clostridiales</em></a></span>, and genera <span class="named-content genus" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> and <span class="named-content genus" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Actinomyces"
+                        href="doi:10.1601/nm.5771"><em>Actinomyces</em></a></span> in the jejunum (<a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Forsberg <em>et al.</em>, 2004</a>; <a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Ou <em>et al.</em>, 2009</a>). Recently, we characterized a novel species of a new genus, <span class="named-content species" id="named-content-9"><a class="namesforlife" rel="namesforlife-name"
+                        title="Lachnoanaerobaculum umeaense"
+                        href="doi:10.1601/nm.23523"><em>Lachnoanaerobaculum umeaense</em></a></span>, that had been isolated from the jejunal mucosa of a child born during ‘the Swedish CD epidemic’ (<a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Hedberg <em>et al.</em>, 2012</a>). We assumed that this bacterium corresponded to the prevalent bacteria of the order <span class="named-content order" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Clostridiales"
+                        href="doi:10.1601/nm.3876"><em>Clostridiales</em></a></span> we had previously reported (<a id="xref-ref-16-2" class="xref-bibr" href="#ref-16">Ou <em>et al.</em>, 2009</a>). To further characterize the microbiota of the small intestine of children with CD born during the first epidemic we have
+                  now studied isolates of the genus <span class="named-content genus" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span>.
+               </p>
+               <p id="p-13">At the time of writing, 48 species of the genus <span class="named-content genus" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> have been described (<a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Euzéby, 2013</a>). The vast majority were isolated from humans, with the oral cavity being the main source (<a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Dewhirst <em>et al.</em>, 2010</a>). However, <span class="named-content genus" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> species have also been isolated from faeces (<a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Hayashi <em>et al.</em>, 2007</a>), the female genital tract, skin and respiratory tract, and from the rumen and hindgut of non-human mammals (<a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Alauzet <em>et al.</em>, 2010</a>). Until now, no species of the genus <span class="named-content genus" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> from the human small intestine had been characterized. Species of the genus <span class="named-content genus" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> are generally considered to be non-pathogenic or opportunistic pathogens. However, they have been shown to be involved in
+                  serious infections, and virulence factors such as haemolysins, haemagglutinins, fimbrial adhesins, proteases and phospholipases
+                  have been demonstrated in strains of several species (<a id="xref-ref-1-2" class="xref-bibr" href="#ref-1">Alauzet <em>et al.</em>, 2010</a>).
+               </p>
+               <p id="p-14">This study describes the phenotypic and genotypic characterization of strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33, representing isolates of a novel species, CD3 : 32, probably a strain of <span class="named-content species" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Prevotella histicola"
+                        href="doi:10.1601/nm.13539"><em>Prevotella histicola</em></a></span> (<a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">Downes <em>et al.</em>, 2008</a>), and CD3 : 34, probably a strain of <span class="named-content species" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Prevotella melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>Prevotella melaninogenica</em></a></span> (<a id="xref-ref-19-1" class="xref-bibr" href="#ref-19">Shah &amp; Collins, 1990</a>). Additionally, we describe the phylogenetic relationships between the five isolates and other members of the genus <span class="named-content genus" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span>, based upon comparative 16S rRNA gene sequence analyses. Moreover, the five isolates have been subjected to whole genome
+                  sequencing (WGS) using 454 pyro-sequencing technology (GS Junior; Roche Diagnostics), and the sequences of the genes encoding
+                  chaperonin 60 (<em>cpn60</em>) and DNA-directed RNA polymerase subunit-β (<em>rpoB</em>) have also been compared.
+               </p>
+               <p id="p-15">The five strains were isolated from a biopsy of the proximal small intestine of a girl with CD, born in 1995, i.e. during
+                  the 1985–1996 Swedish CD epidemic. She was on a gluten-free diet when the biopsy was taken at the Department of Paediatrics,
+                  Umeå University Hospital, Umeå, in 2007. Informed consent was obtained from her parents. The study was approved by the local
+                  Research Ethics Committee of the Faculty of Medicine (Um dnr: 96-304 and 04-156). The biopsy was weighed, homogenized and
+                  serially diluted ten-fold in Fastidious Anaerobe Broth medium (Lab M) and immediately plated onto selective and non-selective
+                  agar media. All <span class="named-content genus" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> strains were primarily isolated on blood agar plates [Columbia Blood Agar Base (Acumedia), supplemented with 5 % defibrinated
+                  horse blood]. <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup>, <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> and <span class="named-content species" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="Prevotella stercorea"
+                        href="doi:10.1601/nm.10959"><em>Prevotella stercorea</em></a></span> CCUG 55595<sup>T</sup> were obtained from the Culture Collection University of Gothenburg (CCUG; <a href="http://www.ccug.se">http://www.ccug.se</a>).
+               </p>
+               <p id="p-16">Pure cultures of the five strains grew well on blood agar plates and in Brucella broth (BBL) supplemented with vitamin K (1
+                  µg ml<sup>−1</sup>) and haemin (5 µg ml<sup>−1</sup>) under an anaerobic atmosphere (10 % H<sub>2</sub>, 5 % CO<sub>2</sub> in N<sub>2</sub>) at 37 °C.
+               </p>
+               <p id="p-17">Colony morphologies and the results of presumptive identification tests by diagnostic discs (<a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Jousimies-Somer <em>et al.</em>, 2002</a>) were examined on blood agar plates after incubation for 3–5 days. None of the five strains grew in the presence of oxygen
+                  and they should be considered strictly anaerobic. Growth was improved and pigmentation and haemolytic activity increased if
+                  the atmosphere contained 10 % CO<sub>2</sub> and 5 % H<sub>2</sub> as compared with standard conditions. The appearance of the colonies of the five strains differed: isolate CD3 : 27 had circular,
+                  raised, convex, weakly to moderately pigmented and strongly haemolytic colonies; CD3 : 28<sup>T</sup> and CD3 : 33 had circular, convex, weakly pigmented, weakly haemolytic colonies; CD3 : 32 had circular, slightly raised and
+                  brown-reddish pigmented colonies with a shiny ‘wet’ appearance. Moreover, the centres of the colonies of CD3 : 32 were darker
+                  than the outer part. Colonies of CD3 : 34 were similar to those of CD3 : 28<sup>T</sup> and CD3 : 33, but with a surface appearing ‘drier’ (Fig. S1 available in IJSEM Online).
+               </p>
+               <p id="p-18">Light microscopy after Gram staining, dark field microscopy, scanning electron microscopy (SEM) and transmission electron
+                  microscopy (TEM) were used to investigate cell morphologies. Cells of the five strains were rod-shaped, 0.7×0.8–2 µm in size,
+                  occurring most often as short rods or as coccoid cells, with longer filamentous forms (&gt;10 µm) seen sporadically. All five
+                  strains were Gram-stain-negative and lacked spores. SEM revealed that all five strains, particularly if grown on agar medium,
+                  as opposed to in liquid culture, formed large aggregates of bacterial cells connected to each other by multiple, thin, straight,
+                  rod-shaped structures (<a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1a–c</a>). Cells of strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 showed a similar degree of interconnectivity. Outer membrane vesicles were frequently observed. Analysis of
+                  thin sections of the aggregates by TEM suggested that the rod-shaped structures were hollow, characterized as tubes connecting
+                  cells to each other (<a id="xref-fig-1-2" class="xref-fig" href="#F1">Fig. 1d</a>).
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4218/F1.expansion.html"><img alt="Fig. 1. " src="4218/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4218/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4218/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4218/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-19" class="first-child">Scanning electron micrographs showing surface structures of cells of <em>P. jejuni</em>, strains CD3 : 27 (a) and CD3 : 28<sup>T</sup> (b) and <em>P. histicola</em> strain CD3 : 32 (c). (d) Transmission electron micrograph of a cell of strain <em>P. jejuni</em> CD3 : 33; arrows indicate cross-section of the tube-like structures shown in (a)–(c) and arrowheads indicate outer membrane
+                        vesicles. Bars, 0.2 µm (a, b, d); 1 µm (c).
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-20">All five strains exhibited a temperature optimum for growth at 37 °C. The optimal pH for growth was 6–7 with reduced growth
+                  at pH 5.5 and 7.5. Motility was not observed. All five strains were haemolytic and produced NH<sub>3</sub>. Growth on glucose as the sole carbon source yielded acetic acid, succinic acid and small amounts of isovaleric acid for
+                  strains CD3 : 27, CD3 : 32 and CD3 : 34, and acetic acid and succinic acid for strains CD3 : 28<sup>T</sup> and CD3 : 33.
+               </p>
+               <p id="p-21">The nucleotide sequences of the 16S rRNA genes of strains CD3 : 27, CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32 and CD3 : 34 were determined by primer walking, covering the gene, and by cloning and sequencing of PCR
+                  amplification fragments also covering the gene (<a id="xref-ref-9-2" class="xref-bibr" href="#ref-9">Hedberg <em>et al.</em>, 2012</a>). These sequences were subsequently confirmed by genomic sequencing, allowing us to establish that there was only one copy
+                  of the 16S rRNA gene per genome. Other 16S rRNA gene sequences for comparative analyses were retrieved from the NCBI database
+                  (<a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Sayers <em>et al.</em>, 2010</a>). Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 shared &gt;99.8 % 16S rRNA gene sequence similarity with each other and 98.1–98.3 % similarity with <span class="named-content species" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> (AY323525), <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> (AB547685), N 12-20 (EU126662), CD3 : 34 and CD3 : 32, and 97.3–97.7 % similarity with <span class="named-content species" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="Prevotella veroralis"
+                        href="doi:10.1601/nm.8066"><em>Prevotella veroralis</em></a></span> CCUG 15422<sup>T</sup> (AY836507). Strain CD3 : 32 was related most closely to <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> (AB547685 and EU126662) showing &gt;99.6 % sequence similarity. Strain CD3 : 34 showed 99.8 % sequence similarity to <span class="named-content species" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> (AY323525 and NC-014370). <a id="xref-fig-2-1" class="xref-fig" href="#F2">Fig. 2</a> shows the phylogenetic tree reconstructed using the maximum composite likelihood model based on 16S rRNA gene sequences.
+                  Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 formed a separate group distinct from recognized species of the genus <span class="named-content genus" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> while strain CD3 : 32 clustered with <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> and strain CD3 : 34 with <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span>.
+               </p>
+               <div id="F2" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4218/F2.expansion.html"><img alt="Fig. 2. " src="4218/F2.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4218/F2.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4218/F2.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4218/F2">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 2. </span> 
+                     
+                     <p id="p-22" class="first-child">Phylogenetic tree based on 16S rRNA gene sequences showing the relationships between strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 and related species. The 16S rRNA gene sequence of <span class="named-content species" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="Porphyromonas gingivalis"
+                              href="doi:10.1601/nm.8029"><em>Porphyromonas gingivalis</em></a></span> ATCC 33277<sup>T</sup> served as an outgroup. Bar, 0.02 substitutions per nucleotide position.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-23">Genomic DNA–DNA reassociation analysis was carried out using the hybridization protocols described by <a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Urdiain <em>et al.</em> (2008)</a>. Strain CD3 : 28<sup>T</sup> hybridized to a high level (95–112 %) with strains CD3 : 27 and CD3 : 33, confirming that these three strains belong to the
+                  same species. The level of hybridization between strain CD3 : 28<sup>T</sup> and <span class="named-content species" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup>, <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>, <span class="named-content species" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="Prevotella scopos"
+                        href="doi:10.1601/nm.21331"><em>Prevotella scopos</em></a></span> CCUG 57945<sup>T</sup> and <span class="named-content species" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="P. veroralis"
+                        href="doi:10.1601/nm.8066"><em>P. veroralis</em></a></span> CCUG 15422<sup>T</sup> was below 43 %. Levels of hybridization between strain CD3 : 28<sup>T</sup> and strains CD3 : 32 and CD3 : 34 were 49 and 59 % respectively. The level of hybridization between <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> and strain CD3 : 34 was high (104 %), while that between strain CD3 : 34 and strain CD3 : 28<sup>T</sup> was 51 %. <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> hybridized to a low level (30 %) with <span class="named-content species" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup>. The coefficient of variation was less than 5.5 %. As the genomic DNA hybridization values were well below 70 % for strains
+                  CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 on the one hand and strains CD3 : 32 or CD3 : 34 on the other, the strains can be considered to represent different
+                  species (<a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Stackebrandt &amp; Goebel, 1994</a>).
+               </p>
+               <p id="p-24">To shed further light on whether CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 should be considered as strains of the same novel species we compared the nucleotide sequences of the <em>rpoB</em> and <em>cpn60</em> genes (<a id="xref-ref-1-3" class="xref-bibr" href="#ref-1">Alauzet <em>et al.</em>, 2010</a>; <a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Sakamoto &amp; Ohkuma, 2010</a>). Similarly, we compared strain CD3 : 32 with <span class="named-content species" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> and strain CD3 : 34 with <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span>. The <em>rpoB</em> and <em>cpn60</em> (3810 and 1626 nt respectively) gene sequences were 100.0 % identical between strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33. Sequence similarity between CD3 : 32 and <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> F0411 was 99.3 % for <em>rpoB</em> and 98.7 % for <em>cpn60</em>. Strain CD3 : 34 and <span class="named-content species" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> shared 98.3 % <em>rpoB</em> gene sequence similarity and 97.7 % <em>cpn60</em> gene sequence similarity.
+               </p>
+               <p id="p-25">The sizes of the genomes and the DNA G+C contents of the five strains were determined from WGS data (<a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>). Strains CD3 : 28<sup>T</sup> and CD3 : 33 had almost the same genome size, 3.81×10<sup>6</sup> and 3.80×10<sup>6</sup> bp, respectively, while CD3 : 27 had a size of 3.68×10<sup>6</sup> bp. The genome of strain CD3 : 32 had a size of 3.20×10<sup>6</sup> bp, larger than that of the closely related <span class="named-content species" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> F0411 (2.99×10<sup>6</sup> bp). The genome size of strain CD3 : 34 was 3.27×10<sup>6</sup> bp, about 102×10<sup>3</sup> bp larger than that of <span class="named-content species" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>. The DNA G+C contents of the strains grouped together, in that strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 had values of 41.7–41.8 mol%, CD3 : 32 and <span class="named-content species" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> F0411 had values of 41.1 and 41.2 mol%, respectively, and CD3 : 34 and <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> values of 40.7 and 41.0 mol%, respectively.
+               </p>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4218/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4218/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Genome size and DNA G+C content of <em>Prevotella jejuni</em> sp. nov., and the other two <span class="named-content genus" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                              href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> isolates from human small intestine compared with <span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                              href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> and <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                              href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span></span>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-28">Cellular fatty acid (CFA) methyl ester analyses were performed using a standardized protocol (<a href="http://www.ccug.se/pages/CFA_method_2008">http://www.ccug.se/pages/CFA_method_2008</a> and as detailed by <a id="xref-ref-9-3" class="xref-bibr" href="#ref-9">Hedberg <em>et al.</em>, 2012</a>). Strains were grown anaerobically (10 % H<sub>2</sub>, 5 % CO<sub>2</sub> in N<sub>2</sub>), using chocolate agar as culture medium at 37 °C, and harvested after 48 h. CFAs were extracted and saponified by mild alkaline
+                  methanolysis and released fatty acids were methylated. CFAs were identified and quantified by GC (Hewlett Packard HP 5890).
+                  Retention times of CFA peaks were converted to equivalent chain-length values and the relative amount (w/w) of each fatty
+                  acid was expressed as a percentage of the total fatty acids in the profile of the respective strain (Table S1). The major
+                  CFAs detected in strains CD3 : 27, CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32 and CD3 : 34 were iso-C<sub>15 : 0</sub>, anteiso-C<sub>15 : 0</sub>, C<sub>16 : 0</sub>, C<sub>18 : 2</sub>ω6,9<em>c</em>/anteiso-C<sub>18 : 0</sub> and iso-C<sub>17 : 0</sub> 3-OH. These five CFAs occurred in approximately the same relative amounts in the five strains with anteiso-C<sub>15 : 0</sub> accounting for 38.5–42.5 % of the total CFAs. Interestingly, strains CD3 : 27, CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32 and CD3 : 34 were more similar to each other than were CD3 : 32 to <span class="named-content species" id="named-content-52"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> or CD3 : 34 to <span class="named-content species" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> (Table S1). The similarities between the five jejunal isolates, although representing three different species, are perhaps
+                  a reflection of the fact that they were isolated from the same organ of one individual.
+               </p>
+               <p id="p-29">Analysis of metabolic and biochemical characteristics (rapid ID 32A, API 20A and APIZYM; bioMérieux) showed that the five
+                  strains are saccharolytic and proteolytic (Table S2). Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 demonstrated an almost identical pattern of biochemical characteristics. The only difference observed was that
+                  strain CD3 : 33 had α-galactosidase activity, while the other two strains did not. CD3 : 32 and <span class="named-content species" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> showed an identical pattern of biochemical characteristics and the same was true for the comparison between CD3 : 34 and
+                  <span class="named-content species" id="named-content-55"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>. Sialidase activity was detected using 2′-(4-methylumbelliferyl)α-<span class="sc">d</span>-<em>N</em>-acetylneuraminic acid as substrate (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Moncla &amp; Braham, 1989</a>). All strains produced sialidase except CD3 : 32 and <span class="named-content species" id="named-content-56"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup>.
+               </p>
+               <p id="p-30">By disc diffusion it was shown that all five isolates and <span class="named-content species" id="named-content-57"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> were resistant to vancomycin (5 µg) but susceptible to kanamycin (1 mg), colistin (10 µg) (Oxoid) and bile (1000 µg) (Oxgall
+                  tablets; Rosco Diagnostica), whereas <span class="named-content species" id="named-content-58"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> was resistant to vancomycin and kanamycin but susceptible to colistin and bile. <span class="named-content species" id="named-content-59"><a class="namesforlife" rel="namesforlife-name" title="P. stercorea"
+                        href="doi:10.1601/nm.10959"><em>P. stercorea</em></a></span> CCUG 55595<sup>T</sup> was resistant to kanamycin and colistin but susceptible to bile and unexpectedly also susceptible to vancomycin (<a id="xref-ref-11-2" class="xref-bibr" href="#ref-11">Jousimies-Somer <em>et al.</em>, 2002</a>). Because the bacteria were isolated from the small intestine adjacent to the bile duct, susceptibility to bile was investigated
+                  further using an agar dilution technique. A stock solution containing 320 mM synthetic bile acids (taurocholate, 134.4 mM;
+                  taurochenodeoxycholate, 83.2 mM; glycocholate, 70.4 mM; glycochenodeoxycholate, 32 mM) yielded final concentrations of 0.125–16
+                  mM bile acids in the assay. Interestingly, growth and haemolytic activity of all five jejunum isolates were stimulated at
+                  low concentrations of bile (0.5–1.5 mM) compared with medium without bile, while growth was inhibited at higher bile concentrations
+                  (2–8 mM).
+               </p>
+               <p id="p-31">Susceptibility to penicillin G was tested using MIC Evaluator Strips (Oxoid). Strains CD3 : 32, CD3 : 34 and <span class="named-content species" id="named-content-60"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> were resistant (MIC &gt;32 µg ml<sup>−1</sup>). The other strains were susceptible to penicillin G, with MICs ranging from 0.003 to 0.015 µg ml<sup>−1</sup>. According to the nitrocefin disc test (Remel), strains CD3 : 32, CD3 : 34 and <span class="named-content species" id="named-content-61"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> produce β-lactamase. WGS revealed the presence of the <em>cfxA</em> β-lactamase gene in strains CD3 : 32 and CD3 : 34, but not in <span class="named-content species" id="named-content-62"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> F0411, the only other <span class="named-content species" id="named-content-63"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> isolate that has been sequenced so far, or <span class="named-content species" id="named-content-64"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>. Strains CD3 : 32 and CD3 : 34 shared 100 and 99 % <em>cfxA</em> gene sequence similarity with <span class="named-content species" id="named-content-65"><a class="namesforlife" rel="namesforlife-name" title="Prevotella marshii"
+                        href="doi:10.1601/nm.9557"><em>Prevotella marshii</em></a></span> CCUG 50419<sup>T</sup>, respectively.
+               </p>
+               <p id="p-32">The abilities of strains CD3 : 27, CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32, CD3 : 34, <span class="named-content species" id="named-content-66"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> and <span class="named-content species" id="named-content-67"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> to agglutinate human erythrocytes were investigated. Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 strongly agglutinated human O and AB erythrocytes; there was no difference in the strength of the agglutination
+                  reaction between the three strains, nor was there a difference in their ability to agglutinate AB versus O red blood cells.
+                  Strain CD3 : 34 showed a weak agglutination reaction while strains CD3 : 32, <span class="named-content species" id="named-content-68"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> and <span class="named-content species" id="named-content-69"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> were negative. The finding that some strains of <span class="named-content species" id="named-content-70"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> are able to weakly agglutinate red blood cells (<a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Haraldsson <em>et al.</em>, 2005</a>) is in agreement with our results.
+               </p>
+               <p id="p-33">To confirm that the five jejunal isolates were able to bind to intestinal epithelial cells, binding of PKH-2 fluorescence
+                  dye-labelled bacteria to PKH-26 fluorescence dye-labelled intestinal epithelial cells was studied by flow cytometry (<a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Hara-Kaonga &amp; Pistole, 2007</a>). Binding was evaluated after incubation at 37 °C and at 4 °C for 1 h. The cell lines were T84 (colon carcinoma), LS174T
+                  (colon carcinoma), HT29 (small intestine-like carcinoma) and Int407 (fetal small intestine epithelial cells), all obtained
+                  from the American Type Culture Collection (Rockville, MD). At 37 °C, all five isolates were able to bind to the four cell
+                  lines with two exceptions: strains CD3 : 27 and CD3 : 28<sup>T</sup> did not bind to LS174T cells (Table S3).
+               </p>
+               <p id="p-34">We conclude that strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 represent a novel species of the genus <span class="named-content genus" id="named-content-71"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span>, for which the name <em>Prevotella jejuni</em> sp. nov. is proposed, that CD3 : 32 is a strain of <span class="named-content species" id="named-content-72"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> and that CD3 : 34 is a strain of <span class="named-content species" id="named-content-73"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span>. The latter two jejunal isolates have larger genome sizes than the corresponding previously characterized strains. All five
+                  jejunal isolates are able to bind to human intestinal epithelial cells.
+               </p>
+               <div class="section" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  
+                  <div id="sec-2" class="subsection">
+                     
+                     <h3>Description of <em>Prevotella jejuni</em> sp. nov.
+                     </h3>
+                     
+                     <p id="p-35"><em>Prevotella jejuni</em> (je.ju′ni. L. gen. n. <em>jejuni</em> of or from the jejunum, referring to the isolation of the type strain from the jejunum).
+                     </p>
+                     
+                     <p id="p-36">The description is based on three strains isolated from the human jejunum. Cells are obligately anaerobic, non-motile, Gram-stain-negative
+                        bacilli (0.7×0.8–2 µm). After 3–5 days of incubation on blood agar plates, colonies are 1–2 mm in diameter, circular, convex,
+                        weakly to moderately pigmented and weakly to strongly haemolytic. The optimum conditions for growth are 37 °C and pH 6–7.
+                        Acetic acid, succinic acid and small amounts of isovaleric acid are produced from glucose. NH<sub>3</sub> is produced. Cells are saccharolytic and proteolytic and are able to ferment glucose, lactose, maltose, mannose, raffinose
+                        and sucrose, but not arabinose, cellobiose, mannitol, melezitose, rhamnose, salicin, sorbitol, trehalose or xylose. Positive
+                        for activity of β-galactosidase, β-galactosidase-6-phosphate, α-glucosidase, <em>N</em>-acetyl-β-glucosaminidase, α-fucosidase, sialidase, acid phosphatase, alkaline phosphatase, naphthol-AS-BI-phosphate, arginine
+                        arylamidase, alanine arylamidase, leucine arylamidase and leucyl glycine arylamidase (Table S2). Gelatin is hydrolysed but
+                        aesculin is not. Cells agglutinate human AB and O erythrocytes and bind to several human intestinal cell lines. The predominant
+                        CFA is anteiso-C<sub>15 : 0</sub>, accounting for 42.5 % of the total CFA profile. 
+                     </p>
+                     
+                     <p id="p-37">The type strain is CD3 : 28<sup>T</sup> ( = CCUG 60371<sup>T</sup> = DSM 26989<sup>T</sup>), which was isolated from a biopsy of the small intestine of a child with CD. Strains CD3 : 27 ( = CCUG 60308) and CD3 : 33
+                        ( = CCUG 60311) are additional strains of this species. The DNA G+C content of the type strain is 41.7 mol%.
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-38">Funding was provided by: the Swedish Research Council, Natural Sciences and Engineering Sciences (no. 2010-5669); the TORNADO-project
+                     within the 7th framework program theme (grant agreement no. 222720-2); the Fund for Biotechnology-oriented Basic Science at
+                     Umeå University; the County of Västerbotten; and the Medical Faculty of Umeå University. The funders had no role in study
+                     design, data collection and analysis, decision to publish, or preparation of the manuscript.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.1"
+                             data-doi="10.2217/fmb.10.126">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alauzet</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Marchandin</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lozniewski</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">New insights into <em>Prevotella</em> diversity and medical microbiology</span>. <abbr class="cit-jnl-abbrev">Future Microbiol</abbr> <span class="cit-vol">5</span>, <span class="cit-fpage">1695</span>–<span class="cit-lpage">1718</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.2217/fmb.10.126</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21133690</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.2217/fmb.10.126&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=21133690&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=New%20insights%20into%20Prevotella%20diversity%20and%20medical%20microbiology&amp;author=C.%20Alauzet&amp;author=H.%20Marchandin&amp;author=A.%20Lozniewski&amp;publication_year=2010&amp;journal=Future%20Microbiol&amp;volume=5&amp;pages=1695-1718&amp;doi=10.2217%2Ffmb.10.126&amp;pmid=21133690">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.2"
+                             data-doi="10.1128/JB.00542-10">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dewhirst</span>,  <span class="cit-name-given-names">F. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chen</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Izard</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Paster</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tanner</span>,  <span class="cit-name-given-names">A. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yu</span>,  <span class="cit-name-given-names">W. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lakshmanan</span>,  <span class="cit-name-given-names">A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wade</span>,  <span class="cit-name-given-names">W. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">The human oral microbiome</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">192</span>, <span class="cit-fpage">5002</span>–<span class="cit-lpage">5017</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JB.00542-10</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20656903</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=192/19/5002"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.3"
+                             data-doi="10.1099/ijs.0.65656-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Downes</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hooper</span>,  <span class="cit-name-given-names">S. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wilson</span>,  <span class="cit-name-given-names">M. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wade</span>,  <span class="cit-name-given-names">W. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><em>Prevotella histicola</em> sp. nov., isolated from the human oral cavity</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">58</span>, <span class="cit-fpage">1788</span>–<span class="cit-lpage">1791</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.65656-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18676457</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=58/8/1788"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-other" id="cit-63.Pt_11.4218.4">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Euzéby</span>,  <span class="cit-name-given-names">J. P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title">List of prokaryotic names with standing in nomenclature</span>. <a href="http://www.bacterio.cict.fr/classifgenerafamilies.html">www.bacterio.cict.fr/classifgenerafamilies.html</a></cite></div>
+                           <div class="cit-extra"></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.5"
+                             data-doi="10.1111/j.1572-0241.2004.04157.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Forsberg</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fahlgren</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hörstedt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hernell</span>,  <span class="cit-name-given-names">O.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">M.-L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Presence of bacteria and innate immunity of intestinal epithelium in childhood celiac disease</span>. <abbr class="cit-jnl-abbrev">Am J Gastroenterol</abbr> <span class="cit-vol">99</span>, <span class="cit-fpage">894</span>–<span class="cit-lpage">904</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1572-0241.2004.04157.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15128357</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1572-0241.2004.04157.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=15128357&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Presence%20of%20bacteria%20and%20innate%20immunity%20of%20intestinal%20epithelium%20in%20childhood%20celiac%20disease&amp;author=G.%20Forsberg&amp;author=A.%20Fahlgren&amp;author=P.%20H%C3%B6rstedt&amp;author=S.%20Hammarstr%C3%B6m&amp;author=O.%20Hernell&amp;author=M.-L.%20Hammarstr%C3%B6m&amp;publication_year=2004&amp;journal=Am%20J%20Gastroenterol&amp;volume=99&amp;pages=894-904&amp;doi=10.1111%2Fj.1572-0241.2004.04157.x&amp;pmid=15128357">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.6"
+                             data-doi="10.1016/j.mimet.2006.11.017">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hara-Kaonga</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pistole</span>,  <span class="cit-name-given-names">T. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">A dual fluorescence flow cytometric analysis of bacterial adherence to mammalian host cells</span>. <abbr class="cit-jnl-abbrev">J Microbiol Methods</abbr> <span class="cit-vol">69</span>, <span class="cit-fpage">37</span>–<span class="cit-lpage">43</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.mimet.2006.11.017</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17222473</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.mimet.2006.11.017&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=17222473&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20dual%20fluorescence%20flow%20cytometric%20analysis%20of%20bacterial%20adherence%20to%20mammalian%20host%20cells&amp;author=B.%20Hara-Kaonga&amp;author=T.%20G.%20Pistole&amp;publication_year=2007&amp;journal=J%20Microbiol%20Methods&amp;volume=69&amp;pages=37-43&amp;doi=10.1016%2Fj.mimet.2006.11.017&amp;pmid=17222473">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.7"
+                             data-doi="10.1016/j.anaerobe.2005.02.004">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Haraldsson</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Meurman</span>,  <span class="cit-name-given-names">J. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Könönen</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Holbrook</span>,  <span class="cit-name-given-names">W. P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Properties of hemagglutination by <em>Prevotella melaninogenica</em></span>. <abbr class="cit-jnl-abbrev">Anaerobe</abbr> <span class="cit-vol">11</span>, <span class="cit-fpage">285</span>–<span class="cit-lpage">289</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.anaerobe.2005.02.004</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16701585</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.anaerobe.2005.02.004&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=16701585&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Properties%20of%20hemagglutination%20by%20Prevotella%20melaninogenica&amp;author=G.%20Haraldsson&amp;author=J.%20H.%20Meurman&amp;author=E.%20K%C3%B6n%C3%B6nen&amp;author=W.%20P.%20Holbrook&amp;publication_year=2005&amp;journal=Anaerobe&amp;volume=11&amp;pages=285-289&amp;doi=10.1016%2Fj.anaerobe.2005.02.004&amp;pmid=16701585">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.8"
+                             data-doi="10.1099/ijs.0.64778-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hayashi</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Shibata</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sakamoto</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tomita</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Benno</span>,  <span class="cit-name-given-names">Y.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title"><em>Prevotella copri</em> sp. nov. and <em>Prevotella stercorea</em> sp. nov., isolated from human faeces</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">57</span>, <span class="cit-fpage">941</span>–<span class="cit-lpage">946</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.64778-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17473237</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=57/5/941"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.9"
+                             data-doi="10.1099/ijs.0.033613-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hedberg</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">E. R. B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Svensson-Stadler</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hörstedt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baranov</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hernell</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nyunt Wai</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">M.-L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title"><em>Lachnoanaerobaculum</em> gen. nov., a new genus in the <em>Lachnospiraceae</em>; characterization of <em>Lachnoanaerobaculum umeaense</em> gen. nov., sp. nov., isolated from the human small intestine, <em>Lachnoanaerobaculum orale</em> sp. nov., isolated from saliva and reclassification of <em>Eubacterium saburreum</em> (Prévot) Holdeman and Moore 1970 as <em>Lachnoanaerobaculum saburreum</em> comb. nov.</span> <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">62</span>, <span class="cit-fpage">2685</span>–<span class="cit-lpage">2690</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.033613-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22228654</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=62/Pt_11/2685"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.10"
+                             data-doi="10.1080/080352500750028771">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ivarsson</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Persson</span>,  <span class="cit-name-given-names">L.-Å.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nyström</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ascher</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cavell</span>,  <span class="cit-name-given-names">B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Danielsson</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dannaeus</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lindberg</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lindquist</span>,  <span class="cit-name-given-names">B.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2000</span><strong>).</strong> <span class="cit-article-title">Epidemic of coeliac disease in Swedish children</span>. <abbr class="cit-jnl-abbrev">Acta Paediatr</abbr> <span class="cit-vol">89</span>, <span class="cit-fpage">165</span>–<span class="cit-lpage">171</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1651-2227.2000.tb01210.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>10709885</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1080/080352500750028771&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=10709885&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Epidemic%20of%20coeliac%20disease%20in%20Swedish%20children&amp;author=A.%20Ivarsson&amp;author=L.-%C3%85.%20Persson&amp;author=L.%20Nystr%C3%B6m&amp;author=H.%20Ascher&amp;author=B.%20Cavell&amp;author=L.%20Danielsson&amp;author=A.%20Dannaeus&amp;author=T.%20Lindberg&amp;author=B.%20Lindquist&amp;publication_year=2000&amp;journal=Acta%20Paediatr&amp;volume=89&amp;pages=165-171&amp;doi=10.1111%2Fj.1651-2227.2000.tb01210.x&amp;pmid=10709885">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4218.11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jousimies-Somer</span>,  <span class="cit-name-given-names">H. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Summanen</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Citron</span>,  <span class="cit-name-given-names">D. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baron</span>,  <span class="cit-name-given-names">E. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wexler</span>,  <span class="cit-name-given-names">H. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Finegold</span>,  <span class="cit-name-given-names">S. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-source">Wadsworth-KTL anaerobic bacteriology manual</span>, <span class="cit-edition">6th edn</span>. <span class="cit-publ-loc">Belmont, CA</span>: <span class="cit-publ-name">Star Publishing Company</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Wadsworth-KTL%20anaerobic%20bacteriology%20manual&amp;author=H.%20R.%20Jousimies-Somer&amp;author=P.%20Summanen&amp;author=D.%20M.%20Citron&amp;author=E.%20J.%20Baron&amp;author=H.%20M.%20Wexler&amp;author=S.%20M.%20Finegold&amp;publication_year=2002">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.12">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moncla</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Braham</span>,  <span class="cit-name-given-names">P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989</span><strong>).</strong> <span class="cit-article-title">Detection of sialidase (neuraminidase) by using 2′-(4-methylumbelliferyl)α-<span class="sc">d</span>-<em>N</em>-acetylneuraminic acid in a filter paper spot test</span>. <abbr class="cit-jnl-abbrev">J Clin Microbiol</abbr> <span class="cit-vol">27</span>, <span class="cit-fpage">182</span>–<span class="cit-lpage">184</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>2643620</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jcm&amp;resid=27/1/182"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.13"
+                             data-doi="10.1186/1471-2431-12-194">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Myléus</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hernell</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gothefors</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">M.-L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Persson</span>,  <span class="cit-name-given-names">L.-Å.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stenlund</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ivarsson</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Early infections are associated with increased risk for celiac disease: an incident case-referent study</span>. <abbr class="cit-jnl-abbrev">BMC Pediatr</abbr> <span class="cit-vol">12</span>, <span class="cit-fpage">194</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1186/1471-2431-12-194</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23249321</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1186/1471-2431-12-194&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23249321&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Early%20infections%20are%20associated%20with%20increased%20risk%20for%20celiac%20disease%3A%20an%20incident%20case-referent%20study&amp;author=A.%20Myl%C3%A9us&amp;author=O.%20Hernell&amp;author=L.%20Gothefors&amp;author=M.-L.%20Hammarstr%C3%B6m&amp;author=L.-%C3%85.%20Persson&amp;author=H.%20Stenlund&amp;author=A.%20Ivarsson&amp;publication_year=2012&amp;journal=BMC%20Pediatr&amp;volume=12&amp;pages=194&amp;doi=10.1186%2F1471-2431-12-194&amp;pmid=23249321">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.14"
+                             data-doi="10.1017/S0007114512005521">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Olivares</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Laparra</span>,  <span class="cit-name-given-names">J. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sanz</span>,  <span class="cit-name-given-names">Y.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title">Host genotype, intestinal microbiota and inflammatory disorders</span>. <abbr class="cit-jnl-abbrev">Br J Nutr</abbr> <span class="cit-vol">109</span> (<span class="cit-supplement">Suppl 2</span>), <span class="cit-fpage">S76</span>–<span class="cit-lpage">S80</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1017/S0007114512005521</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23360883</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1017/S0007114512005521&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23360883&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Host%20genotype%2C%20intestinal%20microbiota%20and%20inflammatory%20disorders&amp;author=M.%20Olivares&amp;author=J.%20M.%20Laparra&amp;author=Y.%20Sanz&amp;publication_year=2013&amp;journal=Br%20J%20Nutr&amp;volume=109&amp;pages=S76-S80&amp;doi=10.1017%2FS0007114512005521&amp;pmid=23360883">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.15"
+                             data-doi="10.1542/peds.2007-2989">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Olsson</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hernell</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hörnell</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lönnberg</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ivarsson</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Difference in celiac disease risk between Swedish birth cohorts suggests an opportunity for primary prevention</span>. <abbr class="cit-jnl-abbrev">Pediatrics</abbr> <span class="cit-vol">122</span>, <span class="cit-fpage">528</span>–<span class="cit-lpage">534</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1542/peds.2007-2989</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18762522</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=pediatrics&amp;resid=122/3/528"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.16"
+                             data-doi="10.1038/ajg.2009.524">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ou</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hedberg</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hörstedt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baranov</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Forsberg</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Drobni</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sandström</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wai</span>,  <span class="cit-name-given-names">S. N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Johansson</span>,  <span class="cit-name-given-names">I.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Proximal small intestinal microbiota and identification of rod-shaped bacteria associated with childhood celiac disease</span>. <abbr class="cit-jnl-abbrev">Am J Gastroenterol</abbr> <span class="cit-vol">104</span>, <span class="cit-fpage">3058</span>–<span class="cit-lpage">3067</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/ajg.2009.524</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19755974</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/ajg.2009.524&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=19755974&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Proximal%20small%20intestinal%20microbiota%20and%20identification%20of%20rod-shaped%20bacteria%20associated%20with%20childhood%20celiac%20disease&amp;author=G.%20Ou&amp;author=M.%20Hedberg&amp;author=P.%20H%C3%B6rstedt&amp;author=V.%20Baranov&amp;author=G.%20Forsberg&amp;author=M.%20Drobni&amp;author=O.%20Sandstr%C3%B6m&amp;author=S.%20N.%20Wai&amp;author=I.%20Johansson&amp;publication_year=2009&amp;journal=Am%20J%20Gastroenterol&amp;volume=104&amp;pages=3058-3067&amp;doi=10.1038%2Fajg.2009.524&amp;pmid=19755974">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.17"
+                             data-doi="10.1099/jmm.0.020420-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sakamoto</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ohkuma</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Usefulness of the <em>hsp60</em> gene for the identification and classification of Gram-negative anaerobic rods</span>. <abbr class="cit-jnl-abbrev">J Med Microbiol</abbr> <span class="cit-vol">59</span>, <span class="cit-fpage">1293</span>–<span class="cit-lpage">1302</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/jmm.0.020420-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20671088</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=medmicro&amp;resid=59/11/1293"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.18"
+                             data-doi="10.1093/nar/gkp967">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sayers</span>,  <span class="cit-name-given-names">E. W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Barrett</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Benson</span>,  <span class="cit-name-given-names">D. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bolton</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bryant</span>,  <span class="cit-name-given-names">S. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Canese</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chetvernin</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Church</span>,  <span class="cit-name-given-names">D. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dicuccio</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Database resources of the National Center for Biotechnology Information</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">38</span> (<span class="cit-supplement">Database issue</span>), <span class="cit-fpage">D5</span>–<span class="cit-lpage">D16</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkp967</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19910364</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=38/suppl_1/D5"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-19-1" title="View reference  in text"
+                           id="ref-19">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.19"
+                             data-doi="10.1099/00207713-40-2-205">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Shah</span>,  <span class="cit-name-given-names">H. N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Collins</span>,  <span class="cit-name-given-names">D. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1990</span><strong>).</strong> <span class="cit-article-title"><em>Prevotella</em>, a new genus to include <em>Bacteroides melaninogenicus</em> and related species formerly classified in the genus <em>Bacteroides</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">40</span>, <span class="cit-fpage">205</span>–<span class="cit-lpage">208</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-40-2-205</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>2223612</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=40/2/205"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.20"
+                             data-doi="10.1099/00207713-44-4-846">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Goebel</span>,  <span class="cit-name-given-names">B. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Taxonomic note: a place for DNA-DNA reassociation and 16S rRNA sequence analysis in the present species definition in bacteriology</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">44</span>, <span class="cit-fpage">846</span>–<span class="cit-lpage">849</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-44-4-846</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=44/4/846"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.21"
+                             data-doi="10.1016/j.syapm.2008.07.002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Urdiain</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">López-López</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gonzalo</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Busse</span>,  <span class="cit-name-given-names">H. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Langer</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kämpfer</span>,  <span class="cit-name-given-names">P.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rosselló-Móra</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Reclassification of <em>Rhodobium marinum</em> and <em>Rhodobium pfennigii</em> as <em>Afifella marina</em> gen. nov. comb. nov. and <em>Afifella pfennigii</em> comb. nov., a new genus of photoheterotrophic <em>Alphaproteobacteria</em> and emended descriptions of <em>Rhodobium</em>, <em>Rhodobium orientis</em> and <em>Rhodobium gokarnense</em></span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">31</span>, <span class="cit-fpage">339</span>–<span class="cit-lpage">351</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.syapm.2008.07.002</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18774253</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.syapm.2008.07.002&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=18774253&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Reclassification%20of%20Rhodobium%20marinum%20and%20Rhodobium%20pfennigii%20as%20Afifella%20marina%20gen.%20nov.%20comb.%20nov.%20and%20Afifella%20pfennigii%20comb.%20nov.%2C%20a%20new%20genus%20of%20photoheterotrophic%20Alphaproteobacteria%20and%20emended%20descriptions%20of%20Rhodobium%2C%20Rhodobium%20orientis%20and%20Rhodobium%20gokarnense&amp;author=M.%20Urdiain&amp;author=A.%20L%C3%B3pez-L%C3%B3pez&amp;author=C.%20Gonzalo&amp;author=H.%20J.%20Busse&amp;author=S.%20Langer&amp;author=P.%20K%C3%A4mpfer&amp;author=R.%20Rossell%C3%B3-M%C3%B3ra&amp;publication_year=2008&amp;journal=Syst%20Appl%20Microbiol&amp;volume=31&amp;pages=339-351&amp;doi=10.1016%2Fj.syapm.2008.07.002&amp;pmid=18774253">Google Scholar</a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4207.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4224.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="open-access-note">
+               <span class="open-access-note">OPEN ACCESS ARTICLE</span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    <span class="slug-metadata-note ahead-of-print">
+                                 	
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">June 21, 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.052647-0" class="slug-doi">10.1099/ijs.0.052647-0
+                                    </span>
+                                 </span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4218-4223
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li><span class="creative-commons-article">Free via Creative Commons: <span>CC</span></span></li>
+                        <li><span class="ccv cc-version-by/2.5/"></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4218.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4218.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_11/4218/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_11/4218">PPT Slides of All Figures</a></li>
+                        <li class="cb-versions">
+                           <div><span id="pap-all-versions-label">All Versions of this Article:</span><ol class="version-list">
+                                 <li><a href="/content/early/2013/06/18/ijs.0.052647-0">ijs.0.052647-0v1</a></li>
+                                 <li class="current-li"><span>63/Pt_11/4218</span> <span class="current-version">most recent</span></li>
+                              </ol>
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings">
+                              <li>New Taxa
+                                 <ul class="subject-sub-headings last-child">
+                                    <li><a class="tocsection-search"
+                                          href="/search?tocsectionid=Bacteroidetes&amp;sortspec=date&amp;submit=Submit">Bacteroidetes</a></li>
+                                 </ul>
+                              </li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4218&amp;current-view-path=/content/63/Pt_11/4218.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4218&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4218.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4218&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4218.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.052647-0&amp;citation=Hedberg%20et%20al.%2063%20%28Pt%2011%29:%204218&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4218&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=23793857&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4218">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4218.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4218#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4218" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4218&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4218.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AHedberg%20author%3AM.E.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Hedberg, M. E.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AHammarstr%C3%B6m%20author%3AS.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Hammarström, S.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4218.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=23793857&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Hedberg%20ME&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Hedberg, M. E.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Hammarstr%C3%B6m%20S&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Hammarström, S.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/23793857"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4218.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4218#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.pdf
new file mode 100644
index 00000000..8cc6e132
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/results.json b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/results.json
new file mode 100644
index 00000000..69f8f5c2
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/results.json
@@ -0,0 +1,98 @@
+{
+  "publisher": {
+    "value": [
+      "Society for General Microbiology"
+    ]
+  },
+  "journal": {
+    "value": [
+      "International Journal of Systematic and Evolutionary\n                Microbiology"
+    ]
+  },
+  "title": {
+    "value": [
+      "Prevotella jejuni sp. nov., isolated from the small intestine of a child with coeliac disease"
+    ]
+  },
+  "authors": {
+    "value": [
+      "Maria E. Hedberg",
+      "Anne Israelsson",
+      "Edward R. B. Moore",
+      "Liselott Svensson-Stadler",
+      "Sun Nyunt Wai",
+      "Grzegorz Pietz",
+      "Olof Sandström",
+      "Olle Hernell",
+      "Marie-Louise Hammarström",
+      "Sten Hammarström"
+    ]
+  },
+  "date": {
+    "value": [
+      "11/01/2013"
+    ]
+  },
+  "doi": {
+    "value": [
+      "10.1099/ijs.0.052647-0"
+    ]
+  },
+  "volume": {
+    "value": [
+      "63"
+    ]
+  },
+  "issue": {
+    "value": [
+      "Pt 11"
+    ]
+  },
+  "firstpage": {
+    "value": [
+      "4218"
+    ]
+  },
+  "abstract": {
+    "value": [
+      "\n                  \n                      Next Section\n                  Abstract\n                  \n                  Five obligately anaerobic, Gram-stain-negative, saccharolytic and proteolytic, non-spore-forming bacilli (strains CD3 : 27,\n                     CD3 : 28T, CD3 : 33, CD3 : 32 and CD3 : 34) are described. All five strains were isolated from the small intestine of a female child\n                     with coeliac disease. Cells of the five strains were short rods or coccoid cells with longer filamentous forms seen sporadically.\n                     The organisms produced acetic acid and succinic acid as major metabolic end products. Phylogenetic analysis based on comparative\n                     16S rRNA gene sequence analysis revealed close relationships between CD3 : 27, CD3 : 28T and CD3 : 33, between CD3 : 32 and Prevotella histicola CCUG 55407T, and between CD3 : 34 and Prevotella melaninogenica CCUG 4944BT. Strains CD3 : 27, CD3 : 28T and CD3 : 33 were clearly different from all recognized species within the genus Prevotella and related most closely to but distinct from P. melaninogenica. Based on 16S rRNA, RNA polymerase β-subunit (rpoB) and 60 kDa chaperonin protein subunit (cpn60) gene sequencing, and phenotypic, chemical and biochemical properties, strains CD3 : 27, CD3 : 28T and CD3 : 33 are considered to represent a novel species within the genus Prevotella, for which the name Prevotella jejuni sp. nov. is proposed. Strain CD3 : 28T ( = CCUG 60371T = DSM 26989T) is the type strain of the proposed novel species. All five strains were able to form homologous aggregates, in which tube-like\n                     structures were connecting individual bacteria cells. The five strains were able to bind to human intestinal carcinoma cell\n                     lines at 37 °C.\n                  \n                  \n               "
+    ]
+  },
+  "fulltext_html": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4218.full"
+    ]
+  },
+  "fulltext_pdf": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4218.full.pdf"
+    ]
+  },
+  "supplementary_material": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4218/suppl/DC1"
+    ]
+  },
+  "figure": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4218/F1.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4218/F2.small.gif"
+    ]
+  },
+  "figure_caption": {
+    "value": [
+      "Fig. 1.  \n                     \n                     Scanning electron micrographs showing surface structures of cells of P. jejuni, strains CD3 : 27 (a) and CD3 : 28T (b) and P. histicola strain CD3 : 32 (c). (d) Transmission electron micrograph of a cell of strain P. jejuni CD3 : 33; arrows indicate cross-section of the tube-like structures shown in (a)–(c) and arrowheads indicate outer membrane\n                        vesicles. Bars, 0.2 µm (a, b, d); 1 µm (c).\n                     \n                     \n                     \n                  ",
+      "Fig. 2.  \n                     \n                     Phylogenetic tree based on 16S rRNA gene sequences showing the relationships between strains CD3 : 27, CD3 : 28T and CD3 : 33 and related species. The 16S rRNA gene sequence of Porphyromonas gingivalis ATCC 33277T served as an outgroup. Bar, 0.02 substitutions per nucleotide position.\n                     \n                     \n                     \n                  "
+    ]
+  },
+  "license": {
+    "value": [
+      "\n                  This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted\n                     use, distribution, and reproduction in any medium, provided the original work is properly cited.\n                  \n               "
+    ]
+  },
+  "copyright": {
+    "value": [
+      "Copyright ©\n                     \t\t2015 International Union of Microbiological Societies\n                     \t\n                  "
+    ]
+  }
+}
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/DC1 b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/DC1
new file mode 100644
index 00000000..d45128cb
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/DC1
@@ -0,0 +1,351 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Supplementary material </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/ijs.0.053900-0/DC1" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-data-supp.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-data-supp.css" /><script type="text/javascript" id="session-d7459754e1">var callbackToken='5635C00598180E6';</script><script type="text/javascript" id="session-d7459754e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-data-supp.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-data-supp">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4340%2Fsuppl%2FDC1">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <h1 class="data-supp-article-title">Molecular and phenotypic analyses reveal the non-identity of the <em>Phaeobacter gallaeciensis</em> type strain deposits CIP 105210<sup>T</sup> and DSM 17395
+            </h1>
+            <div><span class="highwire-journal-article-marker-start"></span><div class="auto-clean"><span style="font-family: Verdana,Arial,Helvetica,sans-serif;  font-size: 83.33%">
+                     
+                     
+                     <h2>Supplementary material</h2>
+                     
+                     <p><strong>Files in this Data Supplement:</strong></p>
+                     
+                     <ul>
+                        <li><a href="/content/suppl/2013/11/05/ijs.0.053900-0.DC1/ijs053900.pdf">Supplementary material</a> 
+                           		
+                           
+                        </li>
+                     </ul>
+                     </span>
+                  
+                  
+               </div><span class="highwire-journal-article-marker-end"></span></div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              	
+                              
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.053900-0" class="slug-doi">10.1099/ijs.0.053900-0</span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date">
+                                    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4340-4349
+                                    </span>
+                                 </cite>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/63/Pt_11/4340.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><a href="/content/63/Pt_11/4340.full" rel="view-full-text">Full Text</a><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4340.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a></li>
+                        <li><span class="variant-indicator">» <span>Supplementary material</span></span></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F1.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F1.small.gif
new file mode 100644
index 00000000..c2605f4c
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F1.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F2.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F2.small.gif
new file mode 100644
index 00000000..c7425362
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F2.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F3.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F3.small.gif
new file mode 100644
index 00000000..4a47a828
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F3.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F4.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F4.small.gif
new file mode 100644
index 00000000..fbf04a12
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F4.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F5.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F5.small.gif
new file mode 100644
index 00000000..229bd2c8
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F5.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.html b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.html
new file mode 100644
index 00000000..02e884f3
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.html
@@ -0,0 +1,2072 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Molecular and phenotypic analyses reveal the non-identity of the Phaeobacter gallaeciensis type strain deposits CIP 105210T
+         and DSM 17395 
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4340" />
+      <meta content="/ijs/63/Pt_11/4340.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Molecular and phenotypic analyses reveal the non-identity of the Phaeobacter gallaeciensis type strain deposits CIP 105210T and DSM 17395"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.053900-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Nora Buddruhs" name="DC.Contributor" />
+      <meta content="Silke Pradella" name="DC.Contributor" />
+      <meta content="Markus Göker" name="DC.Contributor" />
+      <meta content="Orsola Päuker" name="DC.Contributor" />
+      <meta content="Rüdiger Pukall" name="DC.Contributor" />
+      <meta content="Cathrin Spröer" name="DC.Contributor" />
+      <meta content="Peter Schumann" name="DC.Contributor" />
+      <meta content="Jörn Petersen" name="DC.Contributor" />
+      <meta content="Thorsten Brinkhoff" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Nora Buddruhs" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Silke Pradella" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Markus Göker" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Orsola Päuker" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Rüdiger Pukall" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Cathrin Spröer" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Peter Schumann" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Jörn Petersen" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Thorsten Brinkhoff" />
+      <meta name="citation_author_institution"
+            content="2Institute for Chemistry and Biology of the Marine Environment, University of Oldenburg, Oldenburg, Germany" />
+      <meta content="Molecular and phenotypic analyses reveal the non-identity of the Phaeobacter gallaeciensis type strain deposits CIP 105210T and DSM 17395"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4340" name="citation_firstpage" />
+      <meta content="4349" name="citation_lastpage" />
+      <meta content="63/Pt_11/4340" name="citation_id" />
+      <meta content="63/Pt 11/4340" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4340" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.053900-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4340.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4340.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4340.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4340"
+            name="citation_public_url" />
+      <meta content="24187021" name="citation_pmid" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Taxonomic Note" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4330.short" rel="prev" />
+      <link href="/content/63/Pt_11/4350.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d7460001e1">var callbackToken='5635C00598180E6';</script><script type="text/javascript" id="session-d7460001e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search-go" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4340.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline">Molecular and phenotypic analyses reveal the non-identity of the <em>Phaeobacter gallaeciensis</em> type strain deposits CIP 105210<sup>T</sup> and DSM 17395
+               </h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Nora+Buddruhs&amp;sortspec=date&amp;submit=Submit">Nora Buddruhs</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-1" class="xref-fn" href="#fn-1">†</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Silke+Pradella&amp;sortspec=date&amp;submit=Submit">Silke Pradella</a></span><a id="xref-aff-1-2" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-2" class="xref-fn" href="#fn-1">†</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Markus+G%C3%B6ker&amp;sortspec=date&amp;submit=Submit">Markus Göker</a></span><a id="xref-aff-1-3" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-4" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Orsola+P%C3%A4uker&amp;sortspec=date&amp;submit=Submit">Orsola Päuker</a></span><a id="xref-aff-1-4" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-5" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=R%C3%BCdiger+Pukall&amp;sortspec=date&amp;submit=Submit">Rüdiger Pukall</a></span><a id="xref-aff-1-5" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-6" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Cathrin+Spr%C3%B6er&amp;sortspec=date&amp;submit=Submit">Cathrin Spröer</a></span><a id="xref-aff-1-6" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-7" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Peter+Schumann&amp;sortspec=date&amp;submit=Submit">Peter Schumann</a></span><a id="xref-aff-1-7" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-8" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=J%C3%B6rn+Petersen&amp;sortspec=date&amp;submit=Submit">Jörn Petersen</a></span><a id="xref-aff-1-8" class="xref-aff" href="#aff-1"><sup>1</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-9"><span class="name"><a class="name-search"
+                              href="/search?author1=Thorsten+Brinkhoff&amp;sortspec=date&amp;submit=Submit">Thorsten Brinkhoff</a></span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>Institute for Chemistry and Biology of the Marine Environment, University of Oldenburg, Oldenburg, Germany
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> Jörn Petersen <span class="em-link"><span class="em-addr">joern.petersen{at}dsmz.de</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-4">The marine genus <span class="named-content genus" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> currently comprises six species, some of which were intensively studied mainly due to their ability to produce secondary
+                     metabolites. The type strain of the type species, <span class="named-content species" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>Phaeobacter gallaeciensis</em></a></span> BS107<sup>T</sup>, has been deposited at several public culture collections worldwide. Based on differences in plasmid profiles, we detected
+                     that the alleged <span class="named-content species" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> type strains deposited at the Collection Institute Pasteur (CIP; Paris, France) as CIP 105210 and at the German Collection
+                     of Microorganisms and Cell Cultures (DSMZ; Braunschweig, Germany) as DSM 17395 are not identical. To determine the identity
+                     of these strains, we conducted DNA–DNA hybridization, matrix-assisted laser desorption/ionization time-of-flight mass spectrometry
+                     (MALDI-TOF), 16S rRNA gene and internal transcribed spacer (ITS) sequence analyses, as well as physiological experiments.
+                     Based on the detailed 16S rRNA gene reanalysis we showed that strain CIP 105210 most likely corresponds to the original <span class="named-content species" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> type strain BS107<sup>T</sup>. In contrast, the <span class="named-content genus" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain DSM 17395 exhibits a much closer affiliation to <span class="named-content species" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter inhibens"
+                           href="doi:10.1601/nm.10132"><em>Phaeobacter inhibens</em></a></span> DSM 16374<sup>T</sup> ( = T5<sup>T</sup>) and should thus be allocated to this species. The detection of the dissimilarity of strains CIP 105210<sup>T</sup> and DSM 17395 will influence future comparative studies within the genus <span class="named-content genus" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span>.
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Introduction" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-equal" id="fn-1">
+                        <p id="p-1"><a class="rev-xref" href="#xref-fn-1-1">↵</a><span class="fn-label">†</span> These authors contributed equally to this work.
+                        </p>
+                     </li>
+                     <li class="fn-other" id="fn-2">
+                        <p id="p-2">The GenBank/EMBL/DDBJ accession numbers for the 16S rRNA gene sequences of the <span class="named-content genus" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup>, DSM 16374<sup>T</sup>, DSM 17395 and DSM 24564<sup>T</sup> are KC176239, KC176240, KC176241 and KC176242, respectively. The GenBank/EMBL/DDBJ accession numbers for the 16S–23S rRNA
+                           gene internal transcribed spacer of the <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup>, DSM 16374<sup>T</sup>, DSM 17395, DSM 23529<sup>T</sup>, DSM 23566<sup>T</sup>, DSM 24564<sup>T</sup> and DSM 25627<sup>T</sup> are KC176233, KC176234, KC176235, KC176236, KC176237, KC176238 and KC907729, respectively.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-3">
+                        <p id="p-3">Four supplementary figures and four supplementary tables are available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="section intro" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-2" title="Methods" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  <h2>Introduction</h2>
+                  
+                  <p id="p-13">The genus <span class="named-content genus" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span><em>,</em> currently comprising the species <span class="named-content species" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>Phaeobacter gallaeciensis</em></a></span>, <span class="named-content species" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>, <span class="named-content species" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                           href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span><em>,</em> <span class="named-content species" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="P. caeruleus"
+                           href="doi:10.1601/nm.14301"><em>P. caeruleus</em></a></span>, <span class="named-content species" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="P. arcticus"
+                           href="doi:10.1601/nm.14057"><em>P. arcticus</em></a></span> and <span class="named-content species" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                           href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> (<a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Gaboyer <em>et al.</em>, 2013</a>), belongs to the marine <span class="named-content genus" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter"
+                           href="doi:10.1601/nm.1134"><em>Roseobacter</em></a></span> clade. It was established by <a id="xref-ref-25-1" class="xref-bibr" href="#ref-25">Martens <em>et al.</em> (2006)</a> after reclassification of <span class="named-content species" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter gallaeciensis"
+                           href="doi:10.1601/nm.1138"><em>Roseobacter gallaeciensis</em></a></span> (<a id="xref-ref-34-1" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em>, 1998</a>) as <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>, which is the type species of the genus, and description of <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> as a new species. During recent years, <span class="named-content genus" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains have received a lot of interest due to the production of various secondary metabolites (e.g. <a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Berger <em>et al.</em>, 2011</a>, <a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">2012</a>; <a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Brinkhoff <em>et al.</em>, 2004</a>; <a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Bruhn <em>et al.</em>, 2007</a>; <a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Geng <em>et al.</em>, 2008</a>; <a id="xref-ref-26-1" class="xref-bibr" href="#ref-26">Martens <em>et al.</em>, 2007</a>; <a id="xref-ref-35-1" class="xref-bibr" href="#ref-35">Seyedsayamdost <em>et al.</em>, 2011a</a>, <a id="xref-ref-36-1" class="xref-bibr" href="#ref-36">b</a>).
+                  </p>
+                  
+                  <p id="p-14">Recently the genomes of three <span class="named-content genus" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains have been published, <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> DSM 17395, <span class="named-content species" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> 2.10 (<a id="xref-ref-40-1" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>) and <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> ANG1 (<a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Collins &amp; Nyholm, 2011</a>). However, evidence already indicated that strain ANG1 is more similar to <span class="named-content species" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                           href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> DSM 23529<sup>T</sup> ( = TF-218<sup>T</sup>) than to either DSM 17395 or DSM 24588 ( = 2.10) (unpublished results). Strain 2.10 was previously used in competition experiments
+                     of bacterial biofilms on the thalloid green alga <em>Ulva australis</em> (<a id="xref-ref-32-1" class="xref-bibr" href="#ref-32">Rao <em>et al.</em>, 2005</a>). Various physiological and genetic aspects of <span class="named-content species" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> DSM 17395 have also been studied, such as the pathway and substrate specificity of the algal metabolite dimethylsulfoniopropionate
+                     (DMSP) catabolism (<a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Dickschat <em>et al.</em>, 2010</a>), the compatibility of the plasmids (<a id="xref-ref-28-1" class="xref-bibr" href="#ref-28">Petersen, 2011</a>), and the primary metabolism by proteome analyses (<a id="xref-ref-44-1" class="xref-bibr" href="#ref-44">Zech <em>et al.</em>, 2009</a>).
+                  </p>
+                  
+                  <p id="p-15">With the description of the species <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> (basonym <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="R. gallaeciensis"
+                           href="doi:10.1601/nm.1138"><em>R. gallaeciensis</em></a></span>) in 1998, the type strain BS107<sup>T</sup> was primarily deposited at the Collection Institute Pasteur (CIP; Paris, France) as CIP 105210 (<a id="xref-ref-34-2" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em>, 1998</a>). According to the strain history (<a href="http://www.straininfo.net/strains/620650">http://www.straininfo.net/strains/620650</a>), the CIP referred the strain to the Colección Española de Cultivos Tipo (CECT; Burjassot, Spain) and to the American Type
+                     Culture Collection (ATCC; Manassas, USA), which in turn referred it to the Japan Collection of Micro-organisms at the RIKEN
+                     Bioscience Center (Tsukuba, Japan) followed by a transfer to the NITE (National Institute of Technology and Evaluation) Biological
+                     Resource Center (Kisarazu, Japan). At these culture collections the derivatives of strain CIP 105210 were designated CECT
+                     7277<sup>T</sup>, ATCC 700781<sup>T</sup>, JCM 21319<sup>T</sup> and NBRC 16654<sup>T</sup>, respectively. The Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures (DSMZ; Braunschweig, Germany)
+                     independently requested <span class="named-content species" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup> from the laboratory of the original depositor in 2005 and included it as DSM 17395 in the strain collection. Strain DSM 17395
+                     was subsequently collected by the Laboratorium voor Microbiologie (LMG; Gent, Belgium) and deposited as LMG 24391<sup>T</sup>. When investigating plasmid profiles of various <span class="named-content genus" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, we observed differences between the strains CIP 105210 and DSM 17395 even though both were considered identical
+                     with the type strain BS107<sup>T</sup>. This is critical, as due to the broad scientific interest in the <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> type strain, it was either obtained from the public culture collections or retrieved from other sources several times. For
+                     example, <a id="xref-ref-36-2" class="xref-bibr" href="#ref-36">Seyedsayamdost <em>et al.</em> (2011b)</a> allegedly used strain BS107<sup>T</sup> to investigate the mutualistic or pathogenic symbioses between <span class="named-content species" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> and the unicellular haptophycean alga <em>Emiliania huxleyi</em>. It was indicated that these authors received the strain BS107<sup>T</sup> from a collaborating laboratory; hence the biological identity of the strain used is ultimately unclear.
+                  </p>
+                  
+                  <p id="p-16">In this study, we consequently reassessed the biological identity of these strains. We compared in detail the characteristics
+                     of the strains CIP 105210 and DSM 17395 with those of the description of BS107<sup>T</sup> given by <a id="xref-ref-34-3" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em> (1998)</a> and with those of other closely related <span class="named-content genus" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, i.e. <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> DSM 24588 ( = 2.10; <a id="xref-ref-40-2" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>) and <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> ( = T5<sup>T</sup>; <a id="xref-ref-25-2" class="xref-bibr" href="#ref-25">Martens <em>et al.</em>, 2006</a>). Based on our results, according reclassifications are proposed.
+                  </p>
+                  
+               </div>
+               <div class="section methods" id="sec-2">
+                  <div class="section-nav"><a href="#sec-1" title="Introduction" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-11" title="Results" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  <h2>Methods</h2>
+                  
+                  <div id="sec-3" class="subsection">
+                     
+                     
+                     <div id="sec-4" class="subsection">
+                        
+                        <h4>Source of bacteria and culturing.</h4>
+                        
+                        <p id="p-17">The <span class="named-content genus" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 16374<sup>T</sup> ( = T5<sup>T</sup>), DSM 17395, DSM 23529<sup>T</sup> ( = TF-218<sup>T</sup>), DSM 23566<sup>T</sup> ( = 20188<sup>T</sup>), DSM 24564<sup>T</sup>, DSM 24588 ( = 2.10) and DSM 25627<sup>T</sup> ( = 306<sup>T</sup>) as well as <span class="named-content species" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter litoralis"
+                                 href="doi:10.1601/nm.1135"><em>Roseobacter litoralis</em></a></span> DSM 6996<sup>T</sup>, <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="Marinovum algicola"
+                                 href="doi:10.1601/nm.9794"><em>Marinovum algicola</em></a></span> DSM 10251<sup>T</sup> and <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter denitrificans"
+                                 href="doi:10.1601/nm.1137"><em>Roseobacter denitrificans</em></a></span> DSM 7001<sup>T</sup> were obtained from the DSMZ. The <span class="named-content genus" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain CIP 105210 was obtained from the CIP. Unless otherwise stated, cells were grown in marine broth 2216 (MB; Difco) or
+                           on MB agar at 28 °C (and at 25 °C in case of <span class="named-content species" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                                 href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> DSM 25627<sup>T</sup>).
+                        </p>
+                        
+                     </div>
+                     <div id="sec-5" class="subsection">
+                        
+                        <h4>Profiles of the extrachromosomal elements.</h4>
+                        
+                        <p id="p-18">To analyse the plasmid content of the <span class="named-content genus" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, their high-molecular-mass total genomic DNA was prepared within agarose plugs as previously described and subjected
+                           to pulsed-field gel electrophoresis (PFGE; <a id="xref-ref-30-1" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em>, 2010</a>). PFGE was performed in a contour-clamped homogeneous electric field (CHEF) system on a CHEF-DR III device (Bio-Rad) with
+                           1 % or 1.2 % agarose gels and modified 0.5× TBE buffer (45 mM Tris, 45 mM boric acid, 0.1 mM EDTA) at 14 °C. PFGE parameters,
+                           namely pulse time ramps and run times, were varied both to resolve chromosomal and extrachromosomal DNA and to identify different
+                           plasmid conformations (<a id="xref-ref-33-1" class="xref-bibr" href="#ref-33">Römling <em>et al.</em>, 1996</a>). Two PFGE parameter sets were applied to assess plasmid topology: (i) set A, 1 % (w/v) agarose gel with pulse times of 1
+                           to 48 s for 24 h at 200 V (6 V cm<sup>−1</sup>) and (ii) set B, 1 % (w/v) agarose gel with pulse times of 1 to 20 s for 22 h at 200 V (6 V cm<sup>−1</sup>). At least two PFGE gels were evaluated to determine plasmid sizes. The resulting plasmid profiles were interpreted as described
+                           by <a id="xref-ref-30-2" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em> (2010)</a>. Conventional unidirectional gel electrophoresis of DNA was in 0.8 % agarose gels and 1× TBE (89 mM Tris, 89 mM boric acid,
+                           2 mM EDTA) at 10 °C and 70 mA for 8.5 h. The BAC Tracker supercoiled DNA ladder (from 38 to 120 kb; Epicentre) was used to
+                           size plasmids with covalently closed circular (ccc) DNA topology.
+                        </p>
+                        
+                     </div>
+                     <div id="sec-6" class="subsection">
+                        
+                        <h4>16S rRNA gene and 16S–23S rRNA gene internal transcribed spacer (ITS) analysis.</h4>
+                        
+                        <p id="p-19">The PCR amplification of 16S rRNA genes from the genomic DNA of the <span class="named-content genus" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains was done as described by <a id="xref-ref-31-1" class="xref-bibr" href="#ref-31">Rainey <em>et al.</em> (1996)</a>. For the PCR amplification of the ITS region, the primer pair 16S_1401f 5′-GRGCCTTGYACACACCG-3′ (<a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Lane, 1991</a>) and 23S_130r 5′-GGTTBCCCCATTCRG-3′ (<a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Gürtler &amp; Stanisich, 1996</a>) was used. Resulting PCR products were cycle sequenced with the primers mentioned above in ‘Extended Hot Shot’ reactions
+                           as offered by the Seqlab company, Germany. The sequence analysis tool BioEdit 7.0.1 (<a href="http://www.mbio.ncsu.edu/BioEdit/bioedit.html">http://www.mbio.ncsu.edu/BioEdit/bioedit.html</a>) was utilized for 16S rRNA gene and ITS sequence editing. The accession numbers of retrieved 16S rRNA gene sequences from
+                           <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup> (<a id="xref-ref-34-4" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em>, 1998</a>), <span class="named-content species" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> T5<sup>T</sup> (<a id="xref-ref-25-3" class="xref-bibr" href="#ref-25">Martens <em>et al.</em>, 2006</a>), <span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                                 href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> TF-218<sup>T</sup>, <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="P. arcticus"
+                                 href="doi:10.1601/nm.14057"><em>P. arcticus</em></a></span> 20188<sup>T</sup>, <span class="named-content species" id="named-content-50"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> LSS9 and <span class="named-content species" id="named-content-51"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                                 href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> 306<sup>T</sup> were Y13244, AY177712, NR_044026, NR_043888, GQ906799 and HE661585, respectively. Further 16S rRNA gene or ITS sequences
+                           used in this study were extracted from the genome sequences of <span class="named-content genus" id="named-content-52"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 17395 (ABIF01000000), DSM 24588 ( = 2.10; CP002972–CP002975) and ANG1 (AFCF01000000) using the Integrated Microbial
+                           Genomes (IMG) system (<a href="http://img.jgi.doe.gov/cgi-bin/w/main.cgi">http://img.jgi.doe.gov/cgi-bin/w/main.cgi</a>; <a id="xref-ref-24-1" class="xref-bibr" href="#ref-24">Markowitz <em>et al.</em>, 2012</a>).
+                        </p>
+                        
+                        <p id="p-20">Sequences were aligned with <span class="sc">mafft</span> version 6.850b, using the ‘--<em>genafpair</em>’ option but default settings otherwise (<a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Katoh <em>et al.</em>, 2005</a>). Phylogenetic analysis under the maximum-likelihood (ML) criterion (<a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Felsenstein, 1981</a>) was conducted with RAxML version 7.2.8, using its novel rapid bootstrap option combined with the autoMRE bootstrapping criterion
+                           (<a id="xref-ref-27-1" class="xref-bibr" href="#ref-27">Pattengale <em>et al.</em>, 2010</a>) with subsequent search for the best tree under the GTRMIX approach (<a id="xref-ref-38-1" class="xref-bibr" href="#ref-38">Stamatakis <em>et al.</em>, 2008</a>). Branch-and-bound search for the best trees under the maximum-parsimony (MP) criterion (<a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Fitch, 1971</a>) was done with <span class="sc">paup</span>* version 4.0b10 (<a id="xref-ref-39-1" class="xref-bibr" href="#ref-39">Swofford, 2002</a>), treating gaps as missing data and collapsing branches of zero minimum length; 1000 bootstrap replicates were conducted
+                           in the same manner. The resulting best trees were rooted using the midpoint-rooting method (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Farris, 1972</a>; <a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Hess &amp; De Moraes Russo, 2007</a>).
+                        </p>
+                        
+                     </div>
+                     <div id="sec-7" class="subsection">
+                        
+                        <h4>MALDI-TOF MS protein analysis.</h4>
+                        
+                        <p id="p-21">Whole-cell protein extracts of the <span class="named-content genus" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210, DSM 17395, DSM 24588, DSM 16374<sup>T</sup>, DSM 23529<sup>T</sup>, DSM 23566<sup>T</sup>, DSM 24564<sup>T</sup> and DSM 25627<sup>T</sup> were analysed by matrix-assisted laser desorption/ionization time-of-flight mass spectrometry (MALDI-TOF MS) using a Microflex
+                           L20 mass spectrometer (Bruker Daltonics) equipped with a N<sub>2</sub> laser. Sample preparation for MALDI-TOF MS protein analysis was carried out according to the ethanol/formic acid extraction
+                           protocol recommended by Bruker Daltonics as described in detail by <a id="xref-ref-41-1" class="xref-bibr" href="#ref-41">Tóth <em>et al.</em> (2008)</a>. The MALDI-TOF mass spectra were analysed with the BioTyper software (version 3.0; Bruker Daltonics).
+                        </p>
+                        
+                     </div>
+                     <div id="sec-8" class="subsection">
+                        
+                        <h4>DNA–DNA hybridization (DDH).</h4>
+                        
+                        <p id="p-22">Cells of the <span class="named-content genus" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210, DSM 17395, DSM 16374<sup>T</sup> and DSM 24588 were disrupted by using a Constant Systems TS 0.75 kW (IUL Instruments) and the DNA in the crude lysate was
+                           purified by chromatography on hydroxyapatite as described by <a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Cashion <em>et al.</em> (1977)</a>. DNA–DNA hybridization was carried out as described by <a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">De Ley <em>et al.</em> (1970)</a> and modified by <a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Huß <em>et al.</em> (1983)</a> using a model Cary 100 Bio UV/VIS-spectrophotometer equipped with a Peltier-thermostatted 6×6 multi-cell changer and a temperature
+                           controller with <em>in situ</em> temperature probe (Varian). Each strain was measured in two technical replicates and the mean result was taken.
+                        </p>
+                        
+                     </div>
+                     <div id="sec-9" class="subsection">
+                        
+                        <h4>Growth and hydrolysis experiments.</h4>
+                        
+                        <p id="p-23">To determine the substrate spectrum of the <span class="named-content genus" id="named-content-55"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210 and DSM 17395, cells were grown in artificial seawater (ASW; solution of Sigma sea salts: S9883) supplemented
+                           with 10 mg casein hydrolysate l<sup>−1</sup> (CAS: 65072-00-6; Merck) to avoid auxotrophy and with different carbon sources at a concentration of 0.1 % each, including
+                           2-ketoglutarate, acetate, <span class="sc">l</span>-arabinose, butyrate, cellobiose, citrate, <span class="sc">d</span>-fucose, glucosamine, glycerol, <span class="sc">l</span>-leucine, maltose, <span class="sc">l</span>-rhamnose, <span class="sc">l</span>-serine, <span class="sc">d</span>-sorbitol, succinate, sucrose, trehalose, Tween 20, Tween 40 and Tween 80. The tests were performed in the 24-well microtitre-plate
+                           format. In detail, cells were grown on MB agar for 2 days at 28 °C, then harvested with a sterile swab and inoculated in ASW
+                           medium. The cell suspension was thereby adjusted to a turbidity of 80 % transmittance using a turbidimeter (AES Chemunex BLG
+                           3531). Afterwards, 2 ml of each suspension was pipetted into a 24-well microtitre plate (Greiner). A sample lacking any carbon
+                           source was included as negative control. Cells were incubated in a microtitre plate reader (Infinite F200 pro; Tecan) at 23
+                           °C and with shaking at 88 r.p.m. for 7 days. Growth was automatically measured every 15 min with the Infinite F200 system
+                           as increase of the OD<sub>600</sub>. Growth at temperatures of 4 °C and 37 °C was determined in 200 ml MB within Erlenmeyer flasks for one month and measured
+                           photometrically as increase of the OD<sub>600</sub> using an Ultrospec II spectrophotometer (LKB-Biochrom).
+                        </p>
+                        
+                        <p id="p-24">Exoenzyme activities (hydrolysis of gelatin, starch and Tween 80) were analysed using MB solidified with 4 % (w/v) gelatin
+                           or 1.5 % (w/v) agarose and supplemented with 0.2 % (w/v) starch and 1 % (v/v) Tween 80, respectively, as described by <a id="xref-ref-37-1" class="xref-bibr" href="#ref-37">Smibert &amp; Krieg (1981)</a>. As a positive control, <span class="named-content species" id="named-content-56"><a class="namesforlife" rel="namesforlife-name" title="R. litoralis"
+                                 href="doi:10.1601/nm.1135"><em>R. litoralis</em></a></span> DSM 6996<sup>T</sup> was used for gelatin and Tween 80 hydrolysis and <span class="named-content species" id="named-content-57"><a class="namesforlife" rel="namesforlife-name" title="M. algicola"
+                                 href="doi:10.1601/nm.9794"><em>M. algicola</em></a></span> DSM 10251<sup>T</sup> for starch hydrolysis. Reduction of nitrate was tested according to <a id="xref-ref-37-2" class="xref-bibr" href="#ref-37">Smibert &amp; Krieg (1981)</a> in MB supplemented with 0.1 % (w/v) potassium nitrate; <span class="named-content species" id="named-content-58"><a class="namesforlife" rel="namesforlife-name" title="R. denitrificans"
+                                 href="doi:10.1601/nm.1137"><em>R. denitrificans</em></a></span> DSM 7001<sup>T</sup> served as a negative control. The assays were incubated for 7 days at 28 °C, except for the hydrolysis of starch, conducted
+                           at 20 °C. The growth and hydrolysis tests described above were all performed in three technical replicates.
+                        </p>
+                        
+                     </div>
+                     <div id="sec-10" class="subsection">
+                        
+                        <h4>Phenotype MicroArray (PM) experiments.</h4>
+                        
+                        <p id="p-25">To determine the metabolic properties of the <span class="named-content genus" id="named-content-59"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210, DSM 17395, DSM 24588 and DSM 16374<sup>T</sup> we used the PM technology (Biolog; <a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Bochner, 2009</a>). The <span class="named-content genus" id="named-content-60"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains were grown on MB agar for 48 h and subsequently analysed using the Phenotype MicroArray MicroPlate PM01 and PM02-A
+                           (AES Chemunex BLG 12111, BLG 12112) over 70 h; thus 190 different carbon sources were tested. Each strain was measured in
+                           three biological replicates. The inoculation medium was modified according to the requirements of marine bacteria, i.e. 10
+                           ml of the inoculation fluid IF-0a (AES Chemunex BLG 72268) was supplemented with 1200 µl artificial seawater stock solution,
+                           120 µl vitamin stock solution, 12 µl trace element stock solution, 120 µl NaHCO<sub>3</sub> buffer, 428 µl ultrapure H<sub>2</sub>O and 120 µl DyeD (AES Chemunex BLG 74224). The stock solutions had the following composition (l<sup>−1</sup>): (i) artificial seawater stock solution: 200 g NaCl, 40 g Na<sub>2</sub>SO<sub>4</sub>, 30 g MgCl<sub>2</sub> . 6H<sub>2</sub>O, 5 g KCl, 2.5 g NH<sub>4</sub>Cl, 2 g KH<sub>2</sub>PO<sub>4</sub>, 1.5 g CaCl<sub>2</sub> . 2H<sub>2</sub>O; (ii) trace element stock solution: 2.1 g FeSO<sub>4</sub> . 7H<sub>2</sub>O, 13 ml 25 % HCl, 5.2 g Titriplex III (Na<sub>2</sub>EDTA; adjust pH to 6.0–6.5 to resolve), 190 mg CoCl<sub>2</sub> . 6H<sub>2</sub>O, 144 mg ZnSO<sub>4</sub> . 7H<sub>2</sub>O, 100 mg MnCl<sub>2</sub> . 4H<sub>2</sub>O, 36 mg Na<sub>2</sub>MoO<sub>4</sub> . 2H<sub>2</sub>O, 30 mg H<sub>3</sub>BO<sub>3</sub>, 24 mg NiCl<sub>2</sub> . 6H<sub>2</sub>O, 2 mg CuCl<sub>2</sub> . 2H<sub>2</sub>O; (iii) vitamin stock solution: 100 mg thiamine, 20 mg niacin, 8 mg 4-aminobenzoic acid, 2 mg biotin; and (iv) buffer stock
+                           solution: 19 g NaHCO<sub>3</sub>.
+                        </p>
+                        
+                        <p id="p-26">The cells were suspended in the modified inoculation medium using a sterile swab. The turbidity was adjusted to a cell density
+                           of 85 % transmittance using a turbidimeter (AES Chemunex BLG 3531) and 100 µl of the cell suspension were pipetted in each
+                           of the wells. The MicroPlates were sealed with Parafilm, incubated at 28 °C and measured in the Omnilog unit (Biolog). The
+                           results were analysed using the R package ‘<em>opm</em>’ (<a id="xref-ref-42-1" class="xref-bibr" href="#ref-42">Vaas <em>et al.</em>, 2012</a>). The curve parameter maximum height (A) was estimated for each substrate, differences were visualized using heat maps, and
+                           the data were discretized into negative, ambiguous and positive reactions using the built-in functions of ‘<em>opm</em>’ under default settings.
+                        </p>
+                        
+                     </div>
+                  </div>
+               </div>
+               <div class="section results" id="sec-11">
+                  <div class="section-nav"><a href="#sec-2" title="Methods" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-19" title="Discussion" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  <h2>Results</h2>
+                  
+                  <div id="sec-12" class="subsection">
+                     
+                     <h3>Profiles of the extrachromosomal elements</h3>
+                     
+                     <p id="p-27">The high-molecular-mass genomic DNA of different <span class="named-content genus" id="named-content-61"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains was separated with PFGE. A representative PFGE gel resolving linear DNA molecules in the size range from 23 to 533
+                        kb is shown in <a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1(a)</a>. In addition to the chromosomes (<a id="xref-fig-1-2" class="xref-fig" href="#F1">Fig. 1a</a>, Chr) a distinct number of extrachromosomal bands was revealed for each of the strains CIP 105210, DSM 17395, DSM 24588 and
+                        DSM 16374<sup>T</sup>. To determine the conformation of the detected extrachromosomal DNA (ccc versus linear; <a id="xref-ref-30-3" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em>, 2010</a>; <a id="xref-ref-33-2" class="xref-bibr" href="#ref-33">Römling <em>et al.</em>, 1996</a>), we varied the PFGE conditions (PFGE parameter set A and B) in different gel runs. Using PFGE parameter set A, the fuzzy,
+                        faint bands within the lanes of strains CIP 105210 and DSM 17395 (<a id="xref-fig-1-3" class="xref-fig" href="#F1">Fig. 1a</a>, marked a, b and c, respectively) ran at approximately 319 (a) and 380 (b, c) kb (<a id="xref-fig-1-4" class="xref-fig" href="#F1">Fig. 1a</a>). With PFGE parameter set B (data not shown) band (a) ran at 184 kb and bands (b) and (c) ran at approximately 210 kb indicating
+                        that the respective bands migrated independently of the PFGE parameters applied. From this anomalous migration behaviour we
+                        concluded that the inherent DNA had a circular conformation. The sizes of the detected ccc DNA were estimated as 66 (a) and
+                        79 (b, c) kb by conventional electrophoresis using the BAC Tracker as ccc size marker (data not shown). As these sizes were
+                        close to those estimated for the linearized plasmids of 64 and 77 kb in <span class="named-content genus" id="named-content-62"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain CIP 105210 and 75 kb in strain DSM 17395 (see below), it is most likely that they represent the same plasmids in different
+                        conformations.
+                     </p>
+                     
+                     <div id="F1" class="fig pos-float type-figure  odd">
+                        <div class="fig-inline"><a href="4340/F1.expansion.html"><img alt="Fig. 1. " src="4340/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                 <li><a href="4340/F1.expansion.html">In this window</a></li>
+                                 <li><a class="in-nw" href="4340/F1.expansion.html">In a new window</a></li>
+                              </ul>
+                              <ul class="fig-services">
+                                 <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F1">Download as PowerPoint Slide</a></li>
+                              </ul>
+                           </div>
+                        </div>
+                        <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                           
+                           <p id="p-28" class="first-child">(a) PFGE plasmid profiles of the <span class="named-content genus" id="named-content-63"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                    href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup>, DSM 17395, DSM 24588 and DSM 16374<sup>T</sup> based on uncut high-molecular-mass genomic DNA. (b) Calculated plasmid sizes as mean values taken from at least two different
+                              gel runs. The PFGE conditions were: 1 % (w/v) agarose gel with pulse times of 1 to 48 s for 24 h at 200 V (6 V cm<sup>−1</sup>). Chr, chromosomal DNA; λ, lambda phage concatemers as molecular-mass PFGE markers (New England Biolabs); li, linear. <sup>(*)</sup>, The two largest plasmids (linearized forms) of <span class="named-content genus" id="named-content-64"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                    href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup> and DSM 17395 migrated about the same distance in the gel and thus seemed to have an identical size. In contrast, both bands
+                              could be clearly distinguished by their size in other PFGE runs (data not shown) using different DNA sample preparations.
+                              DNA mobility is largely influenced by the DNA concentration of the sample. The observed discrepancy can thus be explained
+                              by the relatively high DNA concentration in CIP 105210<sup>T</sup> (compared to DSM 17395<sup>T</sup>), which retards band migration (<a id="xref-ref-33-3" class="xref-bibr" href="#ref-33">Römling <em>et al.</em>, 1996</a>). <sup>(†) (‡)</sup>, The PFGE-based plasmid size estimations of 75 and 63 kb of DSM 17395 correspond to the plasmid sizes of 78 and 65 kb, respectively,
+                              determined by genome sequencing (<a id="xref-ref-40-3" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>; NC_018287.1, NC_018288.1). <sup>(§)</sup>, The 36 kb plasmid of <span class="named-content species" id="named-content-65"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                    href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup> had a very low fluorescence intensity and is thus hardly visible on the gel image. ++, The 77 kb band of strain CIP 105210<sup>T</sup> showed increased fluorescence intensity and presumably represents a double band (plasmid duplet).
+                           </p>
+                           
+                           <div class="sb-div caption-clear"></div>
+                        </div>
+                     </div>
+                     
+                     <p id="p-29">By contrast, the sharp bands between 23 kb and 262 kb were separated strictly in accordance with their size when PFGE parameter
+                        sets A and B were used. They were thus assumed to be linear (li, <a id="xref-fig-1-5" class="xref-fig" href="#F1">Fig. 1a</a>), most probably originating from randomly linearized ccc plasmids (<a id="xref-ref-30-4" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em>, 2010</a>).
+                     </p>
+                     
+                     <p id="p-30">Regarding the linearized plasmid fraction of the <span class="named-content genus" id="named-content-66"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, which was very well suited to determine the plasmid complement of the strains and their sizes (<a id="xref-ref-30-5" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em>, 2010</a>), seven extrachromosomal replicons were evident in <span class="named-content species" id="named-content-67"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                              href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210, four in <span class="named-content species" id="named-content-68"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                              href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> and three in the strains DSM 17395 and DSM 24588. The estimated sizes of the detected plasmids (17 altogether) ranged from
+                        36 to 262 kb (<a id="xref-fig-1-6" class="xref-fig" href="#F1">Fig. 1b</a>). They were all different, but their size distribution in the individual strains showed some similarity, i.e. all <span class="named-content genus" id="named-content-69"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains have one large plasmid (262, 253, 239 and 227 kb in strains DSM 17395, CIP 105210, DSM 24588 and DSM 16374<sup>T</sup>, respectively) and two or three smaller ones in the size range between 63 and 77 kb. Our PFGE analysis thus indicated that
+                        the <span class="named-content genus" id="named-content-70"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210 and DSM 17395 – both deposited as type strain of <span class="named-content species" id="named-content-71"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter gallaeciensis"
+                              href="doi:10.1601/nm.9798"><em>Phaeobacter gallaeciensis</em></a></span> – are not identical.
+                     </p>
+                     
+                  </div>
+                  <div id="sec-13" class="subsection">
+                     
+                     <h3>Classification of the <span class="named-content genus" id="named-content-72"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains using 16S rRNA gene sequence, MALDI-TOF MS protein and 16S–23S rRNA gene ITS analyses
+                     </h3>
+                     
+                     <div id="sec-14" class="subsection">
+                        
+                        <h4>16S rRNA gene sequence analysis.</h4>
+                        
+                        <p id="p-31">We re-evaluated the phylogenetic relationships of the <span class="named-content genus" id="named-content-73"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains and therefore resequenced the PCR-amplified 16S rRNA genes of strains DSM 17395, DSM 16374<sup>T</sup> and CIP 105210. In the phylogenetic tree inferred from 16S rRNA gene sequences of representative members of the genus <span class="named-content genus" id="named-content-74"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span>, as well as strains DSM 24588 ( = 2.10), ANG1 and LSS9, for which finished or draft genome sequences exist (<a id="xref-ref-9-2" class="xref-bibr" href="#ref-9">Collins &amp; Nyholm, 2011</a>; <a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Fernandes <em>et al.</em>, 2011</a>; <a id="xref-ref-40-4" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>; <a id="xref-fig-2-1" class="xref-fig" href="#F2">Fig. 2</a>), the <span class="named-content genus" id="named-content-75"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 17395, DSM 24588 ( = 2.10), DSM 16374<sup>T</sup> and CIP 105210 clustered together (<span class="named-content species" id="named-content-76"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>/<span class="named-content species" id="named-content-77"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> cluster) and were well separated from the <span class="named-content species" id="named-content-78"><a class="namesforlife" rel="namesforlife-name" title="P. arcticus"
+                                 href="doi:10.1601/nm.14057"><em>P. arcticus</em></a></span><em>/</em><span class="named-content species" id="named-content-79"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                                 href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> lineage and the branch formed by <span class="named-content species" id="named-content-80"><a class="namesforlife" rel="namesforlife-name" title="P. caeruleus"
+                                 href="doi:10.1601/nm.14301"><em>P. caeruleus</em></a></span>, <span class="named-content species" id="named-content-81"><em>Phaeobacter</em> sp.</span> ANG1 and <span class="named-content species" id="named-content-82"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                                 href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> (16S rRNA gene identity ≥97.8 %). Within the <span class="named-content species" id="named-content-83"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>/<span class="named-content species" id="named-content-84"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> cluster, the 16S rRNA gene of strain CIP 105210 (KC176239) grouped together with the originally deposited BS107<sup>T</sup> sequence (Y13244), exhibiting 72 % and 91 % support from MP and ML bootstrapping, respectively. The 16S rRNA gene sequences
+                           of the <span class="named-content genus" id="named-content-85"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 17395, DSM 24588 and DSM 16374<sup>T</sup> (KC176240) were identical and differed by four bases from the <span class="named-content species" id="named-content-86"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210 sequence KC176239 (16S rRNA gene identity of 99.7 %; see below).
+                        </p>
+                        
+                        <div id="F2" class="fig pos-float type-figure  odd">
+                           <div class="fig-inline"><a href="4340/F2.expansion.html"><img alt="Fig. 2. " src="4340/F2.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                    <li><a href="4340/F2.expansion.html">In this window</a></li>
+                                    <li><a class="in-nw" href="4340/F2.expansion.html">In a new window</a></li>
+                                 </ul>
+                                 <ul class="fig-services">
+                                    <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F2">Download as PowerPoint Slide</a></li>
+                                 </ul>
+                              </div>
+                           </div>
+                           <div class="fig-caption"><span class="fig-label">Fig. 2. </span> 
+                              
+                              <p id="p-32" class="first-child">Midpoint-rooted MP phylogeny inferred from 16S rRNA gene sequences of <span class="named-content genus" id="named-content-87"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                       href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains closely related to <span class="named-content species" id="named-content-88"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                       href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> and <span class="named-content species" id="named-content-89"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                       href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>. Branches are scaled in terms of the minimum number of substitutions (using <span class="sc">deltran</span> optimization; <a id="xref-ref-38-2" class="xref-bibr" href="#ref-38">Stamatakis <em>et al.</em>, 2008</a>). Numbers above branches are support values from MP (left) and ML (right) bootstrapping. Original designation of strains
+                                 that are deposited at culture collections is indicated in parentheses; square brackets give the respective accession number.
+                              </p>
+                              
+                              <div class="sb-div caption-clear"></div>
+                           </div>
+                        </div>
+                        
+                        <p id="p-33">Neither the 16S rRNA gene sequence of <span class="named-content species" id="named-content-90"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210 (KC176239) nor the sequence of <span class="named-content species" id="named-content-91"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> (KC176240) was exactly identical to that of the original deposit, <span class="named-content species" id="named-content-92"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup> (Y13244) or <span class="named-content species" id="named-content-93"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> T5<sup>T</sup> (AY177712), respectively (<a id="xref-fig-2-2" class="xref-fig" href="#F2">Fig. 2</a>, Fig. S1 available in IJSEM Online). More precisely, the 16S rRNA gene sequences of the alleged <span class="named-content species" id="named-content-94"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> type strains differed at the base positions (<span class="named-content species" id="named-content-95"><a class="namesforlife" rel="namesforlife-name" title="Escherichia coli"
+                                 href="doi:10.1601/nm.3093"><em>Escherichia coli</em></a></span> numbering; <a id="xref-ref-19-1" class="xref-bibr" href="#ref-19">Gutell <em>et al.</em>, 1994</a>) 47, 260, 777, 928, 930, 1030, 1210 and 1387 (Fig. S1; Table S1); and those of the alleged <span class="named-content species" id="named-content-96"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> type strains at the positions 29, 1210, 1387, 1436, 1459, 1466 and 1480 (Fig. S1; Table S2). We assessed in detail whether
+                           these discrepancies could be caused by sequencing errors, as is already indicated by the long-terminal branches leading to
+                           BS107<sup>T</sup> and T5<sup>T</sup> (<a id="xref-fig-2-3" class="xref-fig" href="#F2">Fig. 2</a>). We thus compared the respective sequences with the bacterial 16S rRNA variability map (<a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Baker <em>et al.</em>, 2003</a>) and/or the 16S rRNA secondary structure model (<a id="xref-ref-19-2" class="xref-bibr" href="#ref-19">Gutell <em>et al.</em>, 1994</a>) and showed that the 16S rRNA gene sequences provided in this study were all in accordance with bases categorized as conserved
+                           by <a id="xref-ref-1-2" class="xref-bibr" href="#ref-1">Baker <em>et al.</em> (2003)</a> or the proposed rRNA secondary structure (Tables S1 and S2), whereas the previously determined 16S rRNA gene sequences Y13244
+                           and AY177712 were flawed.
+                        </p>
+                        
+                        <p id="p-34">Furthermore, we examined whether the four differences in the 16S rRNA gene sequences of <span class="named-content species" id="named-content-97"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210 (KC176239) and <span class="named-content species" id="named-content-98"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> (KC176240) were genuine. They were localized at the base positions 614 (<span class="named-content species" id="named-content-99"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>: G; <span class="named-content species" id="named-content-100"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>: A) and 626 (<span class="named-content species" id="named-content-101"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>: C; <span class="named-content species" id="named-content-102"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>: U) within the 16S rRNA variable region V4 (<a id="xref-ref-1-3" class="xref-bibr" href="#ref-1">Baker <em>et al.</em>, 2003</a>) and at the positions 835 (<span class="named-content species" id="named-content-103"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>: G; <span class="named-content species" id="named-content-104"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>: A) and 851 (<span class="named-content species" id="named-content-105"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>: C; <span class="named-content species" id="named-content-106"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>: U) within the variable V5 region, respectively (<span class="named-content species" id="named-content-107"><a class="namesforlife" rel="namesforlife-name" title="E. coli"
+                                 href="doi:10.1601/nm.3093"><em>E. coli</em></a></span> numbering; Fig. S1; Table S3). Comparison with the secondary 16S rRNA structure model (<a id="xref-ref-19-3" class="xref-bibr" href="#ref-19">Gutell <em>et al.</em>, 1994</a>) and a simulation of the rRNA folding using the Mfold web server (<a id="xref-ref-45-1" class="xref-bibr" href="#ref-45">Zuker, 2003</a>) indicated that bases 614 and 626 paired in the variable region V4 stem–loop (<a id="xref-fig-3-1" class="xref-fig" href="#F3">Fig. 3</a>); similarly, bases 835 and 851 matched in the V5 stem–loop (Fig. S2). We thus assumed that the present transitions of G and
+                           C in <span class="named-content species" id="named-content-108"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> to A and U in <span class="named-content species" id="named-content-109"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>, respectively, reflect genuine and characteristic mutations in the 16S rRNA genes of these species. Considering these bases,
+                           the 16S rRNA gene sequence of <span class="named-content genus" id="named-content-110"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain CIP 105210 resembled the original one of BS107<sup>T</sup> (Y13244), which would indicate that strain CIP 105210 is the type strain of <span class="named-content species" id="named-content-111"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>.
+                        </p>
+                        
+                        <div id="F3" class="fig pos-float type-figure  odd">
+                           <div class="fig-inline"><a href="4340/F3.expansion.html"><img alt="Fig. 3. " src="4340/F3.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                    <li><a href="4340/F3.expansion.html">In this window</a></li>
+                                    <li><a class="in-nw" href="4340/F3.expansion.html">In a new window</a></li>
+                                 </ul>
+                                 <ul class="fig-services">
+                                    <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F3">Download as PowerPoint Slide</a></li>
+                                 </ul>
+                              </div>
+                           </div>
+                           <div class="fig-caption"><span class="fig-label">Fig. 3. </span> 
+                              
+                              <p id="p-35" class="first-child">Secondary structure of the 16S rRNA variable region V4 of <span class="named-content species" id="named-content-112"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                       href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup> (a) and <span class="named-content species" id="named-content-113"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                       href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 17395 (b) demonstrating transition of bases 614 and 626 (<span class="named-content species" id="named-content-114"><a class="namesforlife" rel="namesforlife-name" title="E. coli"
+                                       href="doi:10.1601/nm.3093"><em>E. coli</em></a></span> numbering; bases 529 and 541 according to the CIP 105210<sup>T</sup> numbering). RNA folding was simulated using the Mfold web server for nucleic acid folding and hybridization prediction (<a id="xref-ref-45-2" class="xref-bibr" href="#ref-45">Zuker, 2003</a>; <a href="http://mfold.rna.albany.edu/?q=mfold/RNA-Folding-Form">http://mfold.rna.albany.edu/?q=mfold/RNA-Folding-Form</a>).
+                              </p>
+                              
+                              <div class="sb-div caption-clear"></div>
+                           </div>
+                        </div>
+                     </div>
+                     <div id="sec-15" class="subsection">
+                        
+                        <h4>MALDI-TOF MS analysis.</h4>
+                        
+                        <p id="p-36">In the MALDI-TOF MS dendrogram (<a id="xref-fig-4-1" class="xref-fig" href="#F4">Fig. 4</a>), the <span class="named-content genus" id="named-content-115"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 16374<sup>T</sup>, DSM 24588 and DSM 17395 not only formed a cluster but were virtually indistinguishable from each other. Strain CIP 105210
+                           appeared as the sister group of those three strains, whereas <span class="named-content species" id="named-content-116"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                                 href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> and <span class="named-content species" id="named-content-117"><a class="namesforlife" rel="namesforlife-name" title="P. caeruleus"
+                                 href="doi:10.1601/nm.14301"><em>P. caeruleus</em></a></span> as well as <span class="named-content species" id="named-content-118"><a class="namesforlife" rel="namesforlife-name" title="P. arcticus"
+                                 href="doi:10.1601/nm.14057"><em>P. arcticus</em></a></span> and <span class="named-content species" id="named-content-119"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                                 href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> were well set apart.
+                        </p>
+                        
+                        <div id="F4" class="fig pos-float type-figure  odd">
+                           <div class="fig-inline"><a href="4340/F4.expansion.html"><img alt="Fig. 4. " src="4340/F4.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                    <li><a href="4340/F4.expansion.html">In this window</a></li>
+                                    <li><a class="in-nw" href="4340/F4.expansion.html">In a new window</a></li>
+                                 </ul>
+                                 <ul class="fig-services">
+                                    <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F4">Download as PowerPoint Slide</a></li>
+                                 </ul>
+                              </div>
+                           </div>
+                           <div class="fig-caption"><span class="fig-label">Fig. 4. </span> 
+                              
+                              <p id="p-37" class="first-child">Score-oriented dendrogram showing the similarity of MALDI-TOF mass spectra from cell extracts of selected <span class="named-content genus" id="named-content-120"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                       href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains. The dendrogram was generated by the BioTyper software (version 3.0; Bruker Daltonics).
+                              </p>
+                              
+                              <div class="sb-div caption-clear"></div>
+                           </div>
+                        </div>
+                     </div>
+                     <div id="sec-16" class="subsection">
+                        
+                        <h4>ITS analysis.</h4>
+                        
+                        <p id="p-38">A comparable picture was observed in the ITS analysis (<a id="xref-fig-5-1" class="xref-fig" href="#F5">Fig. 5</a>). <span class="named-content genus" id="named-content-121"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain DSM 17395 appeared as sister strain of <span class="named-content species" id="named-content-122"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> with 93 % support under ML and 99 % support under MP. The sister-group relationship of these and strain DSM 24588 was supported
+                           with 70 % and 88 % bootstrap values, respectively, to the exclusion of <span class="named-content species" id="named-content-123"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210. <span class="named-content species" id="named-content-124"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter sp."
+                                 href="doi:10.1601/nm.17585"><em>Phaeobacter</em> sp.</a></span> ANG1 was placed in a distinct cluster together with the type strains of <span class="named-content species" id="named-content-125"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                                 href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> and <span class="named-content species" id="named-content-126"><a class="namesforlife" rel="namesforlife-name" title="P. caeruleus"
+                                 href="doi:10.1601/nm.14301"><em>P. caeruleus</em></a></span> (100 % support).
+                        </p>
+                        
+                        <div id="F5" class="fig pos-float type-figure  odd">
+                           <div class="fig-inline"><a href="4340/F5.expansion.html"><img alt="Fig. 5. " src="4340/F5.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                    <li><a href="4340/F5.expansion.html">In this window</a></li>
+                                    <li><a class="in-nw" href="4340/F5.expansion.html">In a new window</a></li>
+                                 </ul>
+                                 <ul class="fig-services">
+                                    <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F5">Download as PowerPoint Slide</a></li>
+                                 </ul>
+                              </div>
+                           </div>
+                           <div class="fig-caption"><span class="fig-label">Fig. 5. </span> 
+                              
+                              <p id="p-39" class="first-child">Midpoint-rooted ML phylogeny inferred from ITS sequences of <span class="named-content genus" id="named-content-127"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                       href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains closely related to <span class="named-content species" id="named-content-128"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                       href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> and <span class="named-content species" id="named-content-129"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                       href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>. Branches are scaled in terms of the expected number of substitutions per site. Numbers above branches are support values
+                                 from ML (left) and MP (right) bootstrapping. Original designation of strains that are deposited at culture collections is
+                                 indicated in parentheses; square brackets give the respective accession number.
+                              </p>
+                              
+                              <div class="sb-div caption-clear"></div>
+                           </div>
+                        </div>
+                     </div>
+                  </div>
+                  <div id="sec-17" class="subsection">
+                     
+                     <h3>DNA–DNA hybridization.</h3>
+                     
+                     <p id="p-40">In contrast to the highly similar genomic DNA between the strains DSM 17395 and DSM 16374<sup>T</sup> (82 %) as well as between the strains DSM 16374<sup>T</sup> and DSM 24588 (83 %), strain CIP 105210 shared only 62 % and 63 % DNA–DNA relatedness to the strains DSM 17395 and DSM 16374<sup>T</sup>, respectively (<a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>). This is below the threshold of 70 % recommended by <a id="xref-ref-43-1" class="xref-bibr" href="#ref-43">Wayne <em>et al.</em> (1987)</a> hence indicating the status of strain CIP 105210 in a separate species. Conversely, the values clearly above 70 % indicate
+                        that strains DSM 17395, DSM 16374<sup>T</sup> and DSM 24588 belong to the same species.
+                     </p>
+                     
+                     <div id="T1" class="table pos-float">
+                        <div class="table-inline">
+                           <div class="callout"><span>View this table:</span><ul class="callout-links">
+                                 <li><a href="4340/T1.expansion.html">In this window</a></li>
+                                 <li><a class="in-nw" href="4340/T1.expansion.html">In a new window</a></li>
+                              </ul>
+                           </div>
+                        </div>
+                        <div class="table-caption"><span class="table-label">Table 1. </span> 
+                           <span class="caption-title">Mean DNA–DNA similarity values (<em>n</em> = 2) between the <span class="named-content genus" id="named-content-130"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                    href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup>, DSM 17395, DSM 16374<sup>T</sup> and DSM 24588</span>
+                           
+                           <div class="sb-div caption-clear"></div>
+                        </div>
+                     </div>
+                  </div>
+                  <div id="sec-18" class="subsection">
+                     
+                     <h3>Growth, hydrolysis and PM experiments</h3>
+                     
+                     <p id="p-42">The growth and hydrolysis experiments for <span class="named-content genus" id="named-content-132"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210 and DSM 17395 could only partially reproduce those conducted by <a id="xref-ref-34-5" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em> (1998)</a> (Table S4). The results for strain CIP 105210 differed from all other series of measurements by growth of this strain on
+                        <span class="sc">l</span>-arabinose and hydrolysis of Tween 80. Strain DSM 17395 showed no specific characteristics, but it – as well as CIP 105210
+                        – differed from strain BS107<sup>T</sup> (<a id="xref-ref-34-6" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em>, 1998</a>) as they grew on serine (like T5<sup>T</sup>; <a id="xref-ref-25-4" class="xref-bibr" href="#ref-25">Martens <em>et al.</em>, 2006</a>) and showed slow growth on <span class="sc">l</span>-rhamnose and 2-ketoglutarate (Table S4). The overall number of specific differences of all other strains to T5<sup>T</sup> (<a id="xref-ref-25-5" class="xref-bibr" href="#ref-25">Martens <em>et al.</em>, 2006</a>) was four (growth on citrate, glucosamine and on MB at 4 °C or 37 °C).
+                     </p>
+                     
+                     <p id="p-43">In contrast, the PM experiments, which are more sensitive than bacterial growth tests because they monitor substrate respiration
+                        (<a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Bochner <em>et al.</em>, 2001</a>), yielded significant physiological differences between all four tested <span class="named-content genus" id="named-content-133"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, DSM 24588, DSM 16374<sup>T</sup>, DSM 17395 and CIP 105210 (Figs S3 and S4). The physiological similarity between strains CIP 105210 and DSM 17395 was high,
+                        but the differences between the two were clearly reproducible. According to the discretization approach implemented in ‘<em>opm</em>’ (<a id="xref-ref-42-2" class="xref-bibr" href="#ref-42">Vaas <em>et al.</em>, 2012</a>), respiration on tyramine (PM01-H04; blue box in Fig. S3) was positive in DSM 17395 and DSM 16374<sup>T</sup>, weak in DSM 24588 but negative
+                        in CIP 105210. Respiration on butyrate (PM02A-D12; Fig. S4) was positive in CIP 105210 and DSM 24588, weak in DSM 16374<sup>T</sup>, but negative in DSM 17395.
+                     </p>
+                     
+                     <p id="p-44">Regarding the common subset of growth or hydrolysis experiments on the one hand and PM experiments on the other hand, the
+                        results were identical with a few exceptions. Expectedly, no substrate was detected on which growth (or hydrolysis) was measurable
+                        but respiration was not observed, whereas on some substrates respiration was detected by PM analysis even though these substrates
+                        sustained no growth. Accordingly, a weak PM reaction on <span class="sc">l</span>-arabinose (PM01-A02) and a positive PM reaction on citrate (PM01-F02) were observed for all four tested strains. A positive
+                        PM reaction to Tween 80 (PM01-E05) was observed for strains DSM 24588 and CIP 105210, whereas strains DSM 17395 and DSM 16374<sup>T</sup> showed a weak reaction (compare red boxes in Fig. S3 with Table S4).
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section discussion" id="sec-19">
+                  <div class="section-nav"><a href="#sec-11" title="Results" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  <h2>Discussion</h2>
+                  
+                  <p id="p-45">According to the PFGE profiles of the extrachromosomal elements – which are largely supported by the complete genome sequences
+                     of the <span class="named-content genus" id="named-content-134"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 17395, DSM 24588 (<a id="xref-ref-40-5" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>), DSM 16374<sup>T</sup> (Dogs, M. and others, unpublished) and CIP 105210 (Frank, O. and others, unpublished) – DDH similarities, 16S rRNA gene sequence
+                     analysis, 16S–23S rRNA gene ITS sequence analysis, MALDI-TOF MS protein analysis, and high-throughput phenotyping using the
+                     PM technology, the <span class="named-content genus" id="named-content-135"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210 and DSM 17395, both supposed to be deposits of the type strain of <span class="named-content species" id="named-content-136"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup>, are biologically clearly distinct. ITS sequence and MALDI-TOF analysis additionally showed that DSM 17395 (and DSM 24588)
+                     group together with <span class="named-content species" id="named-content-137"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> to the exclusion of CIP 105210. As confirmed by DDH (≥76 % similarity), DSM 16374<sup>T</sup>, DSM 17395 and DSM 24588 are conspecific, i.e. all belong to the species <span class="named-content species" id="named-content-138"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>. Analysis of 16S rRNA gene sequences was in accordance with this finding, too, because the sequences of these strains were
+                     identical (if the resequenced 16S rRNA gene sequence of DSM 16374<sup>T</sup> was considered). Our sequence analyses confirmed the finding of <a id="xref-ref-40-6" class="xref-bibr" href="#ref-40">Thole <em>et al.</em> (2012)</a> that the <span class="named-content species" id="named-content-139"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter sp."
+                           href="doi:10.1601/nm.17585"><em>Phaeobacter</em> sp.</a></span> ANG1 does not belong to the species <span class="named-content species" id="named-content-140"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>.
+                  </p>
+                  
+                  <p id="p-46">Because DSM 17395 must hence be excluded from the species <span class="named-content species" id="named-content-141"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>, the question arises whether the alternative type strain deposit, CIP 105210, represents <span class="named-content species" id="named-content-142"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup>. DDH analysis (&lt;70 % similarity) indicates that CIP 105210 is not conspecific with <span class="named-content species" id="named-content-143"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>. Analysis of growth behaviours and enzymic activities could not fully reproduce the findings of <a id="xref-ref-34-7" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em> (1998)</a>, but given the overall low number of characters tested, the low number of known differences to the type strain of the sister
+                     species, <span class="named-content species" id="named-content-144"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>, and the well-known difficulties in reproducing physiological tests in distinct laboratories in general, the significance
+                     of these discrepancies is unclear. Essentially, based on the newly generated CIP 105210 16S rRNA gene sequence that is identical
+                     to the one from BS107<sup>T</sup>, except for deviations that were likely to be sequencing errors, we could clearly document the type strain status of <span class="named-content species" id="named-content-145"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup>. As the strains CIP 105210<sup>T</sup> and DSM 17395 have been independently deposited at the CIP and the DSMZ, respectively, it is the most probable explanation
+                     that the latter strain has been mixed up prior to deposition.
+                  </p>
+                  
+                  <p id="p-47">Research laboratories are usually not equipped with sufficient resources to verify the biological identity of their cultures.
+                     Moreover, culture collections have to cope with the deposition of interchanged or contaminated strains and the quality of
+                     incoming material will presumably even deteriorate due to the decline of basic microbiological methodology in the era of molecular
+                     biology. Problems are expected particularly if confusion with closely related strains has occurred, as in the case of DSM
+                     17395, which apparently belongs to the sister species of the correct strain. Hence, it is advisable that researchers working
+                     on a certain strain exactly denote the source from which it was received. Providing the accession numbers of culture-collection
+                     deposits (such as ‘CIP 105210<sup>T</sup>’ or ‘DSM 17395’) should thus be preferred over just stating the original strain designator (such as ‘BS107<sup>T</sup>’) irrespective of the source from which the strain has been received. In any case, with respect to cultivatable microbes,
+                     only strains with a demonstrable history should be considered in serious research.
+                  </p>
+                  
+                  <p id="p-48">The three homologous plasmids of the completely sequenced <span class="named-content species" id="named-content-146"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> strains DSM 17395 and DSM 24588 exhibit a long-range synteny (<a id="xref-ref-40-7" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>), but several indels (insertions/deletions) are responsible for the deviating plasmid sizes [262 versus 238 kb (DnaA-like
+                     replicon; <a id="xref-ref-28-2" class="xref-bibr" href="#ref-28">Petersen, 2011</a>), 75(78) versus 94 kb (RepB-I), 65(63) versus 70 kb (RepA-I); <a id="xref-fig-1-7" class="xref-fig" href="#F1">Fig. 1</a>]. Homologues of these replicons may also be present in the sister species <span class="named-content species" id="named-content-147"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup>, e.g. represented by the 253, 77 and 64 kb replicons. However, the conspicuously different plasmid profiles in <span class="named-content species" id="named-content-148"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> and <span class="named-content species" id="named-content-149"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> (<a id="xref-fig-1-8" class="xref-fig" href="#F1">Fig. 1</a>) may reflect horizontal recruitment of four additional replicons in <span class="named-content species" id="named-content-150"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup>. The same explanation is supported by the presence of a type IV secretion system on the fourth 86 kb plasmid of the <span class="named-content species" id="named-content-151"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> type strain DSM 16374<sup>T</sup> (Dogs, M. and others, unpublished), which may be responsible for plasmid mobilization via conjugation (<a id="xref-ref-29-1" class="xref-bibr" href="#ref-29">Petersen <em>et al.</em>, 2013</a>). In the near future, genome sequencing and comparative genomics of more distantly related strains, such as <span class="named-content species" id="named-content-152"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter arcticus"
+                           href="doi:10.1601/nm.14057"><em>Phaeobacter arcticus</em></a></span>, will help to reveal the extent of horizontal exchange and vertical evolution within the <span class="named-content genus" id="named-content-153"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter"
+                           href="doi:10.1601/nm.1134"><em>Roseobacter</em></a></span> clade.
+                  </p>
+                  
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-19" title="Discussion" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-49">This work, including a PhD stipend for N. B., was supported by the Transregional Collaborative Research Center ‘<em>Roseobacter</em>’ of the Deutsche Forschungsgemeinschaft (Transregio TRR 51) and the MICROME project, EU Framework Program 7 Collaborative
+                     Project (222886-2). We thank Victoria Michael, Bettina Sträubler and Ulrike Steiner for excellent technical assistance, Brian
+                     Tindall and Sabine Gronow for their helpful discussions, as well as the two anonymous reviewers for their constructive criticism.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.1"
+                             data-doi="10.1016/j.mimet.2003.08.009">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baker</span>,  <span class="cit-name-given-names">G. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smith</span>,  <span class="cit-name-given-names">J. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cowan</span>,  <span class="cit-name-given-names">D. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title">Review and re-analysis of domain-specific 16S primers</span>. <abbr class="cit-jnl-abbrev">J Microbiol Methods</abbr> <span class="cit-vol">55</span>, <span class="cit-fpage">541</span>–<span class="cit-lpage">555</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.mimet.2003.08.009</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14607398</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.mimet.2003.08.009&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=14607398&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Review%20and%20re-analysis%20of%20domain-specific%2016S%20primers&amp;author=G.%20C.%20Baker&amp;author=J.%20J.%20Smith&amp;author=D.%20A.%20Cowan&amp;publication_year=2003&amp;journal=J%20Microbiol%20Methods&amp;volume=55&amp;pages=541-555&amp;doi=10.1016%2Fj.mimet.2003.08.009&amp;pmid=14607398">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.2"
+                             data-doi="10.1128/JB.05818-11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berger</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Neumann</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schulz</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Tropodithietic acid production in <em>Phaeobacter gallaeciensis</em> is regulated by <em>N</em>-acyl homoserine lactone-mediated quorum sensing</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">193</span>, <span class="cit-fpage">6576</span>–<span class="cit-lpage">6585</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JB.05818-11</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21949069</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=193/23/6576"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.3"
+                             data-doi="10.1128/AEM.07657-11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berger</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brock</span>,  <span class="cit-name-given-names">N. L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Liesegang</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dogs</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Preuth</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dickschat</span>,  <span class="cit-name-given-names">J. S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Genetic analysis of the upper phenylacetate catabolic pathway in the production of tropodithietic acid by <em>Phaeobacter gallaeciensis</em></span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">78</span>, <span class="cit-fpage">3539</span>–<span class="cit-lpage">3551</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.07657-11</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22407685</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=78/10/3539"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.4"
+                             data-doi="10.1111/j.1574-6976.2008.00149.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bochner</span>,  <span class="cit-name-given-names">B. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Global phenotypic characterization of bacteria</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Rev</abbr> <span class="cit-vol">33</span>, <span class="cit-fpage">191</span>–<span class="cit-lpage">205</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6976.2008.00149.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19054113</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=femsre&amp;resid=33/1/191"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.5"
+                             data-doi="10.1101/gr.186501">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bochner</span>,  <span class="cit-name-given-names">B. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gadzinski</span>,  <span class="cit-name-given-names">P.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Panomitros</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2001</span><strong>).</strong> <span class="cit-article-title">Phenotype microarrays for high-throughput phenotypic testing and assay of gene function</span>. <abbr class="cit-jnl-abbrev">Genome Res</abbr> <span class="cit-vol">11</span>, <span class="cit-fpage">1246</span>–<span class="cit-lpage">1255</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1101/gr.186501</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>11435407</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=genome&amp;resid=11/7/1246"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.6"
+                             data-doi="10.1128/AEM.70.4.2560-2565.2003">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bach</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Heidorn</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Liang</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schlingloff</span>,  <span class="cit-name-given-names">A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Antibiotic production by a <em>Roseobacter</em> clade-affiliated species from the German Wadden Sea and its antagonistic effects on indigenous isolates</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">70</span>, <span class="cit-fpage">2560</span>–<span class="cit-lpage">2565</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.70.4.2560-2565.2003</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15066861</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=70/4/2560"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.7"
+                             data-doi="10.1128/AEM.02238-06">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bruhn</span>,  <span class="cit-name-given-names">J. B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gram</span>,  <span class="cit-name-given-names">L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Belas</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Production of antibacterial compounds and biofilm formation by <em>Roseobacter</em> species are influenced by culture conditions</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">73</span>, <span class="cit-fpage">442</span>–<span class="cit-lpage">450</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.02238-06</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17098910</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=73/2/442"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.8"
+                             data-doi="10.1016/0003-2697(77)90720-5">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cashion</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Holder-Franklin</span>,  <span class="cit-name-given-names">M. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McCully</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Franklin</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1977</span><strong>).</strong> <span class="cit-article-title">A rapid method for the base ratio determination of bacterial DNA</span>. <abbr class="cit-jnl-abbrev">Anal Biochem</abbr> <span class="cit-vol">81</span>, <span class="cit-fpage">461</span>–<span class="cit-lpage">466</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/0003-2697(77)90720-5</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>907108</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/0003-2697(77)90720-5&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=907108&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20rapid%20method%20for%20the%20base%20ratio%20determination%20of%20bacterial%20DNA&amp;author=P.%20Cashion&amp;author=M.%20A.%20Holder-Franklin&amp;author=J.%20McCully&amp;author=M.%20Franklin&amp;publication_year=1977&amp;journal=Anal%20Biochem&amp;volume=81&amp;pages=461-466&amp;doi=10.1016%2F0003-2697%2877%2990720-5&amp;pmid=907108">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.9"
+                             data-doi="10.1128/JB.05139-11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Collins</span>,  <span class="cit-name-given-names">A. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nyholm</span>,  <span class="cit-name-given-names">S. V.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Draft genome of <em>Phaeobacter gallaeciensis</em> ANG1, a dominant member of the accessory nidamental gland of <em>Euprymna scolopes</em></span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">193</span>, <span class="cit-fpage">3397</span>–<span class="cit-lpage">3398</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JB.05139-11</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21551313</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=193/13/3397"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.10"
+                             data-doi="10.1111/j.1432-1033.1970.tb00830.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">De Ley</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cattoir</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reynaerts</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1970</span><strong>).</strong> <span class="cit-article-title">The quantitative measurement of DNA hybridization from renaturation rates</span>. <abbr class="cit-jnl-abbrev">Eur J Biochem</abbr> <span class="cit-vol">12</span>, <span class="cit-fpage">133</span>–<span class="cit-lpage">142</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1432-1033.1970.tb00830.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4984993</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1432-1033.1970.tb00830.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=4984993&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20quantitative%20measurement%20of%20DNA%20hybridization%20from%20renaturation%20rates&amp;author=J.%20De%20Ley&amp;author=H.%20Cattoir&amp;author=A.%20Reynaerts&amp;publication_year=1970&amp;journal=Eur%20J%20Biochem&amp;volume=12&amp;pages=133-142&amp;doi=10.1111%2Fj.1432-1033.1970.tb00830.x&amp;pmid=4984993">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.11"
+                             data-doi="10.1002/cbic.200900668">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dickschat</span>,  <span class="cit-name-given-names">J. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zell</span>,  <span class="cit-name-given-names">C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brock</span>,  <span class="cit-name-given-names">N. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Pathways and substrate specificity of DMSP catabolism in marine bacteria of the <em>Roseobacter</em> clade</span>. <abbr class="cit-jnl-abbrev">ChemBioChem</abbr> <span class="cit-vol">11</span>, <span class="cit-fpage">417</span>–<span class="cit-lpage">425</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1002/cbic.200900668</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20043308</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1002/cbic.200900668&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20043308&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Pathways%20and%20substrate%20specificity%20of%20DMSP%20catabolism%20in%20marine%20bacteria%20of%20the%20Roseobacter%20clade&amp;author=J.%20S.%20Dickschat&amp;author=C.%20Zell&amp;author=N.%20L.%20Brock&amp;publication_year=2010&amp;journal=ChemBioChem&amp;volume=11&amp;pages=417-425&amp;doi=10.1002%2Fcbic.200900668&amp;pmid=20043308">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.12"
+                             data-doi="10.1086/282802">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Farris</span>,  <span class="cit-name-given-names">J. S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1972</span><strong>).</strong> <span class="cit-article-title">Estimating phylogenetic trees from distance matrices</span>. <abbr class="cit-jnl-abbrev">Am Nat</abbr> <span class="cit-vol">106</span>, <span class="cit-fpage">645</span>–<span class="cit-lpage">668</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1086/282802</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1086/282802&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Estimating%20phylogenetic%20trees%20from%20distance%20matrices&amp;author=J.%20S.%20Farris&amp;publication_year=1972&amp;journal=Am%20Nat&amp;volume=106&amp;pages=645-668&amp;doi=10.1086%2F282802">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.13"
+                             data-doi="10.1007/BF01734359">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Felsenstein</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1981</span><strong>).</strong> <span class="cit-article-title">Evolutionary trees from DNA sequences: a maximum likelihood approach</span>. <abbr class="cit-jnl-abbrev">J Mol Evol</abbr> <span class="cit-vol">17</span>, <span class="cit-fpage">368</span>–<span class="cit-lpage">376</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/BF01734359</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>7288891</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/BF01734359&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7288891&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Evolutionary%20trees%20from%20DNA%20sequences%3A%20a%20maximum%20likelihood%20approach&amp;author=J.%20Felsenstein&amp;publication_year=1981&amp;journal=J%20Mol%20Evol&amp;volume=17&amp;pages=368-376&amp;doi=10.1007%2FBF01734359&amp;pmid=7288891">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.14"
+                             data-doi="10.1371/journal.pone.0027387">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fernandes</span>,  <span class="cit-name-given-names">N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Case</span>,  <span class="cit-name-given-names">R. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Longford</span>,  <span class="cit-name-given-names">S. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Seyedsayamdost</span>,  <span class="cit-name-given-names">M. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Steinberg</span>,  <span class="cit-name-given-names">P. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kjelleberg</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thomas</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Genomes and virulence factors of novel bacterial pathogens causing bleaching disease in the marine red alga <em>Delisea pulchra</em></span>. <abbr class="cit-jnl-abbrev">PLoS ONE</abbr> <span class="cit-vol">6</span>, <span class="cit-fpage">e27387</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1371/journal.pone.0027387</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22162749</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1371/journal.pone.0027387&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=22162749&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genomes%20and%20virulence%20factors%20of%20novel%20bacterial%20pathogens%20causing%20bleaching%20disease%20in%20the%20marine%20red%20alga%20Delisea%20pulchra&amp;author=N.%20Fernandes&amp;author=R.%20J.%20Case&amp;author=S.%20R.%20Longford&amp;author=M.%20R.%20Seyedsayamdost&amp;author=P.%20D.%20Steinberg&amp;author=S.%20Kjelleberg&amp;author=T.%20Thomas&amp;publication_year=2011&amp;journal=PLoS%20ONE&amp;volume=6&amp;pages=e27387&amp;doi=10.1371%2Fjournal.pone.0027387&amp;pmid=22162749">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.15"
+                             data-doi="10.1093/sysbio/20.4.406">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fitch</span>,  <span class="cit-name-given-names">W. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1971</span><strong>).</strong> <span class="cit-article-title">Towards defining the course of evolution: minimal change for a specified tree topology</span>. <abbr class="cit-jnl-abbrev">Syst Zool</abbr> <span class="cit-vol">20</span>, <span class="cit-fpage">406</span>–<span class="cit-lpage">416</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.2307/2412116</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=sysbio&amp;resid=20/4/406"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.16"
+                             data-doi="10.1099/ijs.0.046128-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gaboyer</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ciobanu</span>,  <span class="cit-name-given-names">M.-C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Duthoit</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Le Romancer</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alain</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title"><em>Phaeobacter leonis</em> sp. nov., an alphaproteobacterium from Mediterranean Sea sediments</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">63</span>, <span class="cit-fpage">3301</span>–<span class="cit-lpage">3306</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.046128-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23475346</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=63/Pt_9/3301"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.17"
+                             data-doi="10.1128/AEM.02339-07">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Geng</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bruhn</span>,  <span class="cit-name-given-names">J. B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nielsen</span>,  <span class="cit-name-given-names">K. F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gram</span>,  <span class="cit-name-given-names">L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Belas</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Genetic dissection of tropodithietic acid biosynthesis by marine roseobacters</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">74</span>, <span class="cit-fpage">1535</span>–<span class="cit-lpage">1545</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.02339-07</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18192410</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=74/5/1535"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.18"
+                             data-doi="10.1099/13500872-142-1-3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gürtler</span>,  <span class="cit-name-given-names">V.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stanisich</span>,  <span class="cit-name-given-names">V. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1996</span><strong>).</strong> <span class="cit-article-title">New approaches to typing and identification of bacteria using the 16S–23S rDNA spacer region</span>. <abbr class="cit-jnl-abbrev">Microbiology</abbr> <span class="cit-vol">142</span>, <span class="cit-fpage">3</span>–<span class="cit-lpage">16</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/13500872-142-1-3</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>8581168</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=mic&amp;resid=142/1/3"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-19-1" title="View reference  in text"
+                           id="ref-19">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.19">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gutell</span>,  <span class="cit-name-given-names">R. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Larsen</span>,  <span class="cit-name-given-names">N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Woese</span>,  <span class="cit-name-given-names">C. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Lessons from an evolving rRNA: 16S and 23S rRNA structures from a comparative perspective</span>. <abbr class="cit-jnl-abbrev">Microbiol Rev</abbr> <span class="cit-vol">58</span>, <span class="cit-fpage">10</span>–<span class="cit-lpage">26</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>8177168</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=mmbr&amp;resid=58/1/10"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.20"
+                             data-doi="10.1111/j.1095-8312.2007.00864.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hess</span>,  <span class="cit-name-given-names">P. N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">De Moraes Russo</span>,  <span class="cit-name-given-names">C. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">An empirical test of the midpoint rooting method</span>. <abbr class="cit-jnl-abbrev">Biol J Linn Soc Lond</abbr> <span class="cit-vol">92</span>, <span class="cit-fpage">669</span>–<span class="cit-lpage">674</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1095-8312.2007.00864.x</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1095-8312.2007.00864.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=An%20empirical%20test%20of%20the%20midpoint%20rooting%20method&amp;author=P.%20N.%20Hess&amp;author=C.%20A.%20De%20Moraes%20Russo&amp;publication_year=2007&amp;journal=Biol%20J%20Linn%20Soc%20Lond&amp;volume=92&amp;pages=669-674&amp;doi=10.1111%2Fj.1095-8312.2007.00864.x">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.21"
+                             data-doi="10.1016/S0723-2020(83)80048-4">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Huß</span>,  <span class="cit-name-given-names">V. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Festl</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K. H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1983</span><strong>).</strong> <span class="cit-article-title">Studies on the spectrophotometric determination of DNA hybridization from renaturation rates</span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">184</span>–<span class="cit-lpage">192</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0723-2020(83)80048-4</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23194591</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0723-2020(83)80048-4&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23194591&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Studies%20on%20the%20spectrophotometric%20determination%20of%20DNA%20hybridization%20from%20renaturation%20rates&amp;author=V.%20A.%20Hu%C3%9F&amp;author=H.%20Festl&amp;author=K.%20H.%20Schleifer&amp;publication_year=1983&amp;journal=Syst%20Appl%20Microbiol&amp;volume=4&amp;pages=184-192&amp;doi=10.1016%2FS0723-2020%2883%2980048-4&amp;pmid=23194591">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.22"
+                             data-doi="10.1093/nar/gki198">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Katoh</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuma</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Toh</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miyata</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title"><span class="sc">mafft</span> version 5: improvement in accuracy of multiple sequence alignment</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">33</span>, <span class="cit-fpage">511</span>–<span class="cit-lpage">518</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gki198</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15661851</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=33/2/511"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4340.23">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Goodfellow</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lane</span>,  <span class="cit-name-given-names">D. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1991</span><strong>).</strong> <span class="cit-article-title">16S/23S rRNA sequencing</span>. In <span class="cit-source">Nucleic Acid Techniques in Bacterial Systematics</span>, pp. <span class="cit-fpage">115</span>–<span class="cit-lpage">175</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Goodfellow</span>,  <span class="cit-name-given-names">M.</span></span>
+                                 . <span class="cit-publ-loc">Chichester</span>: <span class="cit-publ-name">Wiley</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=16S%2F23S%20rRNA%20sequencing&amp;author=D.%20J.%20Lane&amp;publication_year=1991&amp;citation_inbook_title=Nucleic%20Acid%20Techniques%20in%20Bacterial%20Systematics">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-24-1" title="View reference  in text"
+                           id="ref-24">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.24"
+                             data-doi="10.1093/nar/gkr1044">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Markowitz</span>,  <span class="cit-name-given-names">V. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chen</span>,  <span class="cit-name-given-names">I.-M. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Palaniappan</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chu</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Szeto</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grechkin</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ratner</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jacob</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Huang</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">IMG: the Integrated Microbial Genomes database and comparative analysis system</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">40</span> (<span class="cit-supplement">Database issue</span>), <span class="cit-fpage">D115</span>–<span class="cit-lpage">D122</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkr1044</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22194640</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=40/D1/D115"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-25-1" title="View reference  in text"
+                           id="ref-25">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.25"
+                             data-doi="10.1099/ijs.0.63724-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Heidorn</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pukall</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">Reclassification of <em>Roseobacter gallaeciensis</em> Ruiz-Ponte <em>et al.</em> 1998 as <em>Phaeobacter gallaeciensis</em> gen. nov., comb. nov., description of <em>Phaeobacter inhibens</em> sp. nov., reclassification of <em>Ruegeria algicola</em> (Lafay <em>et al.</em> 1995) Uchino <em>et al.</em> 1999 as <em>Marinovum algicola</em> gen. nov., comb. nov., and emended descriptions of the genera <em>Roseobacter</em>, <em>Ruegeria</em> and <em>Leisingera</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">56</span>, <span class="cit-fpage">1293</span>–<span class="cit-lpage">1304</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.63724-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16738106</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=56/6/1293"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-26-1" title="View reference  in text"
+                           id="ref-26">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.26"
+                             data-doi="10.1007/s00248-006-9165-2">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gram</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grossart</span>,  <span class="cit-name-given-names">H.-P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kessler</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Müller</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wenzel</span>,  <span class="cit-name-given-names">S. C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Bacteria of the <em>Roseobacter</em> clade show potential for secondary metabolite production</span>. <abbr class="cit-jnl-abbrev">Microb Ecol</abbr> <span class="cit-vol">54</span>, <span class="cit-fpage">31</span>–<span class="cit-lpage">42</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s00248-006-9165-2</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17351813</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s00248-006-9165-2&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=17351813&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Bacteria%20of%20the%20Roseobacter%20clade%20show%20potential%20for%20secondary%20metabolite%20production&amp;author=T.%20Martens&amp;author=L.%20Gram&amp;author=H.-P.%20Grossart&amp;author=D.%20Kessler&amp;author=R.%20M%C3%BCller&amp;author=M.%20Simon&amp;author=S.%20C.%20Wenzel&amp;author=T.%20Brinkhoff&amp;publication_year=2007&amp;journal=Microb%20Ecol&amp;volume=54&amp;pages=31-42&amp;doi=10.1007%2Fs00248-006-9165-2&amp;pmid=17351813">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-27-1" title="View reference  in text"
+                           id="ref-27">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.27"
+                             data-doi="10.1089/cmb.2009.0179">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pattengale</span>,  <span class="cit-name-given-names">N. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alipour</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bininda-Emonds</span>,  <span class="cit-name-given-names">O. R. P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moret</span>,  <span class="cit-name-given-names">B. M. E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">How many bootstrap replicates are necessary?</span> <abbr class="cit-jnl-abbrev">J Comput Biol</abbr> <span class="cit-vol">17</span>, <span class="cit-fpage">337</span>–<span class="cit-lpage">354</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1089/cmb.2009.0179</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20377449</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1089/cmb.2009.0179&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20377449&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=How%20many%20bootstrap%20replicates%20are%20necessary%3F&amp;author=N.%20D.%20Pattengale&amp;author=M.%20Alipour&amp;author=O.%20R.%20P.%20Bininda-Emonds&amp;author=B.%20M.%20E.%20Moret&amp;author=A.%20Stamatakis&amp;publication_year=2010&amp;journal=J%20Comput%20Biol&amp;volume=17&amp;pages=337-354&amp;doi=10.1089%2Fcmb.2009.0179&amp;pmid=20377449">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-28-1" title="View reference  in text"
+                           id="ref-28">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.28">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Petersen</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Phylogeny and compatibility: plasmid classification in the genomics era</span>. <abbr class="cit-jnl-abbrev">Arch Microbiol</abbr> <span class="cit-vol">193</span>, <span class="cit-fpage">313</span>–<span class="cit-lpage">321</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21374058</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=21374058&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phylogeny%20and%20compatibility%3A%20plasmid%20classification%20in%20the%20genomics%20era&amp;author=J.%20Petersen&amp;publication_year=2011&amp;journal=Arch%20Microbiol&amp;volume=193&amp;pages=313-321&amp;pmid=21374058">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-29-1" title="View reference  in text"
+                           id="ref-29">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.29"
+                             data-doi="10.1007/s00253-013-4746-8">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Petersen</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Frank</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Göker</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pradella</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title">Extrachromosomal, extraordinary and essential — the plasmids of the Roseobacter clade</span>. <abbr class="cit-jnl-abbrev">Appl Microbiol Biotechnol</abbr> <span class="cit-vol">97</span>, <span class="cit-fpage">2805</span>–<span class="cit-lpage">2815</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s00253-013-4746-8</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20039020</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s00253-013-4746-8&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20039020&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Extrachromosomal%2C%20extraordinary%20and%20essential%20%E2%80%94%20the%20plasmids%20of%20the%20Roseobacter%20clade&amp;author=J.%20Petersen&amp;author=O.%20Frank&amp;author=M.%20G%C3%B6ker&amp;author=S.%20Pradella&amp;publication_year=2013&amp;journal=Appl%20Microbiol%20Biotechnol&amp;volume=97&amp;pages=2805-2815&amp;doi=10.1007%2Fs00253-013-4746-8&amp;pmid=20039020">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-30-1" title="View reference  in text"
+                           id="ref-30">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.30"
+                             data-doi="10.1007/s00203-009-0535-2">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pradella</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Päuker</span>,  <span class="cit-name-given-names">O.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Petersen</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Genome organisation of the marine <em>Roseobacter</em> clade member <em>Marinovum algicola</em></span>. <abbr class="cit-jnl-abbrev">Arch Microbiol</abbr> <span class="cit-vol">192</span>, <span class="cit-fpage">115</span>–<span class="cit-lpage">126</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s00203-009-0535-2</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20039020</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s00203-009-0535-2&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20039020&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genome%20organisation%20of%20the%20marine%20Roseobacter%20clade%20member%20Marinovum%20algicola&amp;author=S.%20Pradella&amp;author=O.%20P%C3%A4uker&amp;author=J.%20Petersen&amp;publication_year=2010&amp;journal=Arch%20Microbiol&amp;volume=192&amp;pages=115-126&amp;doi=10.1007%2Fs00203-009-0535-2&amp;pmid=20039020">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-31-1" title="View reference  in text"
+                           id="ref-31">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.31"
+                             data-doi="10.1099/00207713-46-4-1088">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rainey</span>,  <span class="cit-name-given-names">F. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ward-Rainey</span>,  <span class="cit-name-given-names">N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kroppenstedt</span>,  <span class="cit-name-given-names">R. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1996</span><strong>).</strong> <span class="cit-article-title">The genus <em>Nocardiopsis</em> represents a phylogenetically coherent taxon and a distinct actinomycete lineage: proposal of <em>Nocardiopsaceae</em> fam. nov.</span> <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">46</span>, <span class="cit-fpage">1088</span>–<span class="cit-lpage">1092</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-46-4-1088</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>8863440</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=46/4/1088"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-32-1" title="View reference  in text"
+                           id="ref-32">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.32"
+                             data-doi="10.1128/AEM.71.4.1729-1736.2005">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rao</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Webb</span>,  <span class="cit-name-given-names">J. S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kjelleberg</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Competitive interactions in mixed-species biofilms containing the marine bacterium <em>Pseudoalteromonas tunicata</em></span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">71</span>, <span class="cit-fpage">1729</span>–<span class="cit-lpage">1736</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.71.4.1729-1736.2005</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15811995</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=71/4/1729"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-33-1" title="View reference  in text"
+                           id="ref-33">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4340.33"
+                             data-doi="10.1016/B978-012101285-4/50007-2">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Birren</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Lai</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Römling</span>,  <span class="cit-name-given-names">U.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fislage</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tümmler</span>,  <span class="cit-name-given-names">B.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1996</span><strong>).</strong> <span class="cit-article-title">Macrorestriction mapping and analysis of bacterial genomes</span>. In <span class="cit-source">Nonmammalian Genomic Analysis: A Practical Guide</span>, pp. <span class="cit-fpage">165</span>–<span class="cit-lpage">195</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Birren</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Lai</span>,  <span class="cit-name-given-names">E.</span></span>
+                                 . <span class="cit-publ-loc">San Diego, CA</span>: <span class="cit-publ-name">Academic Press</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/B978-012101285-4/50007-2</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/B978-012101285-4/50007-2&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Macrorestriction%20mapping%20an%20analysis%20of%20bacterial%20genomes&amp;author=U.%20R%C3%B6mling&amp;author=R.%20Fislage&amp;author=B.%20T%C3%BCmmler&amp;publication_year=1996&amp;citation_inbook_title=Nonmammalian%20Genomic%20Analysis%3A%20A%20Practical%20Guide">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-34-1" title="View reference  in text"
+                           id="ref-34">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.34"
+                             data-doi="10.1099/00207713-48-2-537">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ruiz-Ponte</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cilia</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lambert</span>,  <span class="cit-name-given-names">C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nicolas</span>,  <span class="cit-name-given-names">J. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1998</span><strong>).</strong> <span class="cit-article-title"><em>Roseobacter gallaeciensis</em> sp. nov., a new marine bacterium isolated from rearings and collectors of the scallop <em>Pecten maximus</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">48</span>, <span class="cit-fpage">537</span>–<span class="cit-lpage">542</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-48-2-537</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>9731295</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=48/2/537"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-35-1" title="View reference  in text"
+                           id="ref-35">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.35"
+                             data-doi="10.1021/ja207172s">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Seyedsayamdost</span>,  <span class="cit-name-given-names">M. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Carr</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kolter</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Clardy</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011a</span><strong>).</strong> <span class="cit-article-title">Roseobacticides: small molecule modulators of an algal-bacterial symbiosis</span>. <abbr class="cit-jnl-abbrev">J Am Chem Soc</abbr> <span class="cit-vol">133</span>, <span class="cit-fpage">18343</span>–<span class="cit-lpage">18349</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1021/ja207172s</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21928816</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1021/ja207172s&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=21928816&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Roseobacticides%3A%20small%20molecule%20modulators%20of%20an%20algal-bacterial%20symbiosis&amp;author=M.%20R.%20Seyedsayamdost&amp;author=G.%20Carr&amp;author=R.%20Kolter&amp;author=J.%20Clardy&amp;publication_year=2011a&amp;journal=J%20Am%20Chem%20Soc&amp;volume=133&amp;pages=18343-18349&amp;doi=10.1021%2Fja207172s&amp;pmid=21928816">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-36-1" title="View reference  in text"
+                           id="ref-36">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.36"
+                             data-doi="10.1038/nchem.1002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Seyedsayamdost</span>,  <span class="cit-name-given-names">M. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Case</span>,  <span class="cit-name-given-names">R. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kolter</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Clardy</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011b</span><strong>).</strong> <span class="cit-article-title">The Jekyll-and-Hyde chemistry of <em>Phaeobacter gallaeciensis</em></span>. <abbr class="cit-jnl-abbrev">Nat Chem</abbr> <span class="cit-vol">3</span>, <span class="cit-fpage">331</span>–<span class="cit-lpage">335</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/nchem.1002</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21430694</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/nchem.1002&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=21430694&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20Jekyll-and-Hyde%20chemistry%20of%20Phaeobacter%20gallaeciensis&amp;author=M.%20R.%20Seyedsayamdost&amp;author=R.%20J.%20Case&amp;author=R.%20Kolter&amp;author=J.%20Clardy&amp;publication_year=2011b&amp;journal=Nat%20Chem&amp;volume=3&amp;pages=331-335&amp;doi=10.1038%2Fnchem.1002&amp;pmid=21430694">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-37-1" title="View reference  in text"
+                           id="ref-37">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4340.37">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Gerhardt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">W. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smibert</span>,  <span class="cit-name-given-names">R. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1981</span><strong>).</strong> <span class="cit-article-title">Phenotypic characterization</span>. In <span class="cit-source">Manual of Methods for General Bacteriology</span>, pp. <span class="cit-fpage">607</span>–<span class="cit-lpage">654</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Gerhardt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">W. A.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span>
+                                 . <span class="cit-publ-loc">Washington, DC</span>: <span class="cit-publ-name">American Society for Microbiology</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phenotypic%20characterization&amp;author=R.%20M.%20Smibert&amp;author=N.%20R.%20Krieg&amp;publication_year=1981&amp;citation_inbook_title=Manual%20of%20Methods%20for%20General%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-38-1" title="View reference  in text"
+                           id="ref-38">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.38"
+                             data-doi="10.1080/10635150802429642">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hoover</span>,  <span class="cit-name-given-names">P.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rougemont</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">A rapid bootstrap algorithm for the RAxML Web servers</span>. <abbr class="cit-jnl-abbrev">Syst Biol</abbr> <span class="cit-vol">57</span>, <span class="cit-fpage">758</span>–<span class="cit-lpage">771</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1080/10635150802429642</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18853362</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=sysbio&amp;resid=57/5/758"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-39-1" title="View reference  in text"
+                           id="ref-39">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4340.39">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Swofford</span>,  <span class="cit-name-given-names">D. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title"><span class="sc">paup</span>*: Phylogenetic analysis using parsimony (and other methods), version 4.0b10</span>. <span class="cit-publ-loc">Sunderland</span>: <span class="cit-publ-name">Sinauer Associates</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=paup%2A%3A%20Phylogenetic%20analysis%20using%20parsimony%20%28and%20other%20methods%29%2C%20version%204.0b10&amp;author=D.%20L.%20Swofford&amp;publication_year=2002">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-40-1" title="View reference  in text"
+                           id="ref-40">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.40"
+                             data-doi="10.1038/ismej.2012.62">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thole</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kalhoefer</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Voget</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berger</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Engelhardt</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Liesegang</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wollherr</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kjelleberg</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Daniel</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title"><em>Phaeobacter gallaeciensis</em> genomes from globally opposite locations reveal high similarity of adaptation to surface life</span>. <abbr class="cit-jnl-abbrev">ISME J</abbr> <span class="cit-vol">6</span>, <span class="cit-fpage">2229</span>–<span class="cit-lpage">2244</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/ismej.2012.62</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22717884</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/ismej.2012.62&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=22717884&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phaeobacter%20gallaeciensis%20genomes%20from%20globally%20opposite%20locations%20reveal%20high%20similarity%20of%20adaptation%20to%20surface%20life&amp;author=S.%20Thole&amp;author=D.%20Kalhoefer&amp;author=S.%20Voget&amp;author=M.%20Berger&amp;author=T.%20Engelhardt&amp;author=H.%20Liesegang&amp;author=A.%20Wollherr&amp;author=S.%20Kjelleberg&amp;author=R.%20Daniel&amp;publication_year=2012&amp;journal=ISME%20J&amp;volume=6&amp;pages=2229-2244&amp;doi=10.1038%2Fismej.2012.62&amp;pmid=22717884">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-41-1" title="View reference  in text"
+                           id="ref-41">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.41"
+                             data-doi="10.1099/ijs.0.65324-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tóth</span>,  <span class="cit-name-given-names">E. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schumann</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Borsodi</span>,  <span class="cit-name-given-names">A. K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kéki</span>,  <span class="cit-name-given-names">Z.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kovács</span>,  <span class="cit-name-given-names">A. L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Márialigeti</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><em>Wohlfahrtiimonas chitiniclastica</em> gen. nov., sp. nov., a new gammaproteobacterium isolated from <em>Wohlfahrtia magnifica</em> (Diptera: Sarcophagidae)</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">58</span>, <span class="cit-fpage">976</span>–<span class="cit-lpage">981</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.65324-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18398205</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=58/4/976"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-42-1" title="View reference  in text"
+                           id="ref-42">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.42"
+                             data-doi="10.1371/journal.pone.0034846">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Vaas</span>,  <span class="cit-name-given-names">L. A. I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sikorski</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Michael</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Göker</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Klenk</span>,  <span class="cit-name-given-names">H.-P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Visualization and curve-parameter estimation strategies for efficient exploration of phenotype microarray kinetics</span>. <abbr class="cit-jnl-abbrev">PLoS ONE</abbr> <span class="cit-vol">7</span>, <span class="cit-fpage">e34846</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1371/journal.pone.0034846</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22536335</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1371/journal.pone.0034846&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=22536335&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Visualization%20and%20curve-parameter%20estimation%20strategies%20for%20efficient%20exploration%20of%20phenotype%20microarray%20kinetics&amp;author=L.%20A.%20I.%20Vaas&amp;author=J.%20Sikorski&amp;author=V.%20Michael&amp;author=M.%20G%C3%B6ker&amp;author=H.-P.%20Klenk&amp;publication_year=2012&amp;journal=PLoS%20ONE&amp;volume=7&amp;pages=e34846&amp;doi=10.1371%2Fjournal.pone.0034846&amp;pmid=22536335">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-43-1" title="View reference  in text"
+                           id="ref-43">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.43"
+                             data-doi="10.1099/00207713-37-4-463">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wayne</span>,  <span class="cit-name-given-names">L. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Colwell</span>,  <span class="cit-name-given-names">R. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grimont</span>,  <span class="cit-name-given-names">P. A. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kandler</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krichevsky</span>,  <span class="cit-name-given-names">M. I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">L. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">W. E. C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">1987</span><strong>).</strong> <span class="cit-article-title">Report of the ad hoc committee on reconciliation of approaches to bacterial systematics</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">37</span>, <span class="cit-fpage">463</span>–<span class="cit-lpage">464</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-37-4-463</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=37/4/463"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-44-1" title="View reference  in text"
+                           id="ref-44">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.44"
+                             data-doi="10.1002/pmic.200900120">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zech</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thole</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schreiber</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kalhöfer</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Voget</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schomburg</span>,  <span class="cit-name-given-names">D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rabus</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Growth phase-dependent global protein and metabolite profiles of <em>Phaeobacter gallaeciensis</em> strain DSM 17395, a member of the marine <em>Roseobacter</em>-clade</span>. <abbr class="cit-jnl-abbrev">Proteomics</abbr> <span class="cit-vol">9</span>, <span class="cit-fpage">3677</span>–<span class="cit-lpage">3697</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1002/pmic.200900120</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19639587</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1002/pmic.200900120&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=19639587&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Growth%20phase-dependent%20global%20protein%20and%20metabolite%20profiles%20of%20Phaeobacter%20gallaeciensis%20strain%20DSM%2017395%2C%20a%20member%20of%20the%20marine%20Roseobacter-clade&amp;author=H.%20Zech&amp;author=S.%20Thole&amp;author=K.%20Schreiber&amp;author=D.%20Kalh%C3%B6fer&amp;author=S.%20Voget&amp;author=T.%20Brinkhoff&amp;author=M.%20Simon&amp;author=D.%20Schomburg&amp;author=R.%20Rabus&amp;publication_year=2009&amp;journal=Proteomics&amp;volume=9&amp;pages=3677-3697&amp;doi=10.1002%2Fpmic.200900120&amp;pmid=19639587">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-45-1" title="View reference  in text"
+                           id="ref-45">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.45"
+                             data-doi="10.1093/nar/gkg595">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zuker</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title">Mfold web server for nucleic acid folding and hybridization prediction</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">31</span>, <span class="cit-fpage">3406</span>–<span class="cit-lpage">3415</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkg595</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>12824337</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=31/13/3406"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4330.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4350.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="free-article">
+               <span class="free-article-note">
+                  FREE ARTICLE
+                  </span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.053900-0" class="slug-doi">10.1099/ijs.0.053900-0
+                                 </span>
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4340-4349
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/63/Pt_11/4340.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4340.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_11/4340/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_11/4340">PPT Slides of All Figures</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings last-child">
+                              <li><a class="tocsection-search"
+                                    href="/search?tocsectionid=Taxonomic+Note&amp;sortspec=date&amp;submit=Submit">Taxonomic Note</a></li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4340&amp;current-view-path=/content/63/Pt_11/4340.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4340&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4340.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4340&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4340.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.053900-0&amp;citation=Buddruhs%20et%20al.%2063%20%28Pt%2011%29:%204340&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4340&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=24187021&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4340">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4340.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4340#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4340" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4340&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4340.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ABuddruhs%20author%3AN.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Buddruhs, N.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ABrinkhoff%20author%3AT.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Brinkhoff, T.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4340.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=24187021&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Buddruhs%20N&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Buddruhs, N.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Brinkhoff%20T&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Brinkhoff, T.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/24187021"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4340.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4340#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#sec-1">Introduction</a></li>
+                        <li><a href="#sec-2">Methods</a></li>
+                        <li><a href="#sec-11">Results</a></li>
+                        <li><a href="#sec-19">Discussion</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.pdf
new file mode 100644
index 00000000..38beffcf
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/results.json b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/results.json
new file mode 100644
index 00000000..c0b05d37
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/results.json
@@ -0,0 +1,101 @@
+{
+  "publisher": {
+    "value": [
+      "Society for General Microbiology"
+    ]
+  },
+  "journal": {
+    "value": [
+      "International Journal of Systematic and Evolutionary\n                Microbiology"
+    ]
+  },
+  "title": {
+    "value": [
+      "Molecular and phenotypic analyses reveal the non-identity of the Phaeobacter gallaeciensis type strain deposits CIP 105210T and DSM 17395"
+    ]
+  },
+  "authors": {
+    "value": [
+      "Nora Buddruhs",
+      "Silke Pradella",
+      "Markus Göker",
+      "Orsola Päuker",
+      "Rüdiger Pukall",
+      "Cathrin Spröer",
+      "Peter Schumann",
+      "Jörn Petersen",
+      "Thorsten Brinkhoff"
+    ]
+  },
+  "date": {
+    "value": [
+      "11/01/2013"
+    ]
+  },
+  "doi": {
+    "value": [
+      "10.1099/ijs.0.053900-0"
+    ]
+  },
+  "volume": {
+    "value": [
+      "63"
+    ]
+  },
+  "issue": {
+    "value": [
+      "Pt 11"
+    ]
+  },
+  "firstpage": {
+    "value": [
+      "4340"
+    ]
+  },
+  "abstract": {
+    "value": [
+      "\n                  \n                      Next Section\n                  Abstract\n                  \n                  The marine genus Phaeobacter currently comprises six species, some of which were intensively studied mainly due to their ability to produce secondary\n                     metabolites. The type strain of the type species, Phaeobacter gallaeciensis BS107T, has been deposited at several public culture collections worldwide. Based on differences in plasmid profiles, we detected\n                     that the alleged P. gallaeciensis type strains deposited at the Collection Institute Pasteur (CIP; Paris, France) as CIP 105210 and at the German Collection\n                     of Microorganisms and Cell Cultures (DSMZ; Braunschweig, Germany) as DSM 17395 are not identical. To determine the identity\n                     of these strains, we conducted DNA–DNA hybridization, matrix-assisted laser desorption/ionization time-of-flight mass spectrometry\n                     (MALDI-TOF), 16S rRNA gene and internal transcribed spacer (ITS) sequence analyses, as well as physiological experiments.\n                     Based on the detailed 16S rRNA gene reanalysis we showed that strain CIP 105210 most likely corresponds to the original P. gallaeciensis type strain BS107T. In contrast, the Phaeobacter strain DSM 17395 exhibits a much closer affiliation to Phaeobacter inhibens DSM 16374T ( = T5T) and should thus be allocated to this species. The detection of the dissimilarity of strains CIP 105210T and DSM 17395 will influence future comparative studies within the genus Phaeobacter.\n                  \n                  \n               "
+    ]
+  },
+  "fulltext_html": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4340.full"
+    ]
+  },
+  "fulltext_pdf": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4340.full.pdf"
+    ]
+  },
+  "supplementary_material": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4340/suppl/DC1"
+    ]
+  },
+  "figure": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4340/F1.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4340/F2.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4340/F3.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4340/F4.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4340/F5.small.gif"
+    ]
+  },
+  "figure_caption": {
+    "value": [
+      "Fig. 1.  \n                           \n                           (a) PFGE plasmid profiles of the Phaeobacter strains CIP 105210T, DSM 17395, DSM 24588 and DSM 16374T based on uncut high-molecular-mass genomic DNA. (b) Calculated plasmid sizes as mean values taken from at least two different\n                              gel runs. The PFGE conditions were: 1 % (w/v) agarose gel with pulse times of 1 to 48 s for 24 h at 200 V (6 V cm−1). Chr, chromosomal DNA; λ, lambda phage concatemers as molecular-mass PFGE markers (New England Biolabs); li, linear. (*), The two largest plasmids (linearized forms) of Phaeobacter strains CIP 105210T and DSM 17395 migrated about the same distance in the gel and thus seemed to have an identical size. In contrast, both bands\n                              could be clearly distinguished by their size in other PFGE runs (data not shown) using different DNA sample preparations.\n                              DNA mobility is largely influenced by the DNA concentration of the sample. The observed discrepancy can thus be explained\n                              by the relatively high DNA concentration in CIP 105210T (compared to DSM 17395T), which retards band migration (Römling et al., 1996). (†) (‡), The PFGE-based plasmid size estimations of 75 and 63 kb of DSM 17395 correspond to the plasmid sizes of 78 and 65 kb, respectively,\n                              determined by genome sequencing (Thole et al., 2012; NC_018287.1, NC_018288.1). (§), The 36 kb plasmid of P. gallaeciensis CIP 105210T had a very low fluorescence intensity and is thus hardly visible on the gel image. ++, The 77 kb band of strain CIP 105210T showed increased fluorescence intensity and presumably represents a double band (plasmid duplet).\n                           \n                           \n                           \n                        ",
+      "Fig. 2.  \n                              \n                              Midpoint-rooted MP phylogeny inferred from 16S rRNA gene sequences of Phaeobacter strains closely related to P. inhibens and P. gallaeciensis. Branches are scaled in terms of the minimum number of substitutions (using deltran optimization; Stamatakis et al., 2008). Numbers above branches are support values from MP (left) and ML (right) bootstrapping. Original designation of strains\n                                 that are deposited at culture collections is indicated in parentheses; square brackets give the respective accession number.\n                              \n                              \n                              \n                           ",
+      "Fig. 3.  \n                              \n                              Secondary structure of the 16S rRNA variable region V4 of P. gallaeciensis CIP 105210T (a) and P. inhibens DSM 17395 (b) demonstrating transition of bases 614 and 626 (E. coli numbering; bases 529 and 541 according to the CIP 105210T numbering). RNA folding was simulated using the Mfold web server for nucleic acid folding and hybridization prediction (Zuker, 2003; http://mfold.rna.albany.edu/?q=mfold/RNA-Folding-Form).\n                              \n                              \n                              \n                           ",
+      "Fig. 4.  \n                              \n                              Score-oriented dendrogram showing the similarity of MALDI-TOF mass spectra from cell extracts of selected Phaeobacter strains. The dendrogram was generated by the BioTyper software (version 3.0; Bruker Daltonics).\n                              \n                              \n                              \n                           ",
+      "Fig. 5.  \n                              \n                              Midpoint-rooted ML phylogeny inferred from ITS sequences of Phaeobacter strains closely related to P. inhibens and P. gallaeciensis. Branches are scaled in terms of the expected number of substitutions per site. Numbers above branches are support values\n                                 from ML (left) and MP (right) bootstrapping. Original designation of strains that are deposited at culture collections is\n                                 indicated in parentheses; square brackets give the respective accession number.\n                              \n                              \n                              \n                           "
+    ]
+  },
+  "license": {
+    "value": []
+  },
+  "copyright": {
+    "value": [
+      "Copyright ©\n                     \t\t2015 International Union of Microbiological Societies\n                     \t\n                  "
+    ]
+  }
+}
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/DC1 b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/DC1
new file mode 100644
index 00000000..b1d0469d
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/DC1
@@ -0,0 +1,353 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Supplementary material </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/ijs.0.054957-0/DC1" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-data-supp.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-data-supp.css" /><script type="text/javascript" id="session-d7760603e1">var callbackToken='5633EA7ACB0BFB1';</script><script type="text/javascript" id="session-d7760603e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-data-supp.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-data-supp">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4350%2Fsuppl%2FDC1">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <h1 class="data-supp-article-title">Reclassification of <span class="named-content species" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacterium stercoris"
+                     href="doi:10.1601/nm.20247"><em>Bifidobacterium stercoris</em></a></span> Kim <em>et al.</em> 2010 as a later heterotypic synonym of <span class="named-content species" id="named-content-2"><a class="namesforlife" rel="namesforlife-name"
+                     title="Bifidobacterium adolescentis"
+                     href="doi:10.1601/nm.7679"><em>Bifidobacterium adolescentis</em></a></span></h1>
+            <div><span class="highwire-journal-article-marker-start"></span><div class="auto-clean"><span style="font-family: Verdana,Arial,Helvetica,sans-serif;  font-size: 83.33%">
+                     
+                     
+                     <h2>Supplementary material</h2>
+                     
+                     <p><strong>Files in this Data Supplement:</strong></p>
+                     
+                     <ul>
+                        <li><a href="/content/suppl/2013/11/05/ijs.0.054957-0.DC1/ijs054957.pdf">Supplementary material</a> 
+                           		
+                           
+                        </li>
+                     </ul>
+                     </span>
+                  
+                  
+               </div><span class="highwire-journal-article-marker-end"></span></div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              	
+                              
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.054957-0" class="slug-doi">10.1099/ijs.0.054957-0</span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date">
+                                    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4350-4353
+                                    </span>
+                                 </cite>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/63/Pt_11/4350.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><a href="/content/63/Pt_11/4350.full" rel="view-full-text">Full Text</a><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4350.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a></li>
+                        <li><span class="variant-indicator">» <span>Supplementary material</span></span></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/F1.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/F1.small.gif
new file mode 100644
index 00000000..a50ecad2
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/F1.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/fulltext.html b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/fulltext.html
new file mode 100644
index 00000000..fb6278da
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/fulltext.html
@@ -0,0 +1,1078 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Reclassification of Bifidobacterium stercoris Kim et al. 2010 as a later heterotypic synonym of Bifidobacterium adolescentis
+         
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4350" />
+      <meta content="/ijs/63/Pt_11/4350.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Reclassification of Bifidobacterium stercoris Kim et al. 2010 as a later heterotypic synonym of Bifidobacterium adolescentis"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.054957-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="J. Killer" name="DC.Contributor" />
+      <meta content="I. Sedláček" name="DC.Contributor" />
+      <meta content="V. Rada" name="DC.Contributor" />
+      <meta content="J. Havlík" name="DC.Contributor" />
+      <meta content="J. Kopečný" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="J. Killer" />
+      <meta name="citation_author_institution"
+            content="1Institute of Animal Physiology and Genetics v.v.i., Academy of Sciences of the Czech Republic, Vídeňská 1083, Prague 4 – Krč, 142 20, Czech Republic" />
+      <meta name="citation_author_institution"
+            content="2Czech University of Life Sciences, Faculty of Agrobiology, Food and Natural Resources, Department of Microbiology, Nutrition and Dietetics, Kamýcká 129, Prague 6 – Suchdol, 165 21, Czech Republic" />
+      <meta name="citation_author" content="I. Sedláček" />
+      <meta name="citation_author_institution"
+            content="3Czech Collection of Microorganisms, Department of Experimental Biology, Faculty of Science, Masaryk University, Tvrdého 14, 60200 Brno, Czech Republic" />
+      <meta name="citation_author" content="V. Rada" />
+      <meta name="citation_author_institution"
+            content="2Czech University of Life Sciences, Faculty of Agrobiology, Food and Natural Resources, Department of Microbiology, Nutrition and Dietetics, Kamýcká 129, Prague 6 – Suchdol, 165 21, Czech Republic" />
+      <meta name="citation_author" content="J. Havlík" />
+      <meta name="citation_author_institution"
+            content="2Czech University of Life Sciences, Faculty of Agrobiology, Food and Natural Resources, Department of Microbiology, Nutrition and Dietetics, Kamýcká 129, Prague 6 – Suchdol, 165 21, Czech Republic" />
+      <meta name="citation_author" content="J. Kopečný" />
+      <meta name="citation_author_institution"
+            content="1Institute of Animal Physiology and Genetics v.v.i., Academy of Sciences of the Czech Republic, Vídeňská 1083, Prague 4 – Krč, 142 20, Czech Republic" />
+      <meta content="Reclassification of Bifidobacterium stercoris Kim et al. 2010 as a later heterotypic synonym of Bifidobacterium adolescentis"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4350" name="citation_firstpage" />
+      <meta content="4353" name="citation_lastpage" />
+      <meta content="63/Pt_11/4350" name="citation_id" />
+      <meta content="63/Pt 11/4350" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4350" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.054957-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4350.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4350.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4350.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4350"
+            name="citation_public_url" />
+      <meta content="24187022" name="citation_pmid" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Taxonomic Note" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4340.short" rel="prev" />
+      <link href="/content/63/Pt_11/4354.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d7759557e1">var callbackToken='5633EA7ACB0BFB1';</script><script type="text/javascript" id="session-d7759557e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4350.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline">Reclassification of <span class="named-content species" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacterium stercoris"
+                        href="doi:10.1601/nm.20247"><em>Bifidobacterium stercoris</em></a></span> Kim <em>et al.</em> 2010 as a later heterotypic synonym of <span class="named-content species" id="named-content-2"><a class="namesforlife" rel="namesforlife-name"
+                        title="Bifidobacterium adolescentis"
+                        href="doi:10.1601/nm.7679"><em>Bifidobacterium adolescentis</em></a></span></h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=J.+Killer&amp;sortspec=date&amp;submit=Submit">J. Killer</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=I.+Sedl%C3%A1%C4%8Dek&amp;sortspec=date&amp;submit=Submit">I. Sedláček</a></span><a id="xref-aff-3-1" class="xref-aff" href="#aff-3"><sup>3</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search" href="/search?author1=V.+Rada&amp;sortspec=date&amp;submit=Submit">V. Rada</a></span><a id="xref-aff-2-2" class="xref-aff" href="#aff-2"><sup>2</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-4" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=J.+Havl%C3%ADk&amp;sortspec=date&amp;submit=Submit">J. Havlík</a></span><a id="xref-aff-2-3" class="xref-aff" href="#aff-2"><sup>2</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-5"><span class="name"><a class="name-search"
+                              href="/search?author1=J.+Kope%C4%8Dn%C3%BD&amp;sortspec=date&amp;submit=Submit">J. Kopečný</a></span><a id="xref-aff-1-2" class="xref-aff" href="#aff-1"><sup>1</sup></a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>Institute of Animal Physiology and Genetics v.v.i., Academy of Sciences of the Czech Republic, Vídeňská 1083, Prague 4 – Krč,
+                           142 20, Czech Republic
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>Czech University of Life Sciences, Faculty of Agrobiology, Food and Natural Resources, Department of Microbiology, Nutrition
+                           and Dietetics, Kamýcká 129, Prague 6 – Suchdol, 165 21, Czech Republic
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-3" name="aff-3"></a><address><sup>3</sup>Czech Collection of Microorganisms, Department of Experimental Biology, Faculty of Science, Masaryk University, Tvrdého 14,
+                           60200 Brno, Czech Republic
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> J. Killer <span class="em-link"><span class="em-addr">Killer.Jiri{at}seznam.cz</span></span> <em>or</em>  <span class="em-link"><span class="em-addr">killer{at}iapg.cas.cz</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-3">The taxonomic position of <span class="named-content species" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacterium stercoris"
+                           href="doi:10.1601/nm.20247"><em>Bifidobacterium stercoris</em></a></span> Eg1<sup>T</sup> ( = JCM 15918<sup>T</sup>) based on comparative 16S rRNA gene and <em>hsp60</em> sequence analyses was found to be controversial, as the strain showed high similarity to the type strain of <span class="named-content species" id="named-content-9"><a class="namesforlife" rel="namesforlife-name"
+                           title="Bifidobacterium adolescentis"
+                           href="doi:10.1601/nm.7679"><em>Bifidobacterium adolescentis</em></a></span>, CCUG 18363<sup>T</sup>. Therefore, the relationship between the two species was investigated by a taxonomic study that included, in addition to
+                     re-evaluation of the 16S rRNA gene sequence, determination of DNA–DNA binding and multilocus sequence analysis (MLSA) of housekeeping
+                     genes encoding the DNA-directed RNA polymerase B subunit (<em>rpoC</em>), putative xylulose-5-phosphate/fructose-6-phosphate phosphoketolase (<em>xfp</em>), elongation factor EF-G (<em>fusA</em>), 50S ribosomal protein L2 (<em>rplB</em>) and DNA gyrase B subunit (<em>gyrB</em>). Comparative 16S rRNA gene sequence analysis showed relatively high similarity (98.9 %) between <span class="named-content species" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                           href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                           href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> ATCC 15703<sup>T</sup>. MLSA revealed close relatedness between <span class="named-content species" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                           href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                           href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup>, with 99.3–100 % similarity between the <em>rpoC</em>, <em>xfp</em>, <em>fusA</em>, <em>rplB</em> and <em>gyrB</em> gene sequences. In addition, relatively high <em>dnaJ1</em> gene sequence similarity of 97.7 % was found between the strains. Similar phenotypes and a high DNA–DNA binding value (78.9 %)
+                     confirmed that <span class="named-content species" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                           href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> and <span class="named-content species" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                           href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> are synonymous. Based on these results, it is proposed that the species <span class="named-content species" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacterium stercoris"
+                           href="doi:10.1601/nm.20247"><em>Bifidobacterium stercoris</em></a></span> Kim <em>et al.</em> 2010 should be reclassified as a later heterotypic synonym of <span class="named-content species" id="named-content-17"><a class="namesforlife" rel="namesforlife-name"
+                           title="Bifidobacterium adolescentis"
+                           href="doi:10.1601/nm.7679"><em>Bifidobacterium adolescentis</em></a></span> Reuter 1963 (Approved Lists 1980).
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-other" id="fn-1">
+                        <p id="p-1">The GenBank/EMBL/DDBJ accession numbers for the partial <em>rpoC</em>, <em>xfp</em>, <em>fusA</em>, <em>rplB</em>, <em>gyrB</em> and <em>dnaJ1</em> gene sequences of <span class="named-content species" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                                 href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                                 href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup> are respectively JQ363659 and JQ363660 (<em>rpoC</em>), JQ363666 and JQ363667 (<em>xfp</em>), JQ363628 and JQ363629 (<em>fusA</em>), JQ363655 and JQ363656 (<em>rplB</em>), JQ363638 and JQ363639 (<em>gyrB</em>) and JQ363622 and JQ363623 (<em>dnaJ1</em>). The GenBank/EMBL/DDBJ accession number for the revised partial 16S rRNA gene sequence of <span class="named-content species" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                                 href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> is KF147852.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-2">
+                        <p id="p-2">Two supplementary figures and a supplementary table are available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <p id="p-4"><span class="named-content species" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacterium stercoris"
+                        href="doi:10.1601/nm.20247"><em>Bifidobacterium stercoris</em></a></span> was described by <a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Kim <em>et al.</em> (2010)</a> for one strain isolated from faeces of a Korean adult mainly on the basis of phenotypic characteristics and DNA–DNA reassociation
+                  results. All results confirmed that the new bacterial isolate belonged to the genus <span class="named-content genus" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacterium"
+                        href="doi:10.1601/nm.7677"><em>Bifidobacterium</em></a></span>. However, the authors stated, based on phylogenetic analyses, that the new isolate was closely related to <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name"
+                        title="Bifidobacterium adolescentis"
+                        href="doi:10.1601/nm.7679"><em>Bifidobacterium adolescentis</em></a></span>. Moreover, the habitats from which these bacteria were isolated suggest the necessity of clarifying their taxonomic relationship
+                  with additional genetic approaches. The affinity of <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and the type strain of <span class="named-content species" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span>, CCUG 18363<sup>T</sup>, was therefore evaluated in this study by a polyphasic taxonomic approach.
+               </p>
+               <p id="p-5">Both strains were grown at 37 °C in TPY anaerobic broth (<a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Scardovi, 1986</a>). Chromosomal DNA was extracted using the DNeasy Blood &amp; Tissue kit (Qiagen) according to the manufacturer’s protocol. The
+                  16S rRNA gene sequence of <span class="named-content species" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> was resequenced by the method of <a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Killer <em>et al.</em> (2011)</a>. A comparative analysis based on the revised 16S rRNA gene sequence of <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> (GenBank accession no. <a href="/external-ref?link_type=GEN&amp;access_num=KF147852">KF147852</a>) and the 16S rRNA gene sequence of <span class="named-content species" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> ATCC 15703<sup>T</sup> (NR_074802) revealed relatively high similarity of 98.9 % (over a total of 1520 bp). This relatively high similarity is of
+                  limited value for the resolution of bacterial species (<a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Tindall <em>et al.</em>, 2010</a>). Protein-coding housekeeping gene sequences have recently been recommended for the determination of genomic relatedness
+                  at the bacterial species level because of their ability to provide higher taxonomic resolution compared with 16S rRNA gene
+                  sequence analysis (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Ventura <em>et al.</em>, 2006</a>). Therefore, comparative sequence analyses were done between <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup> based on <em>rpoC</em>, <em>xfp</em>, <em>fusA</em>, <em>rplB</em>, <em>gyrB</em> and <em>dnaJ1</em> gene sequences. Multilocus sequence analysis (MLSA) has been proposed as an alternative to DNA hybridization, enabling inter-
+                  and intra-specific genomic relatedness to be established. In addition, the authors who described the species <span class="named-content species" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> reported high <em>hsp60</em> gene sequence similarity (99.4 %) between <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> Eg1<sup>T</sup> and <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> JCM 1275<sup>T</sup> (<a id="xref-ref-9-2" class="xref-bibr" href="#ref-9">Kim <em>et al.</em>, 2010</a>). Primers and PCR conditions for amplification of partial <em>fusA</em>, <em>rplB</em> and <em>gyrB</em> gene sequences were obtained from <a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Delétoile <em>et al.</em> (2010)</a>. Partial sequences of <em>rpoC</em> and <em>dnaJ1</em> genes were amplified under conditions described by <a id="xref-ref-14-2" class="xref-bibr" href="#ref-14">Ventura <em>et al.</em> (2006)</a>. The gene encoding the xylulose-5-phosphate/fructose-6-phosphate phosphoketolase (<em>xfp</em>) was proposed as a suitable phylogenetic marker for bifidobacteria by <a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Berthoud <em>et al.</em> (2005)</a>. Amplified DNA fragments were subsequently checked by electrophoresis on 1.5 % PCR agarose gel (Top-Bio), purified using
+                  a PCR purification kit (Qiagen) and sequenced by using an automatic ABI PRISM 3130xl Genetic Analyzer (Applied Biosystems).
+                  The values of sequence similarity based on <em>rpoC</em>, <em>xfp</em>, <em>fusA</em>, <em>rplB</em>, <em>gyrB</em> and <em>dnaJ1</em> gene sequences using the jPHYDIT program (<a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Jeon <em>et al.</em>, 2005</a>) were 99.3, 99.6, 99.6, 99.8, 100.0 and 97.7 %, respectively. Multilocus sequence typing based on partial <em>fusA</em>, <em>rplB</em> and <em>gyrB</em> gene sequences revealed ≥99 % similarity between different strains within bifidobacterial species (<a id="xref-ref-4-2" class="xref-bibr" href="#ref-4">Delétoile <em>et al.</em>, 2010</a>). <a id="xref-ref-14-3" class="xref-bibr" href="#ref-14">Ventura <em>et al.</em> (2006)</a> determined means of 88.25 and 65.09 % sequence similarity for the <em>rpoC</em> and <em>dnaJ1</em> genes between 31 bifidobacterial strains.
+               </p>
+               <p id="p-6">The concatenation of protein-encoding housekeeping genes has been shown to be extremely useful in order to infer bacterial
+                  phylogeny (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Teichmann &amp; Mitchison, 1999</a>). Therefore, phylogenetic analysis to reveal the relationship between <span class="named-content species" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup> was based on concatenated sequences of the <em>hsp60</em>, <em>xfp</em> and <em>dnaJ1</em> genes. These housekeeping genes were chosen because their sequences are available for a wider range of bifidobacterial species.
+                  Phylogenetic trees were reconstructed by <span class="sc">mega</span> version 5.05 and the Gblocks program using the maximum-likelihood algorithm as described previously (<a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Killer <em>et al.</em>, 2013</a>). The topology of the phylogenetic tree reconstructed on the basis of concatenated <em>hsp60</em> and <em>xfp</em> gene sequences revealed a very close relationship between the two tested strains. The phylogenetic branch length between
+                  the two strains was shorter than the length of the phylogenetic branches between distinctive subspecies of bifidobacteria
+                  such as <span class="named-content subspecies" id="named-content-33"><a class="namesforlife" rel="namesforlife-name"
+                        title="Bifidobacterium animalis subsp. animalis"
+                        href="doi:10.1601/nm.7681"><em>Bifidobacterium animalis</em> subsp. <em>animalis</em></a></span> and <span class="named-content subspecies" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="B. animalis subsp. lactis"
+                        href="doi:10.1601/nm.8511"><em>B. animalis</em> subsp. <em>lactis</em></a></span> and <span class="named-content subspecies" id="named-content-35"><a class="namesforlife" rel="namesforlife-name"
+                        title="Bifidobacterium pseudolongum subsp. pseudolongum"
+                        href="doi:10.1601/nm.7703"><em>Bifidobacterium pseudolongum</em> subsp. <em>pseudolongum</em></a></span> and <span class="named-content subspecies" id="named-content-36"><a class="namesforlife" rel="namesforlife-name"
+                        title="B. pseudolongum subsp. globosum"
+                        href="doi:10.1601/nm.7704"><em>B. pseudolongum</em> subsp. <em>globosum</em></a></span> (<a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1</a>). Very similar results were obtained using concatenated <em>hsp60</em>, <em>xfp</em> and <em>dnaJ1</em> gene sequences (Fig. S1, available in IJSEM Online). The GenBank accession numbers for the partial <em>hsp60</em>, <em>xfp</em> and <em>dnaJ1</em> gene sequences of type strains of bifidobacterial species used and generated in this study are listed in Table S1. A close
+                  relationship of the two bacterial strains was also confirmed by the phylogenetic tree of the family <span class="named-content family" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacteriaceae"
+                        href="doi:10.1601/nm.7676"><em>Bifidobacteriaceae</em></a></span> reconstructed on the basis of sequences of the 16S rRNA gene (Fig. S2).
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4350/F1.expansion.html"><img alt="Fig. 1. " src="4350/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4350/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4350/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4350/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-7" class="first-child">Phylogenetic tree of the family <span class="named-content family" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacteriaceae"
+                              href="doi:10.1601/nm.7676"><em>Bifidobacteriaceae</em></a></span> showing the very close relationship of <span class="named-content species" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                              href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup> and <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                              href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup>, reconstructed by the maximum-likelihood method based on concatenated partial sequences of the <em>hsp60</em> (539 nt) and <em>xfp</em> (418 nt) genes using <span class="sc">mega</span> version 5.05 software after removing hypervariable positions by using the program Gblocks. Sequence data were aligned using
+                        the <span class="sc">clustal</span> <span class="sc">w</span> algorithm. The Tamura–Nei model was used for reconstruction of the phylogenetic tree. Bootstrap values, expressed as percentages
+                        of 1000 datasets, are given at nodes. GenBank accession numbers of partial gene sequences derived from type strains are presented
+                        in Table S1. The tree was rooted by <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="Gardnerella vaginalis"
+                              href="doi:10.1601/nm.7721"><em>Gardnerella vaginalis</em></a></span> ATCC 14018<sup>T</sup>. Bar, 0.04 substitutions per nucleotide position.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-8">The determination of DNA–DNA relatedness is the mandatory reference method for determining whether micro-organisms belong
+                  to the same species (<a id="xref-ref-13-2" class="xref-bibr" href="#ref-13">Tindall <em>et al.</em>, 2010</a>). DNA–DNA relatedness between <span class="named-content species" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup> was re-evaluated as follows. Wet biomass (3 g) from the tested strains suspended in isopropanol/water (1 : 1, v/v) was disrupted
+                  using a Constant Systems TS 0.75 kW disruptor (IUL Instruments) and the DNA in the crude lysate was purified by chromatography
+                  on hydroxyapatite as described by <a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Cashion <em>et al.</em> (1977)</a>. DNA–DNA hybridization was carried out as described by <a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">De Ley <em>et al.</em> (1970)</a> under consideration of the modifications described by <a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Huss <em>et al.</em> (1983)</a> using a model Cary 100 Bio UV/Vis spectrophotometer equipped with a Peltier-thermostatted 6×6 multicell changer and a temperature
+                  controller with <em>in</em>-<em>situ</em> temperature probe (Varian). The results showed that the tested strains had a binding level of 78.9 % (mean of three experiments,
+                  <span class="sc">sd</span> = 0.2 %), higher than the 70 % species boundary limit.
+               </p>
+               <p id="p-9">The DNA G+C contents of <span class="named-content species" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup> were re-evaluated as follows. DNA was degraded enzymically into nucleosides as described by <a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">Mesbah <em>et al.</em> (1989)</a>. The nucleoside mixture was then separated by HPLC as described previously (<a id="xref-ref-7-2" class="xref-bibr" href="#ref-7">Killer <em>et al.</em>, 2011</a>). The determined values were not significantly different between the studied strains (60.6 and 61.2 mol%, respectively).
+               </p>
+               <p id="p-10">API 50 CHL and Rapid ID 32A commercial kits (bioMérieux) were used for comparison of biochemical characteristics of <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup> to determine intra- or interspecies divergence. For this purpose, the strains were cultivated in anaerobic TPY broth. Tests
+                  were performed according to the manufacturer’s instructions, except that the API 50 CHL test strips were incubated under anaerobic
+                  conditions (anaerobic jars; Oxoid) at 37 °C for 48 h. Minor differences in biochemical characteristics between <span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup> and <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> are shown in <a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>. These results proved the close biochemical similarity of the tested strains.
+               </p>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4350/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4350/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Minor differences between <span class="named-content species" id="named-content-50"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                              href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> KCTC 5756<sup>T</sup> and <span class="named-content species" id="named-content-51"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                              href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> CCUG 18363<sup>T</sup></span>
+                     
+                     <p id="p-11" class="first-child">Both strains produced acids from <span class="sc">d</span>-ribose, <span class="sc">d</span>-galactose, <span class="sc">d</span>-glucose, amygdalin, arbutin, aesculin (hydrolysis), maltose, lactose, melibiose, sucrose, raffinose, gentiobiose and turanose.
+                        Neither strain produced acids from glycerol, erythritol, <span class="sc">d</span>- or <span class="sc">l</span>-arabinose, <span class="sc">d</span>- or <span class="sc">l</span>-xylose, <span class="sc">d</span>-adonitol, methyl β-<span class="sc">d</span>-xylopyranoside, <span class="sc">d</span>-mannose, <span class="sc">l</span>-sorbose, <span class="sc">l</span>-rhamnose, dulcitol, inositol, <span class="sc">d</span>-mannitol, methyl α-<span class="sc">d</span>-mannopyranoside, methyl α-<span class="sc">d</span>-glucopyranoside, <em>N</em>-acetylglucosamine, cellobiose, trehalose, inulin, melezitose, starch, glycogen, xylitol, <span class="sc">d</span>-lyxose, <span class="sc">d</span>-tagatose, <span class="sc">d</span>- or <span class="sc">l</span>-fucose, <span class="sc">d</span>- or <span class="sc">l</span>-arabitol, gluconate or 2- or 5-ketogluconate. Both strains were positive for α-galactosidase, α-glucosidase, β-galactosidase,
+                        β-glucosidase, α-arabinosidase, arginine arylamidase, proline arylamidase, leucyl glycine arylamidase, phenylalanine arylamidase,
+                        leucine arylamidase, tyrosine arylamidase, alanine arylamidase, glycine arylamidase, histidine arylamidase and serine arylamidase.
+                        Both strains were negative for urease, arginine dihydrolase, β-galactosidase-6-phosphate, β-glucuronidase, <em>N</em>-acetyl-β-glucosaminidase, glutamic acid decarboxylase, α-fucosidase, nitrate reduction, indole production, alkaline phosphatase,
+                        pyroglutamic acid arylamidase, glutamyl glutamic acid arylamidase, esterase (C4), valine arylamidase, cystine arylamidase,
+                        trypsin, α-chymotrypsin, α-mannosidase, gelatin hydrolysis, catalase and oxidase. +, Positive reaction; <span class="sc">w</span>, weakly positive reaction; −, negative reaction.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-12">On the basis of the phenotypic and important genotypic results presented in this study, it is proposed that <span class="named-content species" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="B. stercoris"
+                        href="doi:10.1601/nm.20247"><em>B. stercoris</em></a></span> and <span class="named-content species" id="named-content-55"><a class="namesforlife" rel="namesforlife-name" title="B. adolescentis"
+                        href="doi:10.1601/nm.7679"><em>B. adolescentis</em></a></span> represent the same species and should be united under the same name. It is concluded that <span class="named-content species" id="named-content-56"><a class="namesforlife" rel="namesforlife-name" title="Bifidobacterium stercoris"
+                        href="doi:10.1601/nm.20247"><em>Bifidobacterium stercoris</em></a></span> Kim <em>et al.</em> 2010 is a later heterotypic synonym of <span class="named-content species" id="named-content-57"><a class="namesforlife" rel="namesforlife-name"
+                        title="Bifidobacterium adolescentis"
+                        href="doi:10.1601/nm.7679"><em>Bifidobacterium adolescentis</em></a></span> Reuter 1963 (Approved Lists 1980), which has priority.
+               </p>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-13">This work was supported by the Czech Science Foundation (project no. GA CR 304/11/1252), the Operation Programme Education
+                     for Competitiveness project CEB (CZ.1.07/2.3.00/20.0183) and the Institutional Research Project of the Institute of Animal
+                     Physiology and Genetics, Acad. Sci. CR (RVO 67985904).
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.1"
+                             data-doi="10.1016/j.lwt.2004.05.002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berthoud</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chavagnat</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Haueter</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Casey</span>,  <span class="cit-name-given-names">M. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Comparison of partial gene sequences encoding a phosphoketolase for the identification of bifidobacteria</span>. <abbr class="cit-jnl-abbrev">LWT-Food Sci Technol</abbr> <span class="cit-vol">38</span>, <span class="cit-fpage">101</span>–<span class="cit-lpage">105</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.lwt.2004.05.002</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.lwt.2004.05.002&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Comparison%20of%20partial%20gene%20sequences%20encoding%20a%20phosphoketolase%20for%20the%20identification%20of%20bifidobacteria&amp;author=H.%20Berthoud&amp;author=F.%20Chavagnat&amp;author=M.%20Haueter&amp;author=M.%20G.%20Casey&amp;publication_year=2005&amp;journal=LWT-Food%20Sci%20Technol&amp;volume=38&amp;pages=101-105&amp;doi=10.1016%2Fj.lwt.2004.05.002">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.2"
+                             data-doi="10.1016/0003-2697(77)90720-5">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cashion</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Holder-Franklin</span>,  <span class="cit-name-given-names">M. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McCully</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Franklin</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1977</span><strong>).</strong> <span class="cit-article-title">A rapid method for the base ratio determination of bacterial DNA</span>. <abbr class="cit-jnl-abbrev">Anal Biochem</abbr> <span class="cit-vol">81</span>, <span class="cit-fpage">461</span>–<span class="cit-lpage">466</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/0003-2697(77)90720-5</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>907108</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/0003-2697(77)90720-5&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=907108&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20rapid%20method%20for%20the%20base%20ratio%20determination%20of%20bacterial%20DNA&amp;author=P.%20Cashion&amp;author=M.%20A.%20Holder-Franklin&amp;author=J.%20McCully&amp;author=M.%20Franklin&amp;publication_year=1977&amp;journal=Anal%20Biochem&amp;volume=81&amp;pages=461-466&amp;doi=10.1016%2F0003-2697%2877%2990720-5&amp;pmid=907108">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.3"
+                             data-doi="10.1111/j.1432-1033.1970.tb00830.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">De Ley</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cattoir</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reynaerts</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1970</span><strong>).</strong> <span class="cit-article-title">The quantitative measurement of DNA hybridization from renaturation rates</span>. <abbr class="cit-jnl-abbrev">Eur J Biochem</abbr> <span class="cit-vol">12</span>, <span class="cit-fpage">133</span>–<span class="cit-lpage">142</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1432-1033.1970.tb00830.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4984993</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1432-1033.1970.tb00830.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=4984993&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20quantitative%20measurement%20of%20DNA%20hybridization%20from%20renaturation%20rates&amp;author=J.%20De%20Ley&amp;author=H.%20Cattoir&amp;author=A.%20Reynaerts&amp;publication_year=1970&amp;journal=Eur%20J%20Biochem&amp;volume=12&amp;pages=133-142&amp;doi=10.1111%2Fj.1432-1033.1970.tb00830.x&amp;pmid=4984993">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.4"
+                             data-doi="10.1016/j.resmic.2009.12.006">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Delétoile</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Passet</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Aires</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chambaud</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Butel</span>,  <span class="cit-name-given-names">M.-J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smokvina</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brisse</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Species delineation and clonal diversity in four <em>Bifidobacterium</em> species as revealed by multilocus sequencing</span>. <abbr class="cit-jnl-abbrev">Res Microbiol</abbr> <span class="cit-vol">161</span>, <span class="cit-fpage">82</span>–<span class="cit-lpage">90</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.resmic.2009.12.006</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20060895</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.resmic.2009.12.006&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20060895&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Species%20delineation%20and%20clonal%20diversity%20in%20four%20Bifidobacterium%20species%20as%20revealed%20by%20multilocus%20sequencing&amp;author=A.%20Del%C3%A9toile&amp;author=V.%20Passet&amp;author=J.%20Aires&amp;author=I.%20Chambaud&amp;author=M.-J.%20Butel&amp;author=T.%20Smokvina&amp;author=S.%20Brisse&amp;publication_year=2010&amp;journal=Res%20Microbiol&amp;volume=161&amp;pages=82-90&amp;doi=10.1016%2Fj.resmic.2009.12.006&amp;pmid=20060895">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.5"
+                             data-doi="10.1016/S0723-2020(83)80048-4">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Huss</span>,  <span class="cit-name-given-names">V. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Festl</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K. H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1983</span><strong>).</strong> <span class="cit-article-title">Studies on the spectrophotometric determination of DNA hybridization from renaturation rates</span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">184</span>–<span class="cit-lpage">192</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0723-2020(83)80048-4</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23194591</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0723-2020(83)80048-4&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23194591&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Studies%20on%20the%20spectrophotometric%20determination%20of%20DNA%20hybridization%20from%20renaturation%20rates&amp;author=V.%20A.%20Huss&amp;author=H.%20Festl&amp;author=K.%20H.%20Schleifer&amp;publication_year=1983&amp;journal=Syst%20Appl%20Microbiol&amp;volume=4&amp;pages=184-192&amp;doi=10.1016%2FS0723-2020%2883%2980048-4&amp;pmid=23194591">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.6"
+                             data-doi="10.1093/bioinformatics/bti463">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jeon</span>,  <span class="cit-name-given-names">Y. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chung</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Park</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hur</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">J. H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chun</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">jPHYDIT: a JAVA-based integrated environment for molecular phylogeny of ribosomal RNA sequences</span>. <abbr class="cit-jnl-abbrev">Bioinformatics</abbr> <span class="cit-vol">21</span>, <span class="cit-fpage">3171</span>–<span class="cit-lpage">3173</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/bioinformatics/bti463</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15855247</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=bioinfo&amp;resid=21/14/3171"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.7"
+                             data-doi="10.1099/ijs.0.022525-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Killer</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kopečný</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mrázek</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Koppová</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Havlík</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Benada</span>,  <span class="cit-name-given-names">O.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kott</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title"><em>Bifidobacterium actinocoloniiforme</em> sp. nov. and <em>Bifidobacterium bohemicum</em> sp. nov., from the bumblebee digestive tract</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">61</span>, <span class="cit-fpage">1315</span>–<span class="cit-lpage">1321</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.022525-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20656822</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=61/6/1315"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.8"
+                             data-doi="10.1016/j.syapm.2012.09.001">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Killer</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mrázek</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bunešová</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Havlík</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Koppová</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Benada</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rada</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kopečný</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Vlková</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title"><em>Pseudoscardovia suis</em> gen. nov., sp. nov., a new member of the family <em>Bifidobacteriaceae</em> isolated from the digestive tract of wild pigs (<em>Sus scrofa</em>)</span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">36</span>, <span class="cit-fpage">11</span>–<span class="cit-lpage">16</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.syapm.2012.09.001</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23122702</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.syapm.2012.09.001&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23122702&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Pseudoscardovia%20suis%20gen.%20nov.%2C%20sp.%20nov.%2C%20a%20new%20member%20of%20the%20family%20Bifidobacteriaceae%20isolated%20from%20the%20digestive%20tract%20of%20wild%20pigs%20%28Sus%20scrofa%29&amp;author=J.%20Killer&amp;author=J.%20Mr%C3%A1zek&amp;author=V.%20Bune%C5%A1ov%C3%A1&amp;author=J.%20Havl%C3%ADk&amp;author=I.%20Koppov%C3%A1&amp;author=O.%20Benada&amp;author=V.%20Rada&amp;author=J.%20Kope%C4%8Dn%C3%BD&amp;author=E.%20Vlkov%C3%A1&amp;publication_year=2013&amp;journal=Syst%20Appl%20Microbiol&amp;volume=36&amp;pages=11-16&amp;doi=10.1016%2Fj.syapm.2012.09.001&amp;pmid=23122702">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.9"
+                             data-doi="10.1099/ijs.0.019943-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">M. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Roh</span>,  <span class="cit-name-given-names">S. W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bae</span>,  <span class="cit-name-given-names">J. W.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title"><em>Bifidobacterium stercoris</em> sp. nov., isolated from human faeces</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">60</span>, <span class="cit-fpage">2823</span>–<span class="cit-lpage">2827</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.019943-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20081020</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=60/12/2823"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.10"
+                             data-doi="10.1099/00207713-39-2-159">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mesbah</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Premachandran</span>,  <span class="cit-name-given-names">U.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Whitman</span>,  <span class="cit-name-given-names">W. B.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989</span><strong>).</strong> <span class="cit-article-title">Precise measurement of the G+C content of deoxyribonucleic acid by high performance liquid chromatography</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">159</span>–<span class="cit-lpage">167</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-39-2-159</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=39/2/159"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4350.11">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Sneath</span>,  <span class="cit-name-given-names">P. H. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Mair</span>,  <span class="cit-name-given-names">N. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Sharp</span>,  <span class="cit-name-given-names">M. E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Scardovi</span>,  <span class="cit-name-given-names">V.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1986</span><strong>).</strong> <span class="cit-article-title">Genus <em>Bifidobacterium</em></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1418</span>–<span class="cit-lpage">1434</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Sneath</span>,  <span class="cit-name-given-names">P. H. A.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Mair</span>,  <span class="cit-name-given-names">N. S.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Sharp</span>,  <span class="cit-name-given-names">M. E.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span>
+                                 . <span class="cit-publ-loc">Baltimore</span>: <span class="cit-publ-name">Williams &amp; Wilkins</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20Bifidobacterium&amp;author=V.%20Scardovi&amp;publication_year=1986&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.12"
+                             data-doi="10.1007/PL00006538">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Teichmann</span>,  <span class="cit-name-given-names">S. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mitchison</span>,  <span class="cit-name-given-names">G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1999</span><strong>).</strong> <span class="cit-article-title">Is there a phylogenetic signal in prokaryote proteins?</span> <abbr class="cit-jnl-abbrev">J Mol Evol</abbr> <span class="cit-vol">49</span>, <span class="cit-fpage">98</span>–<span class="cit-lpage">107</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/PL00006538</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>10368438</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/PL00006538&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=10368438&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Is%20there%20a%20phylogenetic%20signal%20in%20prokaryote%20proteins%3F&amp;author=S.%20A.%20Teichmann&amp;author=G.%20Mitchison&amp;publication_year=1999&amp;journal=J%20Mol%20Evol&amp;volume=49&amp;pages=98-107&amp;doi=10.1007%2FPL00006538&amp;pmid=10368438">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.13"
+                             data-doi="10.1099/ijs.0.016949-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rosselló-Móra</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Busse</span>,  <span class="cit-name-given-names">H. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ludwig</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kämpfer</span>,  <span class="cit-name-given-names">P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Notes on the characterization of prokaryote strains for taxonomic purposes</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">60</span>, <span class="cit-fpage">249</span>–<span class="cit-lpage">266</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.016949-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19700448</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=60/1/249"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4350.14"
+                             data-doi="10.1099/ijs.0.64233-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ventura</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Canchaya</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Del Casale</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dellaglio</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Neviani</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fitzgerald</span>,  <span class="cit-name-given-names">G. F.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">van Sinderen</span>,  <span class="cit-name-given-names">D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">Analysis of bifidobacterial evolution using a multilocus approach</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">56</span>, <span class="cit-fpage">2783</span>–<span class="cit-lpage">2792</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.64233-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17158978</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=56/12/2783"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4340.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4354.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="free-article">
+               <span class="free-article-note">
+                  FREE ARTICLE
+                  </span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.054957-0" class="slug-doi">10.1099/ijs.0.054957-0
+                                 </span>
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4350-4353
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/63/Pt_11/4350.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4350.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_11/4350/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_11/4350">PPT Slides of All Figures</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings last-child">
+                              <li><a class="tocsection-search"
+                                    href="/search?tocsectionid=Taxonomic+Note&amp;sortspec=date&amp;submit=Submit">Taxonomic Note</a></li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4350&amp;current-view-path=/content/63/Pt_11/4350.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4350&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4350.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4350&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4350.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.054957-0&amp;citation=Killer%20et%20al.%2063%20%28Pt%2011%29:%204350&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4350&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=24187022&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4350">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4350.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4350#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4350" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4350&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4350.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AKiller%20author%3AJ.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Killer, J.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AKope%C4%8Dn%C3%BD%20author%3AJ.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Kopečný, J.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4350.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=24187022&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Killer%20J&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Killer, J.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Kope%C4%8Dn%C3%BD%20J&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Kopečný, J.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/24187022"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4350.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4350#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4350&amp;title=Reclassification%20of%20Bifidobacterium%20stercoris%20Kim%20et%20al.%202010%20as%20a%20later%20heterotypic%20synonym%20of%20Bifidobacterium%20adolescentis+--+Killer%20et%20al.%2063%20%28Pt%2011%29%3A%204350+--+IJSEM&amp;doi=10.1099/ijs.0.054957-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/fulltext.pdf
new file mode 100644
index 00000000..3e146915
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/results.json b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/results.json
new file mode 100644
index 00000000..c9efd168
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4350.full/results.json
@@ -0,0 +1,89 @@
+{
+  "publisher": {
+    "value": [
+      "Society for General Microbiology"
+    ]
+  },
+  "journal": {
+    "value": [
+      "International Journal of Systematic and Evolutionary\n                Microbiology"
+    ]
+  },
+  "title": {
+    "value": [
+      "Reclassification of Bifidobacterium stercoris Kim et al. 2010 as a later heterotypic synonym of Bifidobacterium adolescentis"
+    ]
+  },
+  "authors": {
+    "value": [
+      "J. Killer",
+      "I. Sedláček",
+      "V. Rada",
+      "J. Havlík",
+      "J. Kopečný"
+    ]
+  },
+  "date": {
+    "value": [
+      "11/01/2013"
+    ]
+  },
+  "doi": {
+    "value": [
+      "10.1099/ijs.0.054957-0"
+    ]
+  },
+  "volume": {
+    "value": [
+      "63"
+    ]
+  },
+  "issue": {
+    "value": [
+      "Pt 11"
+    ]
+  },
+  "firstpage": {
+    "value": [
+      "4350"
+    ]
+  },
+  "abstract": {
+    "value": [
+      "\n                  \n                      Next Section\n                  Abstract\n                  \n                  The taxonomic position of Bifidobacterium stercoris Eg1T ( = JCM 15918T) based on comparative 16S rRNA gene and hsp60 sequence analyses was found to be controversial, as the strain showed high similarity to the type strain of Bifidobacterium adolescentis, CCUG 18363T. Therefore, the relationship between the two species was investigated by a taxonomic study that included, in addition to\n                     re-evaluation of the 16S rRNA gene sequence, determination of DNA–DNA binding and multilocus sequence analysis (MLSA) of housekeeping\n                     genes encoding the DNA-directed RNA polymerase B subunit (rpoC), putative xylulose-5-phosphate/fructose-6-phosphate phosphoketolase (xfp), elongation factor EF-G (fusA), 50S ribosomal protein L2 (rplB) and DNA gyrase B subunit (gyrB). Comparative 16S rRNA gene sequence analysis showed relatively high similarity (98.9 %) between B. stercoris KCTC 5756T and B. adolescentis ATCC 15703T. MLSA revealed close relatedness between B. stercoris KCTC 5756T and B. adolescentis CCUG 18363T, with 99.3–100 % similarity between the rpoC, xfp, fusA, rplB and gyrB gene sequences. In addition, relatively high dnaJ1 gene sequence similarity of 97.7 % was found between the strains. Similar phenotypes and a high DNA–DNA binding value (78.9 %)\n                     confirmed that B. stercoris and B. adolescentis are synonymous. Based on these results, it is proposed that the species Bifidobacterium stercoris Kim et al. 2010 should be reclassified as a later heterotypic synonym of Bifidobacterium adolescentis Reuter 1963 (Approved Lists 1980).\n                  \n                  \n               "
+    ]
+  },
+  "fulltext_html": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4350.full"
+    ]
+  },
+  "fulltext_pdf": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4350.full.pdf"
+    ]
+  },
+  "supplementary_material": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4350/suppl/DC1"
+    ]
+  },
+  "figure": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4350/F1.small.gif"
+    ]
+  },
+  "figure_caption": {
+    "value": [
+      "Fig. 1.  \n                     \n                     Phylogenetic tree of the family Bifidobacteriaceae showing the very close relationship of B. adolescentis CCUG 18363T and B. stercoris KCTC 5756T, reconstructed by the maximum-likelihood method based on concatenated partial sequences of the hsp60 (539 nt) and xfp (418 nt) genes using mega version 5.05 software after removing hypervariable positions by using the program Gblocks. Sequence data were aligned using\n                        the clustal w algorithm. The Tamura–Nei model was used for reconstruction of the phylogenetic tree. Bootstrap values, expressed as percentages\n                        of 1000 datasets, are given at nodes. GenBank accession numbers of partial gene sequences derived from type strains are presented\n                        in Table S1. The tree was rooted by Gardnerella vaginalis ATCC 14018T. Bar, 0.04 substitutions per nucleotide position.\n                     \n                     \n                     \n                  "
+    ]
+  },
+  "license": {
+    "value": []
+  },
+  "copyright": {
+    "value": [
+      "Copyright ©\n                     \t\t2015 International Union of Microbiological Societies\n                     \t\n                  "
+    ]
+  }
+}
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/DC1 b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/DC1
new file mode 100644
index 00000000..7cdf1ee6
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/DC1
@@ -0,0 +1,350 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Supplementary material </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/ijs.0.056440-0/DC1" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-data-supp.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-data-supp.css" /><script type="text/javascript" id="session-d7728117e1">var callbackToken='56356970A2E8388';</script><script type="text/javascript" id="session-d7728117e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-data-supp.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-data-supp">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4354%2Fsuppl%2FDC1">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <h1 class="data-supp-article-title">Designation of type strains for seven species of the order <em>Myxococcales</em> and proposal for neotype strains of <em>Cystobacter ferrugineus</em>, <em>Cystobacter minus</em> and <em>Polyangium fumosum</em></h1>
+            <div><span class="highwire-journal-article-marker-start"></span><div class="auto-clean"><span style="font-family: Verdana,Arial,Helvetica,sans-serif;  font-size: 83.33%">
+                     
+                     
+                     <h2>Supplementary material</h2>
+                     
+                     <p><strong>Files in this Data Supplement:</strong></p>
+                     
+                     <ul>
+                        <li><a href="/content/suppl/2013/11/05/ijs.0.056440-0.DC1/ijs056440.pdf">Supplementary material</a> 
+                           		
+                           
+                        </li>
+                     </ul>
+                     </span>
+                  
+                  
+               </div><span class="highwire-journal-article-marker-end"></span></div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              	
+                              
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.056440-0" class="slug-doi">10.1099/ijs.0.056440-0</span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date">
+                                    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4354-4360
+                                    </span>
+                                 </cite>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/63/Pt_11/4354.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><a href="/content/63/Pt_11/4354.full" rel="view-full-text">Full Text</a><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4354.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a></li>
+                        <li><span class="variant-indicator">» <span>Supplementary material</span></span></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F1.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F1.small.gif
new file mode 100644
index 00000000..a95e1078
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F1.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F10.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F10.small.gif
new file mode 100644
index 00000000..0f61a325
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F10.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F2.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F2.small.gif
new file mode 100644
index 00000000..82363b89
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F2.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F3.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F3.small.gif
new file mode 100644
index 00000000..ed37c5ca
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F3.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F4.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F4.small.gif
new file mode 100644
index 00000000..8188a5cd
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F4.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F5.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F5.small.gif
new file mode 100644
index 00000000..cba036a0
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F5.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F6.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F6.small.gif
new file mode 100644
index 00000000..131147bf
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F6.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F7.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F7.small.gif
new file mode 100644
index 00000000..2590fb41
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F7.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F8.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F8.small.gif
new file mode 100644
index 00000000..a317af51
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F8.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F9.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F9.small.gif
new file mode 100644
index 00000000..5aa55735
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F9.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.html b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.html
new file mode 100644
index 00000000..364023aa
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.html
@@ -0,0 +1,1307 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Designation of type strains for seven species of the order Myxococcales and proposal for neotype strains of Cystobacter ferrugineus,
+         Cystobacter minus and Polyangium fumosum 
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4354" />
+      <meta content="/ijs/63/Pt_11/4354.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Designation of type strains for seven species of the order Myxococcales and proposal for neotype strains of Cystobacter ferrugineus, Cystobacter minus and Polyangium fumosum"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.056440-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Elke Lang" name="DC.Contributor" />
+      <meta content="Hans Reichenbach" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Elke Lang" />
+      <meta name="citation_author_institution"
+            content="1Leibniz-Institut DSMZ – Deutsche Sammlung von Mikroorganismen und Zellkulturen GmbH, Inhoffenstrasse 7B, 38124 Braunschweig, Germany" />
+      <meta name="citation_author" content="Hans Reichenbach" />
+      <meta name="citation_author_institution"
+            content="2Helmholtz-Zentrum für Infektionsforschung, Inhoffenstrasse 7, 38124 Braunschweig, Germany" />
+      <meta content="Designation of type strains for seven species of the order Myxococcales and proposal for neotype strains of Cystobacter ferrugineus, Cystobacter minus and Polyangium fumosum"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4354" name="citation_firstpage" />
+      <meta content="4360" name="citation_lastpage" />
+      <meta content="63/Pt_11/4354" name="citation_id" />
+      <meta content="63/Pt 11/4354" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4354" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.056440-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4354.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4354.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4354.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4354"
+            name="citation_public_url" />
+      <meta content="24187023" name="citation_pmid" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Taxonomic Note" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4350.short" rel="prev" />
+      <link href="/content/63/Pt_11/4361.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d7727761e1">var callbackToken='56356970A2E8388';</script><script type="text/javascript" id="session-d7727761e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search-go" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4354.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline">Designation of type strains for seven species of the order <em>Myxococcales</em> and proposal for neotype strains of <em>Cystobacter ferrugineus</em>, <em>Cystobacter minus</em> and <em>Polyangium fumosum</em></h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Elke+Lang&amp;sortspec=date&amp;submit=Submit">Elke Lang</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-2"><span class="name"><a class="name-search"
+                              href="/search?author1=Hans+Reichenbach&amp;sortspec=date&amp;submit=Submit">Hans Reichenbach</a></span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-1" class="xref-fn" href="#fn-1">†</a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>Leibniz-Institut DSMZ – Deutsche Sammlung von Mikroorganismen und Zellkulturen GmbH, Inhoffenstrasse 7B, 38124 Braunschweig,
+                           Germany
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>Helmholtz-Zentrum für Infektionsforschung, Inhoffenstrasse 7, 38124 Braunschweig, Germany
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Corresponding</strong><br />Elke Lang <span class="em-link"><span class="em-addr">ela{at}dsmz.de</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-3">Ten species of the order <span class="named-content order" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Myxococcales"
+                           href="doi:10.1601/nm.3690"><em>Myxococcales</em></a></span> with validly published names are devoid of living type strains. Four species of the genus <span class="named-content genus" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces"
+                           href="doi:10.1601/nm.3749"><em>Chondromyces</em></a></span> are represented by dead herbarium samples as the type material. For a species of the genus <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Melittangium"
+                           href="doi:10.1601/nm.3710"><em>Melittangium</em></a></span> and two species of the genus <span class="named-content genus" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="Polyangium"
+                           href="doi:10.1601/nm.3736"><em>Polyangium</em></a></span>, no physical type material was assigned at the time of validation of the names or later on. In accordance with rule 18f of
+                     the International Code of Nomenclature of Bacteria the following type strains are designated for these species: strain Cm
+                     a14<sup>T</sup> ( = DSM 14605<sup>T</sup> = JCM 12615<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces apiculatus"
+                           href="doi:10.1601/nm.3751"><em>Chondromyces apiculatus</em></a></span>, strain Cm c5<sup>T</sup> ( = DSM 14714<sup>T</sup> = JCM 12616<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces crocatus"
+                           href="doi:10.1601/nm.3750"><em>Chondromyces crocatus</em></a></span>, strain Sy t2<sup>T</sup> ( = DSM 14631<sup>T</sup> = JCM 12617<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                           href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span>, strain Cm p51<sup>T</sup> ( = DSM 14607<sup>T</sup> = JCM 12618<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                           href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span>, strain Me b8<sup>T</sup> ( = DSM 14713<sup>T</sup> = JCM 12633<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Melittangium boletus"
+                           href="doi:10.1601/nm.3711"><em>Melittangium boletus</em></a></span>, strain Pl s12<sup>T</sup> ( = DSM 14670<sup>T</sup> = JCM 12637<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Polyangium sorediatum"
+                           href="doi:10.1601/nm.3745"><em>Polyangium sorediatum</em></a></span> and strain Pl sm5<sup>T</sup> ( = DSM 14734<sup>T</sup> = JCM 12638<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Polyangium spumosum"
+                           href="doi:10.1601/nm.3746"><em>Polyangium spumosum</em></a></span>. Furthermore, the type strains given for three species of the genera <span class="named-content genus" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter"
+                           href="doi:10.1601/nm.3693"><em>Cystobacter</em></a></span> and <span class="named-content genus" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Polyangium"
+                           href="doi:10.1601/nm.3736"><em>Polyangium</em></a></span> had been kept at one university institute and have been lost according to our investigations. In accordance with Rule 18c
+                     of the Bacteriological Code, we propose the following neotype strains: strain Cb fe18 ( = DSM 14716  = JCM 12624) as the neotype
+                     strain of <span class="named-content species" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                           href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span>, strain Cb m2 ( = DSM 14751 = JCM 12627) as the neotype strain of <span class="named-content species" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                           href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span> and strain Pl fu5 ( = DSM 14668 = JCM 12636) as the neotype strain of <span class="named-content species" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Polyangium fumosum"
+                           href="doi:10.1601/nm.3740"><em>Polyangium fumosum</em></a></span>. The proposals of the strains are based on the descriptions and strain proposals given in the respective chapters of <em>Bergey’s Manual of Systematic Bacteriology</em> (2005).
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn" id="fn-1">
+                        <p id="p-1"><a class="rev-xref" href="#xref-fn-1-1">↵</a><span class="fn-label">†</span> Retired.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-2">
+                        <p id="p-2">Two supplementary tables are available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <p id="p-4">An exceptionally high number of myxobacterial species descriptions is not supported by the availability of formally acknowledged
+                  living type strain material. Because of this lack of material, the species could not be included, for example, in species-representing
+                  16S rRNA gene sequence databases. These are the most frequently used guides in taxonomy currently, and for that reason, great
+                  efforts are taken to fill the sequencing gaps (<a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Yarza <em>et al.</em>, 2013</a>). The International Code of Nomenclature of Bacteria (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Lapage <em>et al.</em>, 1992</a>) allows for the designation of type strains in cases where descriptions or dead specimens represent the type given for species
+                  with validly published species names. The code also allows for the proposal of neotype strains if a specimen of the strain
+                  on which the original description was based cannot be found. These measures have been installed in order to clear the way
+                  for inclusion of such species in future examinations, in particular in studies including ‘new’ methods which had not been
+                  applied at the time of the species description. In this communication, we formally designate type strains for seven and formally
+                  propose neotype strains for three species of the order <span class="named-content order" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Myxococcales"
+                        href="doi:10.1601/nm.3690"><em>Myxococcales</em></a></span>.
+               </p>
+               <p id="p-5">The present wording of Rule 18f of the International Code is: ‘If a description or illustration constitutes, or a dead preserved
+                  specimen has been designated as the type of a species [Rule 18a(1)] and a later strain of this species is cultivated, then
+                  the type strain may be designated by the person who isolated the strain or by a subsequent author. This type strain shall
+                  then replace the description, illustration or preserved specimen as the nomenclatural type. The designation of a type strain
+                  in this manner must be published in the IJSB/IJSEM, the authorship and date of priority of publication being determined by
+                  the effective and valid publication of the name by the original authors (Rule 24b)’.
+               </p>
+               <p id="p-6">The presently designated type strains of the species <span class="named-content species" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces apiculatus"
+                        href="doi:10.1601/nm.3751"><em>Chondromyces apiculatus</em></a></span> (<a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Thaxter, 1897</a>), <span class="named-content species" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces crocatus"
+                        href="doi:10.1601/nm.3750"><em>Chondromyces crocatus</em></a></span> (Berkeley &amp; Curtis, 1874), <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                        href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span> (<a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Kofler, 1913</a>) and <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                        href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span> (<a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Thaxter, 1904</a>) are dead herbarium specimens in the Thaxter collection (TC), housed in the Farlow Herbarium, Harvard University, Cambridge,
+                  USA (<a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>). Howard McCurdy studied myxobacteria at the University of Windsor, Ontario, Canada during the period around 1960–1970. He
+                  assigned specific samples of the Thaxter collection as the types of these species (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">McCurdy, 1971</a>). The species names were included in the Approved Lists (Skerman <em>et al.</em>, 1980). According to a curator of the herbarium, the specimen for <span class="named-content species" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                        href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span> seems to be lost whereas the other three specimens are still there, dried on the original substrates, accompanied by some
+                  slides.
+               </p>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4354/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Myxobacterial species for which a cultivable type strain or neotype strain is formally proposed and the 16S rRNA sequences
+                        of the proposed neotype strains. AL, type strain as given in Approved Lists (Skerman <em>et al.</em>, 1980). VL, types as given in Validation List No 31 (<a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Brockman, 1989b</a>, <a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">c</a>)</span>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-7">For the species <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="Melittangium boletus"
+                        href="doi:10.1601/nm.3711"><em>Melittangium boletus</em></a></span> (<a id="xref-ref-7-2" class="xref-bibr" href="#ref-7">Jahn, 1924</a>), <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="Polyangium sorediatum"
+                        href="doi:10.1601/nm.3745"><em>Polyangium sorediatum</em></a></span> (<a id="xref-ref-3-3" class="xref-bibr" href="#ref-3">Brockman, 1989a</a>) and <span class="named-content species" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="Polyangium spumosum"
+                        href="doi:10.1601/nm.3746"><em>Polyangium spumosum</em></a></span> (<a id="xref-ref-3-4" class="xref-bibr" href="#ref-3">Brockman, 1989a</a>) no physical type strains were assigned in the Approved Lists (<a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Skerman <em>et al.</em>, 1980</a>) or in Validation List No. 31 (<a id="xref-ref-4-2" class="xref-bibr" href="#ref-4">Brockman, 1989b</a>,<a id="xref-ref-5-2" class="xref-bibr" href="#ref-5">c</a>), respectively. Instead, the descriptions of <a id="xref-ref-3-5" class="xref-bibr" href="#ref-3">Brockman (1989a)</a> or simply the statement ‘not cultivated’ are given.
+               </p>
+               <p id="p-8">Bergey’s Manual of Systematic Bacteriology, second edition, includes comprehensive chapters about the members of the order
+                  <span class="named-content order" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="Myxococcales"
+                        href="doi:10.1601/nm.3690"><em>Myxococcales</em></a></span>. <a id="xref-ref-15-5" class="xref-bibr" href="#ref-15">Reichenbach (2005a</a>, <a id="xref-ref-16-5" class="xref-bibr" href="#ref-16">b</a>, <a id="xref-ref-17-2" class="xref-bibr" href="#ref-17">c</a>, d, e) are the chapters relevant to the taxa mentioned in this paper. These chapters are based on the experience and knowledge
+                  accumulated during 40 years of intense investigations on myxobacteria and were written after more than 3000 myxobacterial
+                  strains had been isolated. Based on the original species descriptions, appropriate strains were selected and described as
+                  the type strains of the respective species (<a id="xref-table-wrap-1-2" class="xref-table" href="#T1">Table 1</a>). However, it has not been formally proposed in the IJSEM until now to accept these strains as the type strains.
+               </p>
+               <p id="p-9">For the reason that presently dead preserved material constitutes-, or a description has been designated-, the type strain
+                  of the mentioned species, or no type strain has been assigned, it is formally proposed that the strains selected by Reichenbach
+                  shall be designated the type strains of the respective species according to Rule 18f. The proposed type strains listed in
+                  <a id="xref-table-wrap-1-3" class="xref-table" href="#T1">Table 1</a> shall replace the dead specimen or descriptions. These are <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces apiculatus"
+                        href="doi:10.1601/nm.3751"><em>Chondromyces apiculatus</em></a></span> Cm a14<sup>T</sup>, <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces crocatus"
+                        href="doi:10.1601/nm.3750"><em>Chondromyces crocatus</em></a></span> Cm c5<sup>T</sup>, <span class="named-content species" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                        href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span> Sy t2<sup>T</sup>, <span class="named-content species" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                        href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span> Cm p51<sup>T</sup>, <span class="named-content species" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="M. boletus"
+                        href="doi:10.1601/nm.3711"><em>M. boletus</em></a></span> Me b8<sup>T</sup>, <span class="named-content species" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="P. sorediatum"
+                        href="doi:10.1601/nm.3745"><em>P. sorediatum</em></a></span> Pl s12<sup>T</sup> and <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="P. spumosum"
+                        href="doi:10.1601/nm.3746"><em>P. spumosum</em></a></span> Pl sm5<sup>T</sup>. The prerequisite for the acceptance of type strains, their deposit and availability in two culture collections is achieved.
+                  The designation of the type strains is based on the descriptions given in the respective chapters of Bergey’s Manual (<a id="xref-ref-15-6" class="xref-bibr" href="#ref-15">Reichenbach 2005a</a>, <a id="xref-ref-17-3" class="xref-bibr" href="#ref-17">c</a>, <a id="xref-ref-18-5" class="xref-bibr" href="#ref-18">d</a>). In order to facilitate the comparison of these recent descriptions with those of the authors who originally proposed, revived
+                  or emended the species, these original descriptions are assembled in Table S1 available in IJSEM Online. The fatty acid compositions
+                  of the proposed type strains are given in Table S2 (<a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Garcia <em>et al.</em>, 2011</a>). The figures from the original descriptions are shown face to face with figures showing
+                  the proposed type strains in <a id="xref-fig-1-1" class="xref-fig" href="#F1">Figs 1</a>–<a id="xref-fig-2-1" class="xref-fig" href="#F2">10</a>.
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F1.expansion.html"><img alt="Fig. 1. " src="4354/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-10" class="first-child"><span class="named-content species" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces apiculatus"
+                              href="doi:10.1601/nm.3751"><em>Chondromyces apiculatus</em></a></span>. (a) Drawing from <a id="xref-ref-21-3" class="xref-bibr" href="#ref-21">Thaxter (1897)</a>, plate XXX on pages 405–406. (b) Fruiting body (bar, 100 µm) and vegetative cells (insert; bar, 10 µm) of Cm a14<sup>T</sup>.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F2" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F2.expansion.html"><img alt="Fig. 10. " src="4354/F2.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F2.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F2.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F2">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 10. </span> 
+                     
+                     <p id="p-11" class="first-child"><span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="Polyangium fumosum"
+                              href="doi:10.1601/nm.3740"><em>Polyangium fumosum</em></a></span>. (a) Drawing from <a id="xref-ref-11-3" class="xref-bibr" href="#ref-11">Krzemieniewska &amp; Krzemieniewski (1930)</a>, plate XVI, nos 6–9 depict <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="P. fumosum"
+                              href="doi:10.1601/nm.3740"><em>P. fumosum</em></a></span>. Courtesy of the Polish Botanical Society. (b) Swarm of Pl fu5 (bar, 2000 µm) and single sporangium of Pl fu5 (insert; bar,
+                        100 µm). (c) Fruiting bodies of Pl fu5. Bar, 300 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-12">The Bacteriological Code also allows for the proposal of neotype strains according to Rule 18c: ‘If a strain on which the
+                  original description was based cannot be found, a neotype strain may be proposed. A neotype strain must be proposed (proposed
+                  neotype) in the IJSB, together with citation of the author(s) of the name, a description or reference to an effectively published
+                  description and a record of the permanently established culture collection(s) where the strain is deposited (see also Note
+                  1 to Rule 24a)’.
+               </p>
+               <p id="p-13">The species <span class="named-content species" id="named-content-50"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                        href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span>, <span class="named-content species" id="named-content-51"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                        href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span> and <span class="named-content species" id="named-content-52"><a class="namesforlife" rel="namesforlife-name" title="Polyangium fumosum"
+                        href="doi:10.1601/nm.3740"><em>Polyangium fumosum</em></a></span> were first described by <a id="xref-ref-9-3" class="xref-bibr" href="#ref-9">Krzemieniewska &amp; Krzemieniewski (1926</a>, <a id="xref-ref-10-4" class="xref-bibr" href="#ref-10">1927</a>, <a id="xref-ref-11-4" class="xref-bibr" href="#ref-11">1930)</a>. McCurdy assigned three of his isolates as the type strains for the above-mentioned three species (<a id="xref-ref-13-5" class="xref-bibr" href="#ref-13">McCurdy, 1970</a>; <a id="xref-table-wrap-1-4" class="xref-table" href="#T1">Table 1</a>). The species names and type strains were included in the Approved Lists (<a id="xref-ref-20-2" class="xref-bibr" href="#ref-20">Skerman <em>et al.</em>, 1980</a>) but they have never been deposited in a culture collection to the best of our knowledge. In 2007, we wrote a letter to the
+                  head of the microbiology laboratory of the University of Windsor with the request for subcultures of the strains <span class="named-content species" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                        href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span> M-203<sup>T</sup>, <span class="named-content species" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                        href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span> M-307<sup>T</sup> and <span class="named-content species" id="named-content-55"><a class="namesforlife" rel="namesforlife-name" title="P. fumosum"
+                        href="doi:10.1601/nm.3740"><em>P. fumosum</em></a></span> M257<sup>T</sup>. Even though the importance for microbial taxonomy was stressed there was no response. In 2012, another attempt to contact
+                  the department at Windsor University was more successful in the respect that we received answers from two colleagues at Windsor
+                  and from H. D. McCurdy who retired several years ago. However, they informed us that they cannot find the samples. Since 1981,
+                  there have been no scientific papers originating from the University of Windsor dealing with myxobacteria (PubMed), a fact
+                  additionally suggesting that nobody at the university had a research interest to keep the cultures alive or, at least, under
+                  surveillance. For these reasons we conclude that these cultures must have been lost.
+               </p>
+               <p id="p-14">Since the presently assigned type strains of the mentioned species are no longer available as living cultures it is formally
+                  proposed that the strains selected by Reichenbach shall be designated as the neotype strains of the respective species in accordance
+                  with Rule 18c, as given in <a id="xref-table-wrap-1-5" class="xref-table" href="#T1">Table 1</a>. The deposit and availability of the neotype strains from two culture collections is achieved. The proposals of the neotype
+                  strains are based on the suggestions in <a id="xref-ref-16-6" class="xref-bibr" href="#ref-16">Reichenbach (2005b</a>, <a id="xref-ref-18-6" class="xref-bibr" href="#ref-18">d</a>). In these chapters, the strains <span class="named-content species" id="named-content-56"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                        href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span> Cb fe18, <span class="named-content species" id="named-content-57"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                        href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span> Cb m2 and <span class="named-content species" id="named-content-58"><a class="namesforlife" rel="namesforlife-name" title="P. fumosum"
+                        href="doi:10.1601/nm.3740"><em>P. fumosum</em></a></span> Pl fu5 were proposed as the type strains according to the species descriptions given in the respective chapters which rely
+                  on the original species descriptions by Krzemieniewska and Krzemieniewski and McCurdy (<a id="xref-ref-16-7" class="xref-bibr" href="#ref-16">Reichenbach 2005b</a>, <a id="xref-ref-18-7" class="xref-bibr" href="#ref-18">d</a>). However, since type strains have already been assigned these strains have to be proposed as the neotype strains of the
+                  respective species according to Rule 18c.
+               </p>
+               <div id="F3" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F3.expansion.html"><img alt="Fig. 2. " src="4354/F3.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F3.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F3.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F3">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 2. </span> 
+                     
+                     <p id="p-15" class="first-child"><span class="named-content species" id="named-content-59"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces crocatus"
+                              href="doi:10.1601/nm.3750"><em>Chondromyces crocatus</em></a></span>. (a) Drawing from <a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Berkeley (1857)</a>, page 313. (b) Fruiting bodies of Cm c5<sup>T</sup>. Bar, 500 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F4" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F4.expansion.html"><img alt="Fig. 3. " src="4354/F4.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F4.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F4.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F4">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 3. </span> 
+                     
+                     <p id="p-16" class="first-child"><span class="named-content species" id="named-content-60"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                              href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span>. (a) Figures from <a id="xref-ref-8-3" class="xref-bibr" href="#ref-8">Kofler (1913)</a>, <a id="xref-fig-1-2" class="xref-fig" href="#F1">Figs 1</a>–<a id="xref-fig-4-1" class="xref-fig" href="#F4">3</a> on page 877 depict <span class="named-content species" id="named-content-61"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                              href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span>. Courtesy Österreichische Akademie der Wissenschaften. (b) Fruiting body of Sy t2<sup>T</sup>. Bar, 100 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F5" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F5.expansion.html"><img alt="Fig. 4. " src="4354/F5.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F5.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F5.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F5">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 4. </span> 
+                     
+                     <p id="p-17" class="first-child"><span class="named-content species" id="named-content-62"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                              href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span>. (a) Drawing from <a id="xref-ref-22-4" class="xref-bibr" href="#ref-22">Thaxter (1904)</a>, plate XXVI on page 411; nos 7–13 depict <span class="named-content species" id="named-content-63"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                              href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span>. (b) Fruiting body of Cm p51<sup>T</sup>. Bar, 100 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F6" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F6.expansion.html"><img alt="Fig. 5. " src="4354/F6.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F6.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F6.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F6">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 5. </span> 
+                     
+                     <p id="p-18" class="first-child"><span class="named-content species" id="named-content-64"><a class="namesforlife" rel="namesforlife-name" title="Melittangium boletus"
+                              href="doi:10.1601/nm.3711"><em>Melittangium boletus</em></a></span>. (a) Drawing from <a id="xref-ref-7-3" class="xref-bibr" href="#ref-7">Jahn (1924)</a>, plate II, Fig. 17 on page 78. Courtesy Bornträger-Cramer, www.borntraeger-cramer.de. (b) and (c) Fruiting bodies of Me b8<sup>T</sup>. Bars, 120 and 80 µm, respectively.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F7" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F7.expansion.html"><img alt="Fig. 6. " src="4354/F7.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F7.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F7.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F7">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 6. </span> 
+                     
+                     <p id="p-19" class="first-child"><span class="named-content species" id="named-content-65"><a class="namesforlife" rel="namesforlife-name" title="Polyangium sorediatum"
+                              href="doi:10.1601/nm.3745"><em>Polyangium sorediatum</em></a></span>. (a) Drawing from <a id="xref-ref-22-5" class="xref-bibr" href="#ref-22">Thaxter (1904)</a>, plate XXVII. Nos 22–30 depict <span class="named-content species" id="named-content-66"><a class="namesforlife" rel="namesforlife-name" title="P. sorediatum"
+                              href="doi:10.1601/nm.3745"><em>P. sorediatum</em></a></span>. (b and c) Fruiting bodies of PI s12<sup>T</sup>. Insert: crushed sporangium releasing the single sporangioles. Bars, 200 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F8" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F8.expansion.html"><img alt="Fig. 7. " src="4354/F8.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F8.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F8.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F8">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 7. </span> 
+                     
+                     <p id="p-20" class="first-child"><span class="named-content species" id="named-content-67"><a class="namesforlife" rel="namesforlife-name" title="Polyangium spumosum"
+                              href="doi:10.1601/nm.3746"><em>Polyangium spumosum</em></a></span>. (a) Figures from <a id="xref-ref-10-5" class="xref-bibr" href="#ref-10">Krzemieniewska &amp; Krzemieniewski (1926)</a>, plate V; no. 19 depicts <span class="named-content species" id="named-content-68"><a class="namesforlife" rel="namesforlife-name" title="P. spumosum"
+                              href="doi:10.1601/nm.3746"><em>P. spumosum</em></a></span> and from <a id="xref-ref-11-5" class="xref-bibr" href="#ref-11">Krzemieniewska &amp; Krzemieniewski (1930)</a>, plate XVI; nos 10–12 depict <span class="named-content species" id="named-content-69"><a class="namesforlife" rel="namesforlife-name" title="P. spumosum"
+                              href="doi:10.1601/nm.3746"><em>P. spumosum</em></a></span>. Courtesy of the Polish Botanical Society. (b–d) Degenerated fruiting bodies of PI sm5<sup>T</sup>. Bars, 500, 100 and 250 µm, respectively.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F9" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F9.expansion.html"><img alt="Fig. 8. " src="4354/F9.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F9.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F9.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F9">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 8. </span> 
+                     
+                     <p id="p-21" class="first-child"><span class="named-content species" id="named-content-70"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                              href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span>. (a) Figures from <a id="xref-ref-13-6" class="xref-bibr" href="#ref-13">McCurdy (1970)</a>. (b–d) Strain Cb fe18, (b) myxospores and (c) fruiting bodies on <em>Escherichia coli</em> as food bacteria and (d) on a cellulose plate. Bars, 10 µm, 1 mm and 10 mm, respectively.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F10" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F10.expansion.html"><img alt="Fig. 9. " src="4354/F10.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F10.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F10.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F10">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 9. </span> 
+                     
+                     <p id="p-22" class="first-child"><span class="named-content species" id="named-content-71"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                              href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span>. (a) Figures from <a id="xref-ref-13-7" class="xref-bibr" href="#ref-13">McCurdy (1970)</a>. (b and c) Fruiting bodies of Cb m2. Bars, 500 µm and 200 µm, respectively.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-23">We are thankful to K. Poling and I. Churchill at Windsor University, G. Lewis-Gentry at the Harvard University Herbaria and
+                     H. D. McCurdy for taking the effort to investigate the disposition of the type materials.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.1">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berkeley</span>,  <span class="cit-name-given-names">M. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1857</span><strong>).</strong> <span class="cit-source">Introduction to Cryptogamic Botany</span>. <span class="cit-publ-loc">London</span>: <span class="cit-publ-name">H. Bailliere</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Introduction%20to%20Cryptogamic%20Botany&amp;author=M.%20J.%20Berkeley&amp;publication_year=1857">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-journal no-rev-xref" id="cit-63.Pt_11.4354.2"
+                             data-doi="10.1099/00207713-39-4-495">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berkeley</span>,  <span class="cit-name-given-names">M. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Curtis</span>,  <span class="cit-name-given-names">M. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1874</span><strong>).</strong> <span class="cit-article-title">Notices of the North American Fungi</span>. <abbr class="cit-jnl-abbrev">Grevillea</abbr> <span class="cit-vol">3</span>, <span class="cit-fpage">49</span>–<span class="cit-lpage">64</span>.<span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-39-4-495</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1099/00207713-39-4-495&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Notices%20of%20the%20North%20American%20Fungi&amp;author=M.%20J.%20Berkeley&amp;author=M.%20A.%20Curtis&amp;publication_year=1874&amp;journal=Grevillea&amp;volume=3&amp;pages=49-64&amp;doi=10.1099%2F00207713-39-4-495">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-3" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.3">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Staley</span>,  <span class="cit-name-given-names">J. T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Bryant</span>,  <span class="cit-name-given-names">M. P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Pfennig</span>,  <span class="cit-name-given-names">N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brockman</span>,  <span class="cit-name-given-names">E. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989a</span><strong>).</strong> <span class="cit-article-title">Genus I. <em>Polyangium</em> Link 1809, 42<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-vol">vol. 3</span>, pp. <span class="cit-fpage">2159</span>–<span class="cit-lpage">2162</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Staley</span>,  <span class="cit-name-given-names">J. T.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Bryant</span>,  <span class="cit-name-given-names">M. P.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Pfennig</span>,  <span class="cit-name-given-names">N.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span>
+                                 . <span class="cit-publ-loc">Baltimore</span>: <span class="cit-publ-name">Williams &amp; Wilkins</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20I.%20Polyangium%20Link%201809%2C%2042AL&amp;author=E.%20R.%20Brockman&amp;publication_year=1989a&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.4"
+                             data-doi="10.1099/00207713-39-4-495">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brockman</span>,  <span class="cit-name-given-names">E. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989b</span><strong>).</strong> <span class="cit-article-title"><em>Polyangium sorediatum</em> nom. rev. In <em>Validation of the Publication of New Names and New Combinations Previously Effectively Published Outside the IJSB</em>, List No. 31</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">495</span>–<span class="cit-lpage">497</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-39-4-495</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=39/4/495"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.5"
+                             data-doi="10.1099/00207713-39-4-495">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brockman</span>,  <span class="cit-name-given-names">E. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989</span><strong>c).</strong> <span class="cit-article-title"><em>Polyangium spumosum</em> nom. rev. In <em>Validation of the Publication of New Names and New Combinations Previously Effectively Published Outside the IJSB</em>, List No. 31</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">495</span>–<span class="cit-lpage">497</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-39-4-495</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=39/4/495"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.6"
+                             data-doi="10.1128/JB.01091-10">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Garcia</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pistorius</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stadler</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Müller</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Fatty acid-related phylogeny of myxobacteria as an approach to discover polyunsaturated omega-3/6 fatty acids</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">193</span>, <span class="cit-fpage">1930</span>–<span class="cit-lpage">1942</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JB.01091-10</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21317327</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=193/8/1930"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-2" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.7">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jahn</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1924</span><strong>).</strong> <span class="cit-source">Beitraege zur Botanischen Protistologie I. Die Polyangiden</span>. <span class="cit-publ-loc">Leipzig</span>: <span class="cit-publ-name">Verlag Gebrueder Borntraeger</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Beitraege%20zur%20Botanischen%20Protistologie%20I.%20Die%20Polyangiden&amp;author=E.%20Jahn&amp;publication_year=1924">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.8">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kofler</span>,  <span class="cit-name-given-names">L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1913</span><strong>).</strong> <span class="cit-article-title">Die Myxobakterien der Umgebung von Wien</span>. <abbr class="cit-jnl-abbrev">Sitzungsberichte der Akademie der Wissenschaften in Wien Mathematisch-naturwissenschaftliche Klasse Abteilung I</abbr> <span class="cit-vol">122</span>, <span class="cit-fpage">845</span>–<span class="cit-lpage">876</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Die%20Myxobakterien%20der%20Umgebung%20von%20Wien&amp;author=L.%20Kofler&amp;publication_year=1913&amp;journal=Sitzungsberichte%20der%20Akademie%20der%20Wissenschaften%20in%20Wien%20Mathematisch-naturwissenschaftliche%20Klasse%20Abteilung%20I&amp;volume=122&amp;pages=845-876">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-3" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.9">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewska</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewski</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1926</span><strong>).</strong> <span class="cit-article-title">Miksobacterje Polski (Die Myxobakterien von Polen)</span>. <abbr class="cit-jnl-abbrev">Acta Societatis Botanicorum Poloniae</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">1</span>–<span class="cit-lpage">54</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Miksobacterje%20Polski%20%28Die%20Myxobakterien%20von%20Polen%29&amp;author=H.%20Krzemieniewska&amp;author=S.%20Krzemieniewski&amp;publication_year=1926&amp;journal=Acta%20Societatis%20Botanicorum%20Poloniae&amp;volume=4&amp;pages=1-54">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-4" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.10">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewska</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewski</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1927</span><strong>).</strong> <span class="cit-article-title">Miksobacterje Polski. Uzupelnienie. (Die Myxobakterien von Polen. Anhang)</span>. <abbr class="cit-jnl-abbrev">Acta Societatis Botanicorum Poloniae</abbr> <span class="cit-vol">5</span>, <span class="cit-fpage">79</span>–<span class="cit-lpage">98</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Miksobacterje%20Polski.%20Uzupelnienie.%20%28Die%20Myxobakterien%20von%20Polen.%20Anhang%29&amp;author=H.%20Krzemieniewska&amp;author=S.%20Krzemieniewski&amp;publication_year=1927&amp;journal=Acta%20Societatis%20Botanicorum%20Poloniae&amp;volume=5&amp;pages=79-98">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-3" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewska</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewski</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1930</span><strong>).</strong> <span class="cit-article-title">Miksobakterje Polski. Czesc Trzecia. (Die Myxobakterien von Polen. III. Teil)</span>. <abbr class="cit-jnl-abbrev">Acta Societatis Botanicorum Poloniae</abbr> <span class="cit-vol">7</span>, <span class="cit-fpage">250</span>–<span class="cit-lpage">273</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Miksobakterje%20Polski.%20Czesc%20Trzecia.%20%28Die%20Myxobakterien%20von%20Polen.%20III.%20Teil%29&amp;author=H.%20Krzemieniewska&amp;author=S.%20Krzemieniewski&amp;publication_year=1930&amp;journal=Acta%20Societatis%20Botanicorum%20Poloniae&amp;volume=7&amp;pages=250-273">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.12">
+                           <div class="cit-metadata">
+                              <ol class="cit-ed-list">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Lapage</span>,  <span class="cit-name-given-names">S. P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Sneath</span>,  <span class="cit-name-given-names">P. H. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Lessel</span>,  <span class="cit-name-given-names">E. F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Skerman</span>,  <span class="cit-name-given-names">V. B. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Seeliger</span>,  <span class="cit-name-given-names">H. P. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Clark</span>,  <span class="cit-name-given-names">W. A.</span></span></li>
+                              </ol><cite> <strong>(editors) (</strong><span class="cit-pub-date">1992</span><strong>).</strong> <span class="cit-source">International Code of Nomenclature of Bacteria (1990 Revision). Bacteriological Code</span>. <span class="cit-publ-loc">Washington, DC</span>: <span class="cit-publ-name">American Society for Microbiology</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=International%20Code%20of%20Nomenclature%20of%20Bacteria%20%281990%20Revision%29.%20Bacteriological%20Code&amp;author=S.%20P.%20Lapage&amp;author=P.%20H.%20A.%20Sneath&amp;author=E.%20F.%20Lessel&amp;author=V.%20B.%20D.%20Skerman&amp;author=H.%20P.%20R.%20Seeliger&amp;author=W.%20A.%20Clark&amp;publication_year=1992">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-5" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.13"
+                             data-doi="10.1099/00207713-20-3-283">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McCurdy</span>,  <span class="cit-name-given-names">H. D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1970</span><strong>).</strong> <span class="cit-article-title">Studies on the taxonomy of the <em>Myxobacterales</em>. II. <em>Polyangium</em> and the demise of the <em>Sporangiaceae</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">20</span>, <span class="cit-fpage">283</span>–<span class="cit-lpage">296</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-20-3-283</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=20/3/283"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.14"
+                             data-doi="10.1099/00207713-21-1-40">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McCurdy</span>,  <span class="cit-name-given-names">H. D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1971</span><strong>).</strong> <span class="cit-article-title">Studies on the taxonomy of the <em>Myxobacterales</em>. III. <em>Chondromyces</em> and <em>Stigmatella</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">21</span>, <span class="cit-fpage">40</span>–<span class="cit-lpage">49</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-21-1-40</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=21/1/40"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-5" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.15"
+                             data-doi="10.1007/0-387-29298-5_276">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005a</span><strong>).</strong> <span class="cit-article-title">Genus III. <em>Chondromyces</em> Berkeley and Curtis in Berkeley 1874, 64<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1121</span>–<span class="cit-lpage">1129</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/0-387-29298-5_276</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/0-387-29298-5_276&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20III.%20Chondromyces%20Berkeley%20and%20Curtis%20in%20Berkeley%201874%2C%2064AL&amp;author=H.%20Reichenbach&amp;publication_year=2005a&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-5" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.16"
+                             data-doi="10.1007/0-387-29298-5_269">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005b</span><strong>).</strong> <span class="cit-article-title">Genus I. <em>Cystobacter</em> Schroeter 1886, 170<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1086</span>–<span class="cit-lpage">1096</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/0-387-29298-5_269</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/0-387-29298-5_269&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20I.%20Cystobacter%20Schroeter%201886%2C%20170AL&amp;author=H.%20Reichenbach&amp;publication_year=2005b&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-2" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.17"
+                             data-doi="10.1007/0-387-29298-5_272">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005c</span><strong>).</strong> <span class="cit-article-title">Genus IV. <em>Melittangium</em> Jahn 1924, 7<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1101</span>–<span class="cit-lpage">1104</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/0-387-29298-5_272</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/0-387-29298-5_272&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20IV.%20Melittangium%20Jahn%201924%2C%207AL&amp;author=H.%20Reichenbach&amp;publication_year=2005c&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-5" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.18"
+                             data-doi="10.1007/0-387-29298-5_274">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005d</span><strong>).</strong> <span class="cit-article-title">Genus I. Polyangium Link 1809, 42<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1110</span>–<span class="cit-lpage">1118</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/0-387-29298-5_274</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/0-387-29298-5_274&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20I.%20Polyangium%20Link%201809%2C%2042AL&amp;author=H.%20Reichenbach&amp;publication_year=2005d&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-book no-rev-xref" id="cit-63.Pt_11.4354.19">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005e</span><strong>).</strong> <span class="cit-article-title">Order VIII. Myxococcales Tchan, Pochon and Prévot 1948, 398<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span><em>,</em> <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1059</span>–<span class="cit-lpage">1072</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Order%20VIII.%20Myxococcales%20Tchan%2C%20Pochon%20and%20Pr%C3%A9vot%201948%2C%20398AL&amp;author=H.%20Reichenbach&amp;publication_year=2005e&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.20"
+                             data-doi="10.1099/00207713-30-1-225">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Skerman</span>,  <span class="cit-name-given-names">V. B. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McGowan</span>,  <span class="cit-name-given-names">V.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sneath</span>,  <span class="cit-name-given-names">P. H. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1980</span><strong>).</strong> <span class="cit-article-title">Approved lists of bacterial names</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">30</span>, <span class="cit-fpage">225</span>–<span class="cit-lpage">420</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-30-1-225</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=30/1/225"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.21"
+                             data-doi="10.1086/327531">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thaxter</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1897</span><strong>).</strong> <span class="cit-article-title">Further observations on the <em>Myxobacteriaceae</em></span>. <abbr class="cit-jnl-abbrev">Bot Gaz</abbr> <span class="cit-vol">23</span>, <span class="cit-fpage">395</span>–<span class="cit-lpage">411</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1086/327531</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1086/327531&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Further%20observations%20on%20the%20Myxobacteriaceae&amp;author=R.%20Thaxter&amp;publication_year=1897&amp;journal=Bot%20Gaz&amp;volume=23&amp;pages=395-411&amp;doi=10.1086%2F327531">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.22"
+                             data-doi="10.1086/328505">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thaxter</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1904</span><strong>).</strong> <span class="cit-article-title">Notes on the <em>Myxobacteriaceae</em></span>. <abbr class="cit-jnl-abbrev">Bot Gaz</abbr> <span class="cit-vol">37</span>, <span class="cit-fpage">405</span>–<span class="cit-lpage">416</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1086/328505</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1086/328505&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Notes%20on%20the%20Myxobacteriaceae&amp;author=R.%20Thaxter&amp;publication_year=1904&amp;journal=Bot%20Gaz&amp;volume=37&amp;pages=405-416&amp;doi=10.1086%2F328505">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.23"
+                             data-doi="10.1016/j.syapm.2012.12.006">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yarza</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Spröer</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Swiderski</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mrotzek</span>,  <span class="cit-name-given-names">N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Spring</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gronow</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pukall</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Klenk</span>,  <span class="cit-name-given-names">H. P.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title">Sequencing orphan species initiative (SOS): Filling the gaps in the 16S rRNA gene sequence database for all species with validly
+                                    published names</span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">36</span>, <span class="cit-fpage">69</span>–<span class="cit-lpage">73</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.syapm.2012.12.006</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23410935</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.syapm.2012.12.006&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23410935&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Sequencing%20orphan%20species%20initiative%20%28SOS%29%3A%20Filling%20the%20gaps%20in%20the%2016S%20rRNA%20gene%20sequence%20database%20for%20all%20species%20with%20validly%20published%20names&amp;author=P.%20Yarza&amp;author=C.%20Spr%C3%B6er&amp;author=J.%20Swiderski&amp;author=N.%20Mrotzek&amp;author=S.%20Spring&amp;author=B.%20J.%20Tindall&amp;author=S.%20Gronow&amp;author=R.%20Pukall&amp;author=H.%20P.%20Klenk&amp;publication_year=2013&amp;journal=Syst%20Appl%20Microbiol&amp;volume=36&amp;pages=69-73&amp;doi=10.1016%2Fj.syapm.2012.12.006&amp;pmid=23410935">Google Scholar</a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4350.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4361.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="free-article">
+               <span class="free-article-note">
+                  FREE ARTICLE
+                  </span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.056440-0" class="slug-doi">10.1099/ijs.0.056440-0
+                                 </span>
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4354-4360
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/63/Pt_11/4354.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4354.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_11/4354/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_11/4354">PPT Slides of All Figures</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings last-child">
+                              <li><a class="tocsection-search"
+                                    href="/search?tocsectionid=Taxonomic+Note&amp;sortspec=date&amp;submit=Submit">Taxonomic Note</a></li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4354&amp;current-view-path=/content/63/Pt_11/4354.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4354&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4354.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4354&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4354.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.056440-0&amp;citation=Lang%20and%20Reichenbach%2063%20%28Pt%2011%29:%204354&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4354&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=24187023&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4354">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4354.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4354#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4354" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4354&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4354.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ALang%20author%3AE.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Lang, E.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AReichenbach%20author%3AH.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Reichenbach, H.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4354.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=24187023&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Lang%20E&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Lang, E.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Reichenbach%20H&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Reichenbach, H.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/24187023"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4354.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4354#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.pdf
new file mode 100644
index 00000000..2c9c5ebd
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/results.json b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/results.json
new file mode 100644
index 00000000..c64840e5
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/results.json
@@ -0,0 +1,104 @@
+{
+  "publisher": {
+    "value": [
+      "Society for General Microbiology"
+    ]
+  },
+  "journal": {
+    "value": [
+      "International Journal of Systematic and Evolutionary\n                Microbiology"
+    ]
+  },
+  "title": {
+    "value": [
+      "Designation of type strains for seven species of the order Myxococcales and proposal for neotype strains of Cystobacter ferrugineus, Cystobacter minus and Polyangium fumosum"
+    ]
+  },
+  "authors": {
+    "value": [
+      "Elke Lang",
+      "Hans Reichenbach"
+    ]
+  },
+  "date": {
+    "value": [
+      "11/01/2013"
+    ]
+  },
+  "doi": {
+    "value": [
+      "10.1099/ijs.0.056440-0"
+    ]
+  },
+  "volume": {
+    "value": [
+      "63"
+    ]
+  },
+  "issue": {
+    "value": [
+      "Pt 11"
+    ]
+  },
+  "firstpage": {
+    "value": [
+      "4354"
+    ]
+  },
+  "abstract": {
+    "value": [
+      "\n                  \n                      Next Section\n                  Abstract\n                  \n                  Ten species of the order Myxococcales with validly published names are devoid of living type strains. Four species of the genus Chondromyces are represented by dead herbarium samples as the type material. For a species of the genus Melittangium and two species of the genus Polyangium, no physical type material was assigned at the time of validation of the names or later on. In accordance with rule 18f of\n                     the International Code of Nomenclature of Bacteria the following type strains are designated for these species: strain Cm\n                     a14T ( = DSM 14605T = JCM 12615T) as the type strain of Chondromyces apiculatus, strain Cm c5T ( = DSM 14714T = JCM 12616T) as the type strain of Chondromyces crocatus, strain Sy t2T ( = DSM 14631T = JCM 12617T) as the type strain of Chondromyces lanuginosus, strain Cm p51T ( = DSM 14607T = JCM 12618T) as the type strain of Chondromyces pediculatus, strain Me b8T ( = DSM 14713T = JCM 12633T) as the type strain of Melittangium boletus, strain Pl s12T ( = DSM 14670T = JCM 12637T) as the type strain of Polyangium sorediatum and strain Pl sm5T ( = DSM 14734T = JCM 12638T) as the type strain of Polyangium spumosum. Furthermore, the type strains given for three species of the genera Cystobacter and Polyangium had been kept at one university institute and have been lost according to our investigations. In accordance with Rule 18c\n                     of the Bacteriological Code, we propose the following neotype strains: strain Cb fe18 ( = DSM 14716  = JCM 12624) as the neotype\n                     strain of Cystobacter ferrugineus, strain Cb m2 ( = DSM 14751 = JCM 12627) as the neotype strain of Cystobacter minus and strain Pl fu5 ( = DSM 14668 = JCM 12636) as the neotype strain of Polyangium fumosum. 
The proposals of the strains are based on the descriptions and strain proposals given in the respective chapters of Bergey’s Manual of Systematic Bacteriology (2005).\n                  \n                  \n               "
+    ]
+  },
+  "fulltext_html": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354.full"
+    ]
+  },
+  "fulltext_pdf": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354.full.pdf"
+    ]
+  },
+  "supplementary_material": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/suppl/DC1"
+    ]
+  },
+  "figure": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F1.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F2.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F3.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F4.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F5.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F6.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F7.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F8.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F9.small.gif",
+      "http://ijs.sgmjournals.org/content/63/Pt_11/4354/F10.small.gif"
+    ]
+  },
+  "figure_caption": {
+    "value": [
+      "Fig. 1.  \n                     \n                     Chondromyces apiculatus. (a) Drawing from Thaxter (1897), plate XXX on pages 405–406. (b) Fruiting body (bar, 100 µm) and vegetative cells (insert; bar, 10 µm) of Cm a14T.\n                     \n                     \n                     \n                  ",
+      "Fig. 10.  \n                     \n                     Polyangium fumosum. (a) Drawing from Krzemieniewska & Krzemieniewski (1930), plate XVI, nos 6–9 depict P. fumosum. Courtesy of the Polish Botanical Society. (b) Swarm of PI fu5 (bar, 2000 µm) and single sporangium of PI fu5 (insert; bar,\n                        100 µm). (c) Fruiting bodies of PI fu5. Bar, 300 µm.\n                     \n                     \n                     \n                  ",
+      "Fig. 2.  \n                     \n                     Chondromyces crocatus. (a) Drawing from Berkeley (1857), page 313. (b) Fruiting bodies of Cm c5T. Bar, 500 µm.\n                     \n                     \n                     \n                  ",
+      "Fig. 3.  \n                     \n                     Chondromyces lanuginosus. (a) Figures from Kofler (1913), Figs 1–3 on page 877 depict Chondromyces lanuginosus. Courtesy Österreichische Akademie der Wissenschaften. (b) Fruiting body of Sy t2T. Bar, 100 µm.\n                     \n                     \n                     \n                  ",
+      "Fig. 4.  \n                     \n                     Chondromyces pediculatus. (a) Drawing from Thaxter (1904), plate XXVI on page 411; nos 7–13 depict Chondromyces pediculatus. (b) Fruiting body of Cm p51T. Bar 100 µm.\n                     \n                     \n                     \n                  ",
+      "Fig. 5.  \n                     \n                     Melittangium boletus. (a) Drawing from Jahn (1924), plate II, Fig. 17 on page 78. Courtesy Bornträger-Cramer, www.borntraeger-cramer.de. (b) and (c) Fruiting bodies of Me b8T. Bars, 120 and 80 µm, respectively.\n                     \n                     \n                     \n                  ",
+      "Fig. 6.  \n                     \n                     Polyangium sorediatum. (a) Drawing from Thaxter (1904), plate XXVII. Nos 22–30 depict P. sorediatum. (b and c) Fruiting bodies of PI s12T. Insert: crushed sporangium releasing the single sporangioles. Bars, 200 µm.\n                     \n                     \n                     \n                  ",
+      "Fig. 7.  \n                     \n                     Polyangium spumosum. (a) Figures from Krzemieniewska & Krzemieniewski (1926), plate V; no. 19 depicts P. spumosum and from Krzemieniewska & Krzemieniewski (1930), plate XVI; nos 10–12 depict P. spumosum. Courtesy of the Polish Botanical Society. (b–d) Degenerated fruiting bodies of PI sm5T. Bars, 500, 100 and 250 µm, respectively.\n                     \n                     \n                     \n                  ",
+      "Fig. 8.  \n                     \n                     Cystobacter ferrugineus. (a) Figures from McCurdy (1970). (b–d) Strain Cb fe18, (b) myxospores and (c) fruiting bodies on Escherichia coli as food bacteria and (d) on a cellulose plate. Bars, 10 µm, 1 mm and 10 mm, respectively.\n                     \n                     \n                     \n                  ",
+      "Fig. 9.  \n                     \n                     Cystobacter minus. (a), Figures from McCurdy (1970). (b and c), Fruiting bodies of Cb m2. Bars, 500 µm and 200 µm, respectively.\n                     \n                     \n                     \n                  "
+    ]
+  },
+  "license": {
+    "value": []
+  },
+  "copyright": {
+    "value": [
+      "Copyright ©\n                     \t\t2015 International Union of Microbiological Societies\n                     \t\n                  "
+    ]
+  }
+}
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/DC1 b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/DC1
new file mode 100644
index 00000000..beca2227
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/DC1
@@ -0,0 +1,356 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Supplementary material </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/ijs.0.052654-0/DC1" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-data-supp.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-data-supp.css" /><script type="text/javascript" id="session-d7624831e1">var callbackToken='563684563197759';</script><script type="text/javascript" id="session-d7624831e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-data-supp.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-data-supp">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_12%2F4586%2Fsuppl%2FDC1">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <h1 class="data-supp-article-title"><em>Spirosoma</em> <em>endophyticum</em> sp. nov., isolated from Zn- and Cd-accumulating <em>Salix caprea</em></h1>
+            <div><span class="highwire-journal-article-marker-start"></span><div class="auto-clean"><span style="font-family: Verdana,Arial,Helvetica,sans-serif;  font-size: 83.33%">
+                     
+                     
+                     <h2>Supplementary material</h2>
+                     
+                     <p><strong>Files in this Data Supplement:</strong></p>
+                     
+                     <ul>
+                        <li><a href="/content/suppl/2013/12/09/ijs.0.052654-0.DC1/52654.pdf">Supplementary material</a> 
+                           		
+                           
+                        </li>
+                     </ul>
+                     </span>
+                  
+                  
+               </div><span class="highwire-journal-article-marker-end"></span></div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              	<span class="slug-metadata-note ahead-of-print">
+                                 
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">August 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.052654-0" class="slug-doi">10.1099/ijs.0.052654-0</span>
+                                 </span>
+                              
+                              
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date">
+                                    December 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 12 
+                                    </span><span class="slug-pages">
+                                    4586-4590
+                                    </span>
+                                 </cite>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_12/4586.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_12/4586.full" rel="view-full-text">Full Text</a><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_12/4586.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a></li>
+                        <li><span class="variant-indicator">» <span>Supplementary material</span></span></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/F1.small.gif b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/F1.small.gif
new file mode 100644
index 00000000..e26a9625
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/F1.small.gif differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.html b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.html
new file mode 100644
index 00000000..c436e2c0
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.html
@@ -0,0 +1,1263 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Spirosoma endophyticum sp. nov., isolated from Zn- and Cd-accumulating Salix caprea </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_12/4586" />
+      <meta content="/ijs/63/Pt_12/4586.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Spirosoma endophyticum sp. nov., isolated from Zn- and Cd-accumulating Salix caprea"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.052654-0" name="DC.Identifier" />
+      <meta content="2013-12-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Julia Fries" name="DC.Contributor" />
+      <meta content="Stefan Pfeiffer" name="DC.Contributor" />
+      <meta content="Melanie Kuffner" name="DC.Contributor" />
+      <meta content="Angela Sessitsch" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Julia Fries" />
+      <meta name="citation_author_institution"
+            content="AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria" />
+      <meta name="citation_author" content="Stefan Pfeiffer" />
+      <meta name="citation_author_institution"
+            content="AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria" />
+      <meta name="citation_author" content="Melanie Kuffner" />
+      <meta name="citation_author_institution"
+            content="AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria" />
+      <meta name="citation_author" content="Angela Sessitsch" />
+      <meta name="citation_author_institution"
+            content="AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria" />
+      <meta content="Spirosoma endophyticum sp. nov., isolated from Zn- and Cd-accumulating Salix caprea"
+            name="citation_title" />
+      <meta content="12/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 12" name="citation_issue" />
+      <meta content="4586" name="citation_firstpage" />
+      <meta content="4590" name="citation_lastpage" />
+      <meta content="63/Pt_12/4586" name="citation_id" />
+      <meta content="63/Pt 12/4586" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_12/4586" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.052654-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_12/4586.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_12/4586.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_12/4586.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_12.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_12/4586"
+            name="citation_public_url" />
+      <meta content="23907231" name="citation_pmid" />
+      <meta name="citation_access" content="all" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Bacteroidetes" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_12/4580.short" rel="prev" />
+      <link href="/content/63/Pt_12/4591.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d7622811e1">var callbackToken='563684563197759';</script><script type="text/javascript" id="session-d7622811e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_12%2F4586.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline"><em>Spirosoma</em> <em>endophyticum</em> sp. nov., isolated from Zn- and Cd-accumulating <em>Salix caprea</em></h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Julia+Fries&amp;sortspec=date&amp;submit=Submit">Julia Fries</a></span>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Stefan+Pfeiffer&amp;sortspec=date&amp;submit=Submit">Stefan Pfeiffer</a></span>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Melanie+Kuffner&amp;sortspec=date&amp;submit=Submit">Melanie Kuffner</a></span> and 
+                     </li>
+                     <li class="last" id="contrib-4"><span class="name"><a class="name-search"
+                              href="/search?author1=Angela+Sessitsch&amp;sortspec=date&amp;submit=Submit">Angela Sessitsch</a></span></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address>AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria</address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> Angela Sessitsch <span class="em-link"><span class="em-addr">angela.sessitsch{at}ait.ac.at</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-4">A Gram-reaction-negative, yellow-pigmented strain, designated EX36<sup>T</sup>, was characterized using a polyphasic approach comprising phylogenetic, morphological and genotypic analyses. The endophytic
+                     strain was isolated from Zn/Cd-accumulating <em>Salix caprea</em> in Arnoldstein, Austria. Analysis of the 16S rRNA gene demonstrated that the novel strain is most closely related to members
+                     of the genus <span class="named-content genus" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                           href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> (95 % sequence similarity with <span class="named-content species" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma linguale"
+                           href="doi:10.1601/nm.8318"><em>Spirosoma linguale</em></a></span>). The genomic DNA G+C content was 47.2 mol%. The predominant quinone was and the major cellular fatty acids were summed feature
+                     3 (iso-C<sub>15 : 0</sub> 2-OH and/or C<sub>16 : 1</sub>ω7<em>c</em>), C<sub>16 : 1</sub>ω5<em>c</em>, iso-C<sub>17 : 0</sub> 3-OH and iso-C<sub>15 : 0</sub>. On the basis of its phenotypic and genotypic properties, strain EX36<sup>T</sup> should be classified as a novel species of the genus <span class="named-content genus" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                           href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span>, for which the name <span class="named-content genus" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                           href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> <em>endophyticum</em> sp. nov. is proposed. The type strain is EX36<sup>T</sup> ( = DSM 26130<sup>T</sup> = LMG 27272<sup>T</sup>).
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-other" id="fn-1">
+                        <p id="p-1">The GenBank/EMBL/DDBJ accession number for the 16S rRNA gene sequence of strain EX36<sup>T</sup> is GQ342559.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-2">
+                        <p id="p-2">A supplementary figure is available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="license" id="license-1">
+                  <p id="p-3">This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted
+                     use, distribution, and reproduction in any medium, provided the original work is properly cited.
+                  </p>
+               </div>
+               <p id="p-5">The genus <span class="named-content genus" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> was first proposed by <a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Larkin &amp; Borrall (1984)</a> and belongs to the family <span class="named-content family" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Flexibacteraceae"
+                        href="doi:10.1601/nm.8247"><em>Flexibacteraceae</em></a></span> in the phylum <span class="named-content phylum" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Bacteroidetes"
+                        href="doi:10.1601/nm.7927"><em>Bacteroidetes</em></a></span>. At the time of writing the genus <span class="named-content genus" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> includes five species, the type species <span class="named-content species" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma linguale"
+                        href="doi:10.1601/nm.8318"><em>Spirosoma linguale</em></a></span> (<a id="xref-ref-11-2" class="xref-bibr" href="#ref-11">Larkin &amp; Borrall, 1984</a>), <span class="named-content species" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma rigui"
+                        href="doi:10.1601/nm.11571"><em>Spirosoma rigui</em></a></span> (<a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Baik <em>et al.</em>, 2007</a>), <span class="named-content species" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma panaciterrae"
+                        href="doi:10.1601/nm.13622"><em>Spirosoma panaciterrae</em></a></span> (<a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Ten <em>et al.</em>, 2009</a>), <span class="named-content species" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma spitsbergense"
+                        href="doi:10.1601/nm.14214"><em>Spirosoma spitsbergense</em></a></span> and <span class="named-content species" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma luteum"
+                        href="doi:10.1601/nm.14215"><em>Spirosoma luteum</em></a></span> (<a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>). So far, <span class="named-content genus" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> strains have been isolated from various habitats, such as fresh water, permafrost soil or soil from a ginseng field. Strain
+                  EX36<sup>T</sup>, which is proposed in this study to represent a novel species, was isolated in course of the analysis of bacteria associated
+                  with the heavy metal accumulating plant <em>Salix caprea</em> (<a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">Kuffner <em>et al.</em>, 2010</a>).
+               </p>
+               <p id="p-6">For the isolation of strain EX36<sup>T</sup>, <em>Salix caprea</em> trees growing on a former Zn/Pb mining and processing site in Arnoldstein (Austria) were sampled (<a id="xref-ref-10-2" class="xref-bibr" href="#ref-10">Kuffner <em>et al.</em>, 2010</a>). Xylem sap extract was directly plated on 10 % tryptic soy agar (TSA, Merck Darmstadt, Germany) and after 1 week of incubation
+                  single colonies were picked and streaked on phosphate-poor MOPS medium (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Neidhardt <em>et al.</em>, 1974</a>) containing 0.1 % glucose and 1 mM ZnSO<sub>4</sub>. The strain was routinely cultured on 10 % TSA. For maintenance, the cell material was suspended in 10 % tryptic soy broth
+                  (TSB, Merck, Darmstadt, Germany) containing 15 % glycerol and stored at −80 °C. Endophytic colonization was confirmed by inoculating
+                  two maize and two potato cultivars, growing the plants under <em>in vitro</em> conditions and reisolating the strain from root and stem tissues.
+               </p>
+               <p id="p-7">For the extraction of bacterial DNA the Gen Elute Bacterial Genomic DNA kit (Sigma–Aldrich) was used. The 16S rRNA gene was
+                  amplified by PCR using the primers 8f (5′-AGAGTTTGATCCTGGCTCAG-3′) (<a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Weisburg <em>et al.</em>, 1991</a>) and 1520r (5′-AAGGAGGTGATCCAGCCGCA-3′) (<a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Edwards <em>et al.</em>, 1989</a>). Sequencing of the amplified PCR product was performed by LGC Genomics (Berlin, Germany). The obtained partial sequences
+                  were assembled using the programs BioEdit (<a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Hall, 1999</a>) and <span class="sc">seqman</span> <span class="sc">pro</span> (DNAstar). The consensus sequence was subjected to nucleotide <span class="sc">blast</span> analysis (<a href="http://blast.ncbi.nlm.nih.gov/Blast.cgi">http://blast.ncbi.nlm.nih.gov/Blast.cgi</a>) to search the database of the National Center for Biotechnology Information (NCBI) for the closest relatives of the bacterial
+                  strains with validly published names. Sequence comparisons indicated that the isolate belonged to the family <span class="named-content family" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Flexibacteraceae"
+                        href="doi:10.1601/nm.8247"><em>Flexibacteraceae</em></a></span>.
+               </p>
+               <p id="p-8">Nearly complete 16S rRNA gene sequences of strain EX36<sup>T</sup> and of all species of the genus <span class="named-content genus" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> with validly published names and of selected species of the family <span class="named-content family" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Cytophagaceae"
+                        href="doi:10.1601/nm.14010"><em>Cytophagaceae</em></a></span>, which were downloaded from the NCBI GenBank sequence database, were imported into the <span class="sc">arb</span> program package (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Ludwig <em>et al.</em>, 2004</a>). Sequences were aligned into the <span class="sc">silva</span> SSURef 102 (<a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Pruesse <em>et al.</em>, 2007</a>) database by using the option ‘autosearch by PT_server’ of the <span class="sc">arb</span> editor. Alignments were manually corrected using the <span class="sc">arb</span> editor. A maximum-likelihood phylogenetic tree was reconstructed using RAxML v. 7.4.2 (<a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Stamatakis, 2006a</a>) by execution of the following command line in raxmlGUI v. 1.3 (<a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Silvestro &amp; Michalak, 2012</a>): raxmlHPC.exe -T 2 &lt;number of processors &gt;-f a -m GTRGAMMA -x 336 &lt;seed1 &gt;-p 115 &lt;seed2 &gt;-N 100 &lt;bootstraps &gt;-o CarHomin
+                  &lt;outgroup &gt;-s &lt;input file &gt;-O &lt;output order &gt;. We used a combination of the Gamma model of rate heterogeneity (<a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Yang, 1994</a>) and the CAT model (<a id="xref-ref-19-1" class="xref-bibr" href="#ref-19">Stamatakis, 2006b</a>), which was implemented in the rapid bootstrapping algorithm, (<a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Stamatakis <em>et al.</em>, 2008</a>) was performed with 100 replicates and using general time reversible (GTR) as the substitution matrix. In <a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1</a> the position of EX36<sup>T</sup> in the distinct cluster of the genus <span class="named-content genus" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> can be clearly recognized. The calculation of pairwise sequence similarity using a global alignment algorithm (<a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Myers &amp; Miller, 1988</a>), which was implemented at the EzTaxon-e server (<a href="http://eztaxon-e.ezbiocloud.net/">http://eztaxon-e.ezbiocloud.net/</a>; <a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Kim <em>et al.</em>, 2012</a>) showed highest sequence similarity values for strain EX36<sup>T</sup> to <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma linguale"
+                        href="doi:10.1601/nm.8318"><em>Spirosoma linguale</em></a></span> DSM 74<sup>T</sup> (95.7 %), followed by <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="S. luteum"
+                        href="doi:10.1601/nm.14215"><em>S. luteum</em></a></span> SPM-10<sup>T</sup> (93.9 %), <span class="named-content species" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="S. spitsbergense"
+                        href="doi:10.1601/nm.14214"><em>S. spitsbergense</em></a></span> SPM-9<sup>T</sup> (93.9 %), <span class="named-content species" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="S. rigui"
+                        href="doi:10.1601/nm.11571"><em>S. rigui</em></a></span> KCTC 12531<sup>T</sup> (93.8 %) and <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="S. panaciterrae"
+                        href="doi:10.1601/nm.13622"><em>S. panaciterrae</em></a></span> Gsoil 1519<sup>T</sup> (92.5 %).
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4586/F1.expansion.html"><img alt="Fig. 1. " src="4586/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4586/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4586/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_12/4586/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-9" class="first-child">Maximum-likelihood tree (bootstrap: 100 replicates) based on 16S rRNA gene sequence data (sequence length 1296 bp) showing
+                        the phylogenetic position of strain EX36<sup>T</sup> among related species selected from the phylum <span class="named-content phylum" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="Bacteroidetes"
+                              href="doi:10.1601/nm.7927"><em>Bacteroidetes</em></a></span>. <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="Cardiobacterium hominis"
+                              href="doi:10.1601/nm.2271"><em>Cardiobacterium hominis</em></a></span> ATCC 15826<sup>T</sup> (M35014) was used as an outgroup.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-10">Growth of strain EX36<sup>T</sup> was tested at various temperatures (4, 20, 23, 28, 37 and 41 °C) on 10 % TSA plates for up to 1 week. The pH range for growth
+                  (pH 4, 5, 6, 7, 8 and 9) was determined by measuring OD<sub>600</sub> changes in cultures incubated at 28 °C with shaking at 190 r.p.m. compared with an uninoculated control. Salt tolerance was
+                  determined by amending 10 % TSB with NaCl to final concentrations of 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.8, 1.0, 2.0, 3.0, 4.0,
+                  5.0 and 10.0 % NaCl (w/v). The Gram reaction of strain EX36<sup>T</sup> was determined by using the non-staining method described by <a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">Buck (1982)</a>. Pigment analysis of cells grown on 10 % TSA was performed in triplicates by extraction with acetone according to the method
+                  described by <a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Denner <em>et al.</em> (2001)</a> using a U-2900 spectrophotometer (Hitachi). Minimal inhibition concentrations (MIC) for Zn and Cd were determined according
+                  to the method of <a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Kuffner <em>et al.</em> (2008)</a>. Additionally cells were tested for flexirubin pigments using the method described by <a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Bernardet <em>et al.</em> (2002)</a>. Oxidase and catalase activity were tested as outlined by <a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Smibert &amp; Krieg (1994)</a>. Additional biochemical tests were performed by the Identification Service of the DSMZ (Leibniz-Institut DSMZ-Deutsche Sammlung
+                  von Mikroorganismen und Zellkulturen GmbH, Braunschweig, Germany) using API 20NE (bioMérieux) and GENIII plates (Biolog).
+                  Cell morphology after 4 days of growth at 28 °C was investigated using fluorescence and bright-field microscopy (IX81, Olympus;
+                  Axiovert 200 M, Zeiss). Antibiotic susceptibility was determined by the disc diffusion method on 10 % TSA plates.
+               </p>
+               <p id="p-11">Cells of strain EX36<sup>T</sup> were rod-shaped, Gram-reaction-negative and 1.2×2–17.5 µm in size (Fig. S1, available in IJSEM Online). Most cells were arranged
+                  in pairs, but filaments up to 55 µm were observed. EX36<sup>T</sup> showed yellowish, opaque, semi-translucent colonies with a smooth and shiny surface and a circular and convex shape. The
+                  diameter of colonies grown on 10 % TSA at 28 °C for 1 week varied between 1.5 and 3.0 mm. The strain was positive for catalase
+                  and oxidase activity; detailed results of biochemical and physiological analyses are listed in <a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a> and in the species description. In contrast to other species of the genus <span class="named-content genus" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span>, cells of EX36<sup>T</sup> showed a length up to 17.5 µm, did not grow at 5 and 42 °C, did not tolerate NaCl concentrations higher than 0.6 % (w/v),
+                  had the lowest genomic G+C content and showed differences in antibiotic susceptibility. Low tolerance of Cd and Zn was observed
+                  (slow growth at 4 mM Zn and 1 mM Cd). The analysis of yellow pigments showed three absorption maxima at 428, 453 and 483 nm.
+                  EX36<sup>T</sup> was negative for flexirubin-type pigments.
+               </p>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4586/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4586/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Differential characteristics of strain EX36<sup>T</sup> and recognized species of the genus <span class="named-content genus" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                              href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span></span>
+                     
+                     <p id="p-12" class="first-child">Strains: 1, EX36<sup>T</sup> (data from this study); 2, <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="S. linguale"
+                              href="doi:10.1601/nm.8318"><em>S. linguale</em></a></span> DSM 74<sup>T</sup> (<a id="xref-ref-11-3" class="xref-bibr" href="#ref-11">Larkin &amp; Borrall, 1984</a>; and this study); 3, <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="S. luteum"
+                              href="doi:10.1601/nm.14215"><em>S. luteum</em></a></span> DSM 19990<sup>T</sup> (<a id="xref-ref-6-2" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>); 4, <span class="named-content species" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="S. spitsbergense"
+                              href="doi:10.1601/nm.14214"><em>S. spitsbergense</em></a></span> DSM 19989<sup>T</sup> (<a id="xref-ref-6-3" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>); 5, <span class="named-content species" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="S. rigui"
+                              href="doi:10.1601/nm.11571"><em>S. rigui</em></a></span> KCTC 12531<sup>T</sup> (<a id="xref-ref-1-2" class="xref-bibr" href="#ref-1">Baik <em>et al.</em>, 2007</a>); 6, <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="S. panaciterrae"
+                              href="doi:10.1601/nm.13622"><em>S. panaciterrae</em></a></span> DSM 21099<sup>T</sup> (<a id="xref-ref-21-2" class="xref-bibr" href="#ref-21">Ten <em>et al.</em>, 2009</a>). All strains are catalase-positive, Gram-reaction-negative and negative for nitrate reduction, utilization of gluconate,
+                        caprate, adipate and glycerol. +, Positive; −, negative; <span class="sc">w</span>, weakly positive; <span class="sc">nd</span>, not determined; <span class="sc">r</span>, resistant; <span class="sc">s</span>, susceptible.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-13">Analyses of cellular fatty acid composition, respiratory quinones, polar lipids and chromosomal G+C content were performed
+                  by the Identification Service of the DSMZ. The fatty acid profile was determined according to the protocol of the Microbial
+                  Identification System (MIDI). The major fatty acids of strain EX36<sup>T</sup> were summed feature 3 (iso-C<sub>15 : 0</sub> 2-OH and/or C<sub>16 : 1</sub>ω7<em>c</em>; 49.3 %), C<sub>16 : 1</sub>ω5<em>c</em> (23.8 %), iso-C<sub>17 : 0</sub> 3-OH (6.2 %) and iso-C<sub>15 : 0</sub> (5.4 %). A detailed overview of the cellular fatty acid profiles of all species of the genus <span class="named-content genus" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> can be found in <a id="xref-table-wrap-2-1" class="xref-table" href="#T2">Table 2</a>. Differences between the fatty acid profile of EX36<sup>T</sup> and other species of the genus <span class="named-content genus" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> were found in the amounts of iso-C<sub>15 : 0</sub>, C<sub>16 : 1</sub>ω5<em>c</em> and summed feature 3. In contrast to <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="S. linguale"
+                        href="doi:10.1601/nm.8318"><em>S. linguale</em></a></span> DSM 74<sup>T</sup>, the fatty acids C<sub>15 : 0</sub> and anteiso-C<sub>15 : 0</sub> were not detected.
+               </p>
+               <div id="T2" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4586/T2.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4586/T2.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 2. </span> 
+                     <span class="caption-title">Fatty acid profiles (%) of strain EX36<sup>T</sup> and its closest phylogenetic neighbours from the genus <span class="named-content genus" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                              href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span></span>
+                     
+                     <p id="p-14" class="first-child">Strains: 1, EX36<sup>T</sup> (data from this study); 2, <span class="named-content species" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="S. linguale"
+                              href="doi:10.1601/nm.8318"><em>S. linguale</em></a></span> DSM 74<sup>T</sup> (data from this study); 3, <span class="named-content species" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="S. luteum"
+                              href="doi:10.1601/nm.14215"><em>S. luteum</em></a></span> DSM 19990<sup>T</sup> (<a id="xref-ref-6-4" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>); 4, <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="S. spitsbergense"
+                              href="doi:10.1601/nm.14214"><em>S. spitsbergense</em></a></span> DSM 19989<sup>T</sup> (<a id="xref-ref-6-5" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>); 5, <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="S. rigui"
+                              href="doi:10.1601/nm.11571"><em>S. rigui</em></a></span> KCTC 12531<sup>T</sup> (<a id="xref-ref-1-3" class="xref-bibr" href="#ref-1">Baik <em>et al.</em>, 2007</a>); 6, <span class="named-content species" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="S. panaciterrae"
+                              href="doi:10.1601/nm.13622"><em>S. panaciterrae</em></a></span> DSM 21099<sup>T</sup> (<a id="xref-ref-21-3" class="xref-bibr" href="#ref-21">Ten <em>et al.</em>, 2009</a>). <span class="sc">tr</span>, Trace amount (&lt;1 %); −, not detected.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-16">The predominant menaquinone, in accordance with all other species of the genus <span class="named-content genus" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span>, was MK-7. As polar lipids, phosphatidylethanolamine, two aminophospholipids, two aminolipids, a glycolipid and three unknown
+                  lipids were detected on the TLC plate. The DNA G+C content of strain EX36<sup>T</sup> was 47.2 mol%, which is lower than reported values for all other species of the genus <span class="named-content genus" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> with validly published names.
+               </p>
+               <p id="p-17">The analysis of DNA−DNA similarity of strain EX36<sup>T</sup> with its nearest phylogenetic neighbour <span class="named-content species" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="S. linguale"
+                        href="doi:10.1601/nm.8318"><em>S. linguale</em></a></span> DSM 74<sup>T</sup> was also carried out by the Identification Service of the DSMZ. The experiment was performed in duplicates. DNA−DNA hybridization
+                  showed a DNA−DNA similarity of 12.2 % (second measurement: 17.2 %), demonstrating that these two strains do not represent
+                  the same species.
+               </p>
+               <p id="p-18">The present data regarding 16S rRNA gene sequence analysis, physiological, chemotaxonomic and morphological properties indicate
+                  that strain EX36<sup>T</sup> represents a distinct species in the genus <span class="named-content genus" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span>, for which the name <span class="named-content genus" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> <em>endophyticum</em> sp. nov. is proposed.
+               </p>
+               <div class="section" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  
+                  <div id="sec-2" class="subsection">
+                     
+                     <h3>Description of <span class="named-content genus" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                              href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> <em>endophyticum</em> sp. nov.
+                     </h3>
+                     
+                     <p id="p-19"><em>Spirosoma endophyticum</em> (en.do.phy′ti.cum. Gr. Pref. <em>endo</em> within; Gr. n. <em>phyton</em> plant; L. neut. suff. ‐<em>icum</em> adjectival suffix used with the sense of belonging to; N.L. neut. adj. <em>endophyticum</em> within plant, referring to the endophytic nature of the strain and its isolation from plant tissue).
+                     </p>
+                     
+                     <p id="p-20">Cells are rod-shaped, Gram-reaction-negative, non-spore-forming, with a size of 1.2×2–17.5 µm. A yellow pigment which is not
+                        of the flexirubin type is produced. Filaments up to 55 µm may be formed. Colonies on 10 % TSA are opaque, semi-translucent
+                        with a smooth and shiny surface and a circular, convex shape. Aerobic growth occurs at 20–28 °C (optimum at 28 °C), pH 5–8
+                        (optimum at pH 7); tolerates concentrations up to 0.6 % NaCl (w/v) in the medium, whereas best growth was achieved in absence
+                        of NaCl. Positive for catalase and oxidase activity. Nitrate is not reduced and indole is not produced. Negative for glucose
+                        fermentation, hydrolysis of arginine and gelatin, and urease activities and positive for aesculin hydrolysis. Does not utilize
+                        the following substrates: arabinose, mannitol, <em>N</em>-acetylglucosamine, gluconate, caprate, adipate, malate, citrate, phenylacetate, β-methyl <span class="sc">d</span>-glucoside, <span class="sc">d</span>-salicin, <span class="sc">n</span>-acetyl-β-<span class="sc">d</span>-mannosamine, <span class="sc">n</span>-acetyl neuraminic acid, <span class="sc">d</span>-galactose, <span class="sc">d</span>-fucose, <span class="sc">l</span>-fucose, <span class="sc">l</span>-rhamnose, inosine, <span class="sc">d</span>-arabitol, <em>myo</em>-inositol, <span class="sc">d</span>-aspartic acid, <span class="sc">d</span>-serine, glycyl-<span class="sc">l</span>-proline, <span class="sc">l</span>-alanine, <span class="sc">l</span>-arginine, <span class="sc">l</span>-aspartic acid, <span class="sc">l</span>-glutamic acid, <span class="sc">l</span>-serine and pectin. The following substrates are weakly utilized: dextrin, maltose, trehalose, cellobiose, gentiobiose, sucrose,
+                        turanose, stachyose, α-lactose, melibiose, α-<span class="sc">d</span>-glucose, <span class="sc">d</span>-mannose, <span class="sc">d</span>-fructose, <span class="sc">d</span>-mannitol and <span class="sc">l</span>-histidine. <span class="sc">d</span>-Raffinose and <em>N</em>-acetyl-<span class="sc">d</span>-glucosamine are utilized. Susceptible to the following antibiotics (µg per disc): streptomycin (10), kanamycin (30), chloramphenicol
+                        (60) and rifampicin (15) and resistant to ampicillin (10), polymyxin B (20), tetracycline (15) and erythromycin (15). The
+                        major fatty acids are summed feature 3 (iso-C<sub>15 : 0</sub> 2-OH and/or C<sub>16 : 1</sub>ω7<em>c</em>), C<sub>16 : 1</sub>ω5<em>c</em>, iso-C<sub>17 : 0</sub> 3-OH and iso-C<sub>15 : 0</sub>; the complete fatty acid profile can be found in <a id="xref-table-wrap-2-2" class="xref-table" href="#T2">Table 2</a>. The predominant menaquinone is MK-7. The major polar lipid is phosphatidylethanolamine.
+                     </p>
+                     
+                     <p id="p-21">The type strain, EX36<sup>T</sup> ( = DSM 26130<sup>T</sup> = LMG 27272<sup>T</sup>), was isolated from Zn/Cd-accumulating <em>Salix caprea</em> in Arnoldstein, Austria. The DNA G+C content of the type strain is 47.2 mol%.
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-22">We thank Marlies Polt for technical support and Katharina Fallmann, Friederike Trognitz and Muhammad Naveed for helpful discussions.
+                     This study was supported by the Austrian Science Foundation [Förderung der wissenschaftlichen Forschung (FWF) grant no. L561-B17].
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.1"
+                             data-doi="10.1099/ijs.0.65302-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baik</span>,  <span class="cit-name-given-names">K. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">M. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Park</span>,  <span class="cit-name-given-names">S. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">D. W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">S. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ka</span>,  <span class="cit-name-given-names">J.-O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Choi</span>,  <span class="cit-name-given-names">S. K.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Seong</span>,  <span class="cit-name-given-names">C. N.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title"><em>Spirosoma rigui</em> sp. nov., isolated from fresh water</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">57</span>, <span class="cit-fpage">2870</span>–<span class="cit-lpage">2873</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.65302-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18048741</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=57/12/2870"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.2"
+                             data-doi="10.1099/ijs.0.02136-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bernardet</span>,  <span class="cit-name-given-names">J.-F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nakagawa</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Holmes</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth cit-collab">Subcommittee on the taxonomy of Flavobacterium and Cytophaga-like bacteria of the International Committee on Systematics of
+                                       Prokaryotes</span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title">Proposed minimal standards for describing new taxa of the family <em>Flavobacteriaceae</em> and emended description of the family</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">52</span>, <span class="cit-fpage">1049</span>–<span class="cit-lpage">1070</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.02136-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>12054224</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=52/3/1049"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Buck</span>,  <span class="cit-name-given-names">J. D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1982</span><strong>).</strong> <span class="cit-article-title">Nonstaining (KOH) method for determination of Gram reactions of marine bacteria</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">44</span>, <span class="cit-fpage">992</span>–<span class="cit-lpage">993</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>6184019</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=44/4/992"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.4"
+                             data-doi="10.1099/00207713-51-3-827">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Denner</span>,  <span class="cit-name-given-names">E. B. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Paukner</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kämpfer</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">E. R. B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Abraham</span>,  <span class="cit-name-given-names">W. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Busse</span>,  <span class="cit-name-given-names">H.-J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wanner</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lübitz</span>,  <span class="cit-name-given-names">W.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2001</span><strong>).</strong> <span class="cit-article-title"><em>Sphingomonas pituitosa</em> sp. nov., an exopolysaccharide-producing bacterium that secretes an unusual type of sphingan</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">51</span>, <span class="cit-fpage">827</span>–<span class="cit-lpage">841</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-51-3-827</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>11411704</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=51/3/827"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.5"
+                             data-doi="10.1093/nar/17.19.7843">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Edwards</span>,  <span class="cit-name-given-names">U.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rogall</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Blöcker</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Emde</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Böttger</span>,  <span class="cit-name-given-names">E. C.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989</span><strong>).</strong> <span class="cit-article-title">Isolation and direct complete nucleotide determination of entire genes. Characterization of a gene coding for 16S ribosomal
+                                    RNA</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">17</span>, <span class="cit-fpage">7843</span>–<span class="cit-lpage">7853</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/17.19.7843</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>2798131</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=17/19/7843"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.6"
+                             data-doi="10.1099/ijs.0.002725-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Finster</span>,  <span class="cit-name-given-names">K. W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Herbert</span>,  <span class="cit-name-given-names">R. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lomstein</span>,  <span class="cit-name-given-names">B. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title"><em>Spirosoma spitsbergense</em> sp. nov. and <em>Spirosoma luteum</em> sp. nov., isolated from a high Arctic permafrost soil, and emended description of the genus <em>Spirosoma</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">59</span>, <span class="cit-fpage">839</span>–<span class="cit-lpage">844</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.002725-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19329617</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=59/4/839"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.7"
+                             data-doi="10.1046/j.1462-2920.2002.00362.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hall</span>,  <span class="cit-name-given-names">T. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1999</span><strong>).</strong> <span class="cit-article-title">BioEdit: a user-friendly biological sequence alignment editor and analysis program for Windows 95/98/NT</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Symp Ser</abbr> <span class="cit-vol">41</span>, <span class="cit-fpage">95</span>–<span class="cit-lpage">98</span>.</cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1046/j.1462-2920.2002.00362.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=12460286&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=BioEdit%3A%20a%20user-friendly%20biological%20sequence%20alignment%20editor%20and%20analysis%20program%20for%20Windows%2095%2F98%2FNT&amp;author=T.%20A.%20Hall&amp;publication_year=1999&amp;journal=Nucleic%20Acids%20Symp%20Ser&amp;volume=41&amp;pages=95-98">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.8"
+                             data-doi="10.1099/ijs.0.038075-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">O. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cho</span>,  <span class="cit-name-given-names">Y. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yoon</span>,  <span class="cit-name-given-names">S. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Na</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Park</span>,  <span class="cit-name-given-names">S. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jeon</span>,  <span class="cit-name-given-names">Y. S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">J. H.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Introducing EzTaxon-e: a prokaryotic 16S rRNA gene sequence database with phylotypes that represent uncultured species</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">62</span>, <span class="cit-fpage">716</span>–<span class="cit-lpage">721</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.038075-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22140171</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=62/Pt_3/716"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.9"
+                             data-doi="10.1007/s11104-007-9517-9">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuffner</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Puschenreiter</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wieshammer</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gorfer</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sessitsch</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Rhizosphere bacteria affect growth and metal uptake of heavy metal accumulating willows</span>. <abbr class="cit-jnl-abbrev">Plant Soil</abbr> <span class="cit-vol">304</span>, <span class="cit-fpage">35</span>–<span class="cit-lpage">44</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s11104-007-9517-9</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s11104-007-9517-9&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Rhizosphere%20bacteria%20affect%20growth%20and%20metal%20uptake%20of%20heavy%20metal%20accumulating%20willows&amp;author=M.%20Kuffner&amp;author=M.%20Puschenreiter&amp;author=G.%20Wieshammer&amp;author=M.%20Gorfer&amp;author=A.%20Sessitsch&amp;publication_year=2008&amp;journal=Plant%20Soil&amp;volume=304&amp;pages=35-44&amp;doi=10.1007%2Fs11104-007-9517-9">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.10"
+                             data-doi="10.1111/j.1365-2672.2010.04670.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuffner</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">De Maria</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Puschenreiter</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fallmann</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wieshammer</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gorfer</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Strauss</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rivelli</span>,  <span class="cit-name-given-names">A. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sessitsch</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Culturable bacteria from Zn- and Cd-accumulating <em>Salix caprea</em> with differential effects on plant growth and heavy metal availability</span>. <abbr class="cit-jnl-abbrev">J Appl Microbiol</abbr> <span class="cit-vol">108</span>, <span class="cit-fpage">1471</span>–<span class="cit-lpage">1484</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1365-2672.2010.04670.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20132372</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1365-2672.2010.04670.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20132372&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Culturable%20bacteria%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea%20with%20differential%20effects%20on%20plant%20growth%20and%20heavy%20metal%20availability&amp;author=M.%20Kuffner&amp;author=S.%20De%20Maria&amp;author=M.%20Puschenreiter&amp;author=K.%20Fallmann&amp;author=G.%20Wieshammer&amp;author=M.%20Gorfer&amp;author=J.%20Strauss&amp;author=A.%20R.%20Rivelli&amp;author=A.%20Sessitsch&amp;publication_year=2010&amp;journal=J%20Appl%20Microbiol&amp;volume=108&amp;pages=1471-1484&amp;doi=10.1111%2Fj.1365-2672.2010.04670.x&amp;pmid=20132372">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_12.4586.11">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Larkin</span>,  <span class="cit-name-given-names">J. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Borrall</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1984</span><strong>).</strong> <span class="cit-article-title">Family I. <em>Spirosomaceae</em> Larkin and Borrall 1978, 595<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-vol">vol. 1</span>, pp. <span class="cit-fpage">125</span>–<span class="cit-lpage">126</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span>
+                                 . <span class="cit-publ-loc">Baltimore</span>: <span class="cit-publ-name">Williams &amp; Wilkins</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Family%20I.%20Spirosomaceae%20Larkin%20and%20Borrall%201978%2C%20595AL&amp;author=J.%20M.%20Larkin&amp;author=R.%20Borrall&amp;publication_year=1984&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.12"
+                             data-doi="10.1093/nar/gkh293">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ludwig</span>,  <span class="cit-name-given-names">W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Strunk</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Westram</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Richter</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Meier</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yadhukumar</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Buchner</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lai</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Steppi</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title"><span class="sc">arb</span>: a software environment for sequence data</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">32</span>, <span class="cit-fpage">1363</span>–<span class="cit-lpage">1371</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkh293</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14985472</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=32/4/1363"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.13"
+                             data-doi="10.1093/bioinformatics/4.1.11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Myers</span>,  <span class="cit-name-given-names">E. W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miller</span>,  <span class="cit-name-given-names">W.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1988</span><strong>).</strong> <span class="cit-article-title">Optimal alignments in linear space</span>. <abbr class="cit-jnl-abbrev">Comput Appl Biosci</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">11</span>–<span class="cit-lpage">17</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>3382986</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=bioinfo&amp;resid=4/1/11"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.14">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Neidhardt</span>,  <span class="cit-name-given-names">F. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bloch</span>,  <span class="cit-name-given-names">P. L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smith</span>,  <span class="cit-name-given-names">D. F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1974</span><strong>).</strong> <span class="cit-article-title">Culture medium for enterobacteria</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">119</span>, <span class="cit-fpage">736</span>–<span class="cit-lpage">747</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4604283</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=119/3/736"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.15"
+                             data-doi="10.1093/nar/gkm864">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pruesse</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Quast</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Knittel</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fuchs</span>,  <span class="cit-name-given-names">B. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ludwig</span>,  <span class="cit-name-given-names">W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Peplies</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Glöckner</span>,  <span class="cit-name-given-names">F. O.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title"><span class="sc">silva</span>: a comprehensive online resource for quality checked and aligned ribosomal RNA sequence data compatible with <span class="sc">arb</span></span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">35</span>, <span class="cit-fpage">7188</span>–<span class="cit-lpage">7196</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkm864</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17947321</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=35/21/7188"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.16"
+                             data-doi="10.1007/s13127-011-0056-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Silvestro</span>,  <span class="cit-name-given-names">D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Michalak</span>,  <span class="cit-name-given-names">I.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">raxmlGUI: A graphical front-end for RAxML</span>. <abbr class="cit-jnl-abbrev">Org Divers Evol</abbr> <span class="cit-vol">12</span>, <span class="cit-fpage">335</span>–<span class="cit-lpage">337</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s13127-011-0056-0</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s13127-011-0056-0&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=raxmlGUI%3A%20A%20graphical%20front-end%20for%20RAxML&amp;author=D.%20Silvestro&amp;author=I.%20Michalak&amp;publication_year=2012&amp;journal=Org%20Divers%20Evol&amp;volume=12&amp;pages=335-337&amp;doi=10.1007%2Fs13127-011-0056-0">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_12.4586.17">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Gerhardt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">W. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smibert</span>,  <span class="cit-name-given-names">R. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Phenotypic characterization</span>. In <span class="cit-source">Methods for General and Molecular Bacteriology</span>, pp. <span class="cit-fpage">607</span>–<span class="cit-lpage">654</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Gerhardt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">W. A.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span>
+                                 . <span class="cit-publ-loc">Washington, DC</span>: <span class="cit-publ-name">American Society for Microbiology</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phenotypic%20characterization&amp;author=R.%20M.%20Smibert&amp;author=N.%20R.%20Krieg&amp;publication_year=1994&amp;citation_inbook_title=Methods%20for%20General%20and%20Molecular%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.18"
+                             data-doi="10.1093/bioinformatics/btl446">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006a</span><strong>).</strong> <span class="cit-article-title">RAxML-VI-HPC: maximum likelihood-based phylogenetic analyses with thousands of taxa and mixed models</span>. <abbr class="cit-jnl-abbrev">Bioinformatics</abbr> <span class="cit-vol">22</span>, <span class="cit-fpage">2688</span>–<span class="cit-lpage">2690</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/bioinformatics/btl446</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16928733</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=bioinfo&amp;resid=22/21/2688"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-19-1" title="View reference  in text"
+                           id="ref-19">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_12.4586.19">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006b</span><strong>).</strong> <span class="cit-article-title">Phylogenetic models of rate heterogeneity: a high performance computing perspective</span>. In: <span class="cit-source">Proc. of IPDPS2006</span>, pp. <span class="cit-fpage">253</span>. <span class="cit-publ-name">IEEE Computer Society</span>. <span class="cit-publ-loc">Washington, DC</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phylogenetic%20models%20of%20rate%20heterogeneity%3A%20a%20high%20performance%20computing%20perspective&amp;author=A.%20Stamatakis&amp;publication_year=2006b&amp;citation_inbook_title=Proc.%20of%20IPDPS2006">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.20"
+                             data-doi="10.1080/10635150802429642">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hoover</span>,  <span class="cit-name-given-names">P.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rougemont</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">A rapid bootstrap algorithm for the RAxML Web servers</span>. <abbr class="cit-jnl-abbrev">Syst Biol</abbr> <span class="cit-vol">57</span>, <span class="cit-fpage">758</span>–<span class="cit-lpage">771</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1080/10635150802429642</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18853362</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=sysbio&amp;resid=57/5/758"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.21"
+                             data-doi="10.1099/ijs.0.002436-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ten</span>,  <span class="cit-name-given-names">L. N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Xu</span>,  <span class="cit-name-given-names">J.-L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jin</span>,  <span class="cit-name-given-names">F.-X.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Im</span>,  <span class="cit-name-given-names">W.-T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Oh</span>,  <span class="cit-name-given-names">H.-M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">S.-T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title"><em>Spirosoma panaciterrae</em> sp. nov., isolated from soil</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">59</span>, <span class="cit-fpage">331</span>–<span class="cit-lpage">335</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.002436-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19196773</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=59/2/331"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.22">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Weisburg</span>,  <span class="cit-name-given-names">W. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Barns</span>,  <span class="cit-name-given-names">S. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pelletier</span>,  <span class="cit-name-given-names">D. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lane</span>,  <span class="cit-name-given-names">D. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1991</span><strong>).</strong> <span class="cit-article-title">16S ribosomal DNA amplification for phylogenetic study</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">173</span>, <span class="cit-fpage">697</span>–<span class="cit-lpage">703</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>1987160</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=173/2/697"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.23"
+                             data-doi="10.1007/BF00160154">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yang</span>,  <span class="cit-name-given-names">Z. H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Maximum likelihood phylogenetic estimation from DNA sequences with variable rates over sites: approximate methods</span>. <abbr class="cit-jnl-abbrev">J Mol Evol</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">306</span>–<span class="cit-lpage">314</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/BF00160154</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>7932792</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/BF00160154&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7932792&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Maximum%20likelihood%20phylogenetic%20estimation%20from%20DNA%20sequences%20with%20variable%20rates%20over%20sites%3A%20approximate%20methods&amp;author=Z.%20H.%20Yang&amp;publication_year=1994&amp;journal=J%20Mol%20Evol&amp;volume=39&amp;pages=306-314&amp;doi=10.1007%2FBF00160154&amp;pmid=7932792">Google Scholar</a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_12/4580.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_12/4591.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_12.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="open-access-note">
+               <span class="open-access-note">OPEN ACCESS ARTICLE</span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    <span class="slug-metadata-note ahead-of-print">
+                                 	
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">August 1, 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.052654-0" class="slug-doi">10.1099/ijs.0.052654-0
+                                    </span>
+                                 </span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    December 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 12 
+                                    </span><span class="slug-pages">
+                                    4586-4590
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li><span class="creative-commons-article">Free via Creative Commons: <span>CC</span></span></li>
+                        <li><span class="ccv cc-version-by/2.5/"></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_12/4586.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_12/4586.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_12/4586/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_12/4586">PPT Slides of All Figures</a></li>
+                        <li class="cb-versions">
+                           <div><span id="pap-all-versions-label">All Versions of this Article:</span><ol class="version-list">
+                                 <li><a href="/content/early/2013/08/01/ijs.0.052654-0">ijs.0.052654-0v1</a></li>
+                                 <li class="current-li"><span>63/Pt_12/4586</span> <span class="current-version">most recent</span></li>
+                              </ol>
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings">
+                              <li>New Taxa
+                                 <ul class="subject-sub-headings last-child">
+                                    <li><a class="tocsection-search"
+                                          href="/search?tocsectionid=Bacteroidetes&amp;sortspec=date&amp;submit=Submit">Bacteroidetes</a></li>
+                                 </ul>
+                              </li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_12%2F4586&amp;current-view-path=/content/63/Pt_12/4586.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_12%2F4586&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_12/4586.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_12/4586&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_12/4586.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.052654-0&amp;citation=Fries%20et%20al.%2063%20%28Pt%2012%29:%204586&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_12%2F4586&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=23907231&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_12%2F4586">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_12/4586.full?cited-by=yes&amp;legid=ijs;63/Pt_12/4586#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_12/4586" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_12%2F4586&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_12/4586.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AFries%20author%3AJ.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Fries, J.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ASessitsch%20author%3AA.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Sessitsch, A.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_12/4586.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=23907231&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Fries%20J&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Fries, J.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Sessitsch%20A&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Sessitsch, A.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/23907231"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_12/4586.full?related-urls=yes&amp;legid=ijs;63/Pt_12/4586#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.pdf
new file mode 100644
index 00000000..5c2ed86f
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/results.json b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/results.json
new file mode 100644
index 00000000..d3867c09
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsem-mounce-OLD-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/results.json
@@ -0,0 +1,90 @@
+{
+  "publisher": {
+    "value": [
+      "Society for General Microbiology"
+    ]
+  },
+  "journal": {
+    "value": [
+      "International Journal of Systematic and Evolutionary\n                Microbiology"
+    ]
+  },
+  "title": {
+    "value": [
+      "Spirosoma endophyticum sp. nov., isolated from Zn- and Cd-accumulating Salix caprea"
+    ]
+  },
+  "authors": {
+    "value": [
+      "Julia Fries",
+      "Stefan Pfeiffer",
+      "Melanie Kuffner",
+      "Angela Sessitsch"
+    ]
+  },
+  "date": {
+    "value": [
+      "12/01/2013"
+    ]
+  },
+  "doi": {
+    "value": [
+      "10.1099/ijs.0.052654-0"
+    ]
+  },
+  "volume": {
+    "value": [
+      "63"
+    ]
+  },
+  "issue": {
+    "value": [
+      "Pt 12"
+    ]
+  },
+  "firstpage": {
+    "value": [
+      "4586"
+    ]
+  },
+  "abstract": {
+    "value": [
+      "\n                  \n                      Next Section\n                  Abstract\n                  \n                  A Gram-reaction-negative, yellow-pigmented strain, designated EX36T, was characterized using a polyphasic approach comprising phylogenetic, morphological and genotypic analyses. The endophytic\n                     strain was isolated from Zn/Cd-accumulating Salix caprea in Arnoldstein, Austria. Analysis of the 16S rRNA gene demonstrated that the novel strain is most closely related to members\n                     of the genus Spirosoma (95 % sequence similarity with Spirosoma linguale). The genomic DNA G+C content was 47.2 mol%. The predominant quinone was and the major cellular fatty acids were summed feature\n                     3 (iso-C15 : 0 2-OH and/or C16 : 1ω7c), C16 : 1ω5c, iso-C17 : 0 3-OH and iso-C15 : 0. On the basis of its phenotypic and genotypic properties, strain EX36T should be classified as a novel species of the genus Spirosoma, for which the name Spirosoma endophyticum sp. nov. is proposed. The type strain is EX36T ( = DSM 26130T = LMG 27272T).\n                  \n                  \n               "
+    ]
+  },
+  "fulltext_html": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_12/4586.full"
+    ]
+  },
+  "fulltext_pdf": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_12/4586.full.pdf"
+    ]
+  },
+  "supplementary_material": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_12/4586/suppl/DC1"
+    ]
+  },
+  "figure": {
+    "value": [
+      "http://ijs.sgmjournals.org/content/63/Pt_12/4586/F1.small.gif"
+    ]
+  },
+  "figure_caption": {
+    "value": [
+      "Fig. 1.  \n                     \n                     Maximum-likelihood tree (bootstrap: 100 replicates) based on 16S rRNA gene sequence data (sequence length 1296 bp) showing\n                        the phylogenetic position of strain EX36T among related species selected from the phylum Bacteroidetes. Cardiobacterium hominis ATCC 15826T (M35014) was used as an outgroup.\n                     \n                     \n                     \n                  "
+    ]
+  },
+  "license": {
+    "value": [
+      "\n                  This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted\n                     use, distribution, and reproduction in any medium, provided the original work is properly cited.\n                  \n               "
+    ]
+  },
+  "copyright": {
+    "value": [
+      "Copyright ©\n                     \t\t2015 International Union of Microbiological Societies\n                     \t\n                  "
+    ]
+  }
+}
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_53_1_1.full/fulltext.html b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_53_1_1.full/fulltext.html
new file mode 100644
index 00000000..62ce95ee
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_53_1_1.full/fulltext.html
@@ -0,0 +1,625 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Validation of publication of new names and new combinations previously effectively published outside the IJSEM </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/53/1/1" />
+      <meta content="/ijs/53/1/1.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Validation of publication of new names and new combinations previously effectively published outside the IJSEM"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.02651-0" name="DC.Identifier" />
+      <meta content="2003-01-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta content="Validation of publication of new names and new combinations previously effectively published outside the IJSEM"
+            name="citation_title" />
+      <meta content="01/01/2003" name="citation_date" />
+      <meta content="53" name="citation_volume" />
+      <meta content="1" name="citation_issue" />
+      <meta content="1" name="citation_firstpage" />
+      <meta content="2" name="citation_lastpage" />
+      <meta content="53/1/1" name="citation_id" />
+      <meta content="53/1/1" name="citation_id_from_sass_path" />
+      <meta content="ijs;53/1/1" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.02651-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/53/1/1.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/53/1/1.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/53/1/1.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/53/1.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/53/1/1" name="citation_public_url" />
+      <meta content="12656143" name="citation_pmid" />
+      <meta name="citation_section" content="Validation List no. 89" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/52/6/2343.short" rel="prev" />
+      <link href="/content/53/1/3.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d120744727e1">var callbackToken='563573351D2F54F';</script><script type="text/javascript" id="session-d120744727e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search-go" id="header-qs-search-go-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F53%2F1%2F1.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view" itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline">Validation of publication of new names and new combinations previously effectively published outside the IJSEM</h1>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  <p id="p-1">The purpose of this announcement is to effect the valid publication of the following new names and new combinations under
+                     the procedure described previously [<em>Int J</em> <em>Syst Bacteriol</em> <strong>27</strong>(3), iv (1977)]. Authors and other individuals wishing to have new names and/or combinations included in future lists should
+                     send <strong>the pertinent reprint or a photocopy thereof to the IJSEM Editorial Office</strong> for confirmation that all of the other requirements for valid publication have been met. It should be noted that the date
+                     of valid publication of these new names and combinations is the date of publication of this list, not the date of the original
+                     publication of the names and combinations. The authors of the new names and combinations are as given below, and these authors'
+                     names will be included in the author index of the present issue and in the volume author index. Inclusion of a name on these
+                     lists validates the name and thereby makes it available in bacteriological nomenclature. The inclusion of a name on this list
+                     is not to be construed as taxonomic acceptance of the taxon to which the name is applied. Indeed, some of these names may,
+                     in time, be shown to be synonyms, or the organisms may be transferred to another genus, thus necessitating the creation of
+                     a new combination.<a id="xref-table-wrap-1-1" class="xref-down-link" href="#T1"><span>⇓</span></a></p>
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list">
+                     <li><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference 1 in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-other" id="cit-53.1.1.1"
+                             data-doi="10.1128/AEM.68.9.4266-4273.2002">
+                           <div class="cit-metadata"><cite><strong>Albuquerque, L., Santos, J., Travassos, P., Nobre, M. F., Rainey, F. A., Wait, R., Empadinhas, N., Silva, M. T. &amp; da Costa,
+                                    M. S.</strong> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <em>Albidovulum inexpectatum</em> gen. nov., sp. nov., a nonphotosynthetic and slightly thermophilic bacterium from a marine hot spring that is very closely
+                                 related to members of the photosynthetic genus <em>Rhodovulum</em>. <span class="cit-source">Appl Environ Microbiol</span> <span class="cit-vol">68</span>, <span class="cit-fpage">4266</span>–4273.</cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=68/9/4266"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference 2 in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-other" id="cit-53.1.1.2"
+                             data-doi="10.1007/s00792-001-0259-y">
+                           <div class="cit-metadata"><cite><strong>Eder, W. &amp; Huber, R.</strong> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> New isolates and physiological properties of the <em>Aquificales</em> and description of <em>Thermocrinis albus</em> sp. nov. <span class="cit-source">Extremophiles</span> <span class="cit-vol">6</span>, <span class="cit-fpage">309</span>–318.</cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s00792-001-0259-y&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=12215816&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a></div>
+                        </div>
+                     </li>
+                     <li><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference 3 in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-other" id="cit-53.1.1.3"
+                             data-doi="10.1078/0723-2020-00134">
+                           <div class="cit-metadata"><cite><strong>Goris, J., Dejonghe, W., Falsen, E., De Clerck, E., Geeraerts, B., Willems, A., Top, E. M., Vandamme, P. &amp; De Vos, P.</strong> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> Diversity of transconjugants that acquired plasmid pJP4 or pEMT1 after inoculation of a donor strain in the A- and B-horizon
+                                 of an agricultural soil and description of <em>Burkholderia hospita</em> sp. nov. and <em>Burkholderia terricola</em> sp. nov. <span class="cit-source">Syst Appl Microbiol</span> <span class="cit-vol">25</span>, <span class="cit-fpage">340</span>–352.</cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1078/0723-2020-00134&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=12421072&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a></div>
+                        </div>
+                     </li>
+                     <li><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference 4 in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-other" id="cit-53.1.1.4"
+                             data-doi="10.1128/JCM.40.9.3427-3431.2002">
+                           <div class="cit-metadata"><cite><strong>Hall, V., Collins, M. D., Hutson, R., Falsen, E. &amp; Duerden, B. I.</strong> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <em>Actinomyces cardiffensis</em> sp. nov. from human clinical sources. <span class="cit-source">J Clin Microbiol</span> <span class="cit-vol">40</span>, <span class="cit-fpage">3427</span>–3431.</cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jcm&amp;resid=40/9/3427"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference 5 in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-other" id="cit-53.1.1.5">
+                           <div class="cit-metadata"><cite><strong>Otoguro, M., Hayakawa, M., Yamazaki, T., Tamura, T., Hatano, K. &amp; Iimura, Y.</strong> <strong>(</strong><span class="cit-pub-date">2001</span><strong>).</strong> Numerical phenetic and phylogenetic analyses of <em>Actinokineospora</em> isolates, with a description of <em>Actinokineospora</em> <em>auranticolor</em> sp. nov. and <em>Actinokineospora</em> <em>enzanensis</em> sp. nov. <span class="cit-source">Actinomycetologica</span> <span class="cit-vol">15</span>, <span class="cit-fpage">30</span>–39.</cite></div>
+                           <div class="cit-extra"></div>
+                        </div>
+                     </li>
+                     <li><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference 6 in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-other" id="cit-53.1.1.6"
+                             data-doi="10.1078/0723-2020-00130">
+                           <div class="cit-metadata"><cite><strong>Place, R. B., Hiestand, D., Burri, S. &amp; Teuber, M.</strong> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <em>Staphylococcus succinus</em> subsp. <em>casei</em> subsp. nov., a dominant isolate from surface ripened cheese. <span class="cit-source">Syst Appl Microbiol</span> <span class="cit-vol">25</span>, <span class="cit-fpage">353</span>–359.</cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1078/0723-2020-00130&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=12421073&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a></div>
+                        </div>
+                     </li>
+                     <li><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference 7 in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-other" id="cit-53.1.1.7">
+                           <div class="cit-metadata"><cite><strong>Stetter, K. O.</strong> <strong>(</strong><span class="cit-pub-date">2001</span><strong>).</strong> Genus VII. <em>Thermodiscus</em> gen. nov. In <em>Bergey's Manual of Systematic Bacteriology</em>, 2nd edn, vol. 1 (<em>The Archaea and the Deeply Branching and Phototrophic Bacteria</em>), pp. 189–190. Edited by D. R. Boone, R. W. Castenholz &amp; G. M. Garrity. New York: Springer.</cite></div>
+                           <div class="cit-extra"></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div>
+               <div class="table pos-float" id="T1">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="1/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="1/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/52/6/2343.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/53/1/3.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/53/1.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.02651-0" class="slug-doi">10.1099/ijs.0.02651-0
+                                 </span>
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    January 2003 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 53 
+                                    </span><span class="slug-issue">
+                                    no. 1 
+                                    </span><span class="slug-pages">
+                                    1-2
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/53/1/1.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/53/1/1.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings last-child">
+                              <li><a class="tocsection-search"
+                                    href="/search?tocsectionid=Validation+List+no.+89&amp;sortspec=date&amp;submit=Submit">Validation List no. 89</a></li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B53%2F1%2F1&amp;current-view-path=/content/53/1/1.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B53%2F1%2F1&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/53/1/1.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=53/1/1&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/53/1/1.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3B53%2F1%2F1&amp;citation=%2053%20%281%29:%201&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B53%2F1%2F1&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=12656143&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B53%2F1%2F1">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" alt="Permissions" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/53/1/1.full?cited-by=yes&amp;legid=ijs;53/1/1#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/53/1/1" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F53%2F1%2F1&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/53/1/1.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/53/1/1.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=12656143&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/12656143"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/53/1/1.full?related-urls=yes&amp;legid=ijs;53/1/1#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/53/1/1&amp;title=Validation%20of%20publication%20of%20new%20names%20and%20new%20combinations%20previously%20effectively%20published%20outside%20the%20IJSEM+--+%2053%20%281%29%3A%201+--+&amp;doi=10.1099/ijs.0.02651-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_53_1_1.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_53_1_1.full/fulltext.pdf
new file mode 100644
index 00000000..c1f7c97f
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_53_1_1.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F3.large.jpg b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F3.large.jpg
new file mode 100644
index 00000000..a5062c09
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/F3.large.jpg differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.html b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.html
new file mode 100644
index 00000000..bfec021c
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.html
@@ -0,0 +1,1754 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Sulfurimonas gotlandica sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline,
+         and an emended description of the genus Sulfurimonas 
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4141" />
+      <meta content="/ijs/63/Pt_11/4141.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Sulfurimonas gotlandica sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline, and an emended description of the genus Sulfurimonas"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.048827-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Matthias Labrenz" name="DC.Contributor" />
+      <meta content="Jana Grote" name="DC.Contributor" />
+      <meta content="Kerstin Mammitzsch" name="DC.Contributor" />
+      <meta content="Henricus T. S. Boschker" name="DC.Contributor" />
+      <meta content="Michael Laue" name="DC.Contributor" />
+      <meta content="Günter Jost" name="DC.Contributor" />
+      <meta content="Sabine Glaubitz" name="DC.Contributor" />
+      <meta content="Klaus Jürgens" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Matthias Labrenz" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Jana Grote" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Kerstin Mammitzsch" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Henricus T. S. Boschker" />
+      <meta name="citation_author_institution"
+            content="2Royal Netherlands Institute of Sea Research (NIOZ), Yerseke, Netherlands" />
+      <meta name="citation_author" content="Michael Laue" />
+      <meta name="citation_author_institution"
+            content="3Arbeitsbereich Medizinische Biologie und Elektronenmikroskopisches Zentrum (EMZ), Universität Rostock, Germany" />
+      <meta name="citation_author" content="Günter Jost" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Sabine Glaubitz" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta name="citation_author" content="Klaus Jürgens" />
+      <meta name="citation_author_institution"
+            content="1IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany" />
+      <meta content="Sulfurimonas gotlandica sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline, and an emended description of the genus Sulfurimonas"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4141" name="citation_firstpage" />
+      <meta content="4148" name="citation_lastpage" />
+      <meta content="63/Pt_11/4141" name="citation_id" />
+      <meta content="63/Pt 11/4141" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4141" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.048827-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4141.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4141.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4141.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4141"
+            name="citation_public_url" />
+      <meta content="23749282" name="citation_pmid" />
+      <meta name="citation_access" content="all" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Proteobacteria" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4136.short" rel="prev" />
+      <link href="/content/63/Pt_11/4149.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d118285018e1">var callbackToken='563169098C3DE36';</script><script type="text/javascript" id="session-d118285018e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4141.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline"><em>Sulfurimonas gotlandica</em> sp. nov., a chemoautotrophic and psychrotolerant epsilonproteobacterium isolated from a pelagic redoxcline, and an emended
+                  description of the genus <em>Sulfurimonas</em></h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Matthias+Labrenz&amp;sortspec=date&amp;submit=Submit">Matthias Labrenz</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Jana+Grote&amp;sortspec=date&amp;submit=Submit">Jana Grote</a></span><a id="xref-aff-1-2" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-1" class="xref-fn" href="#fn-1">†</a><a id="xref-fn-2-1" class="xref-fn" href="#fn-2">‡</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Kerstin+Mammitzsch&amp;sortspec=date&amp;submit=Submit">Kerstin Mammitzsch</a></span><a id="xref-aff-1-3" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-2" class="xref-fn" href="#fn-1">†</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-4" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Henricus+T.+S.+Boschker&amp;sortspec=date&amp;submit=Submit">Henricus T. S. Boschker</a></span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-5" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Michael+Laue&amp;sortspec=date&amp;submit=Submit">Michael Laue</a></span><a id="xref-aff-3-1" class="xref-aff" href="#aff-3"><sup>3</sup></a><span class="xref-sep">,</span><a id="xref-fn-3-1" class="xref-fn" href="#fn-3">§</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-6" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=G%C3%BCnter+Jost&amp;sortspec=date&amp;submit=Submit">Günter Jost</a></span><a id="xref-aff-1-4" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-7" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Sabine+Glaubitz&amp;sortspec=date&amp;submit=Submit">Sabine Glaubitz</a></span><a id="xref-aff-1-5" class="xref-aff" href="#aff-1"><sup>1</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-8"><span class="name"><a class="name-search"
+                              href="/search?author1=Klaus+J%C3%BCrgens&amp;sortspec=date&amp;submit=Submit">Klaus Jürgens</a></span><a id="xref-aff-1-6" class="xref-aff" href="#aff-1"><sup>1</sup></a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>IOW Leibniz Institute for Baltic Sea Research Warnemuende (IOW), Germany
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>Royal Netherlands Institute of Sea Research (NIOZ), Yerseke, Netherlands
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-3" name="aff-3"></a><address><sup>3</sup>Arbeitsbereich Medizinische Biologie und Elektronenmikroskopisches Zentrum (EMZ), Universität Rostock, Germany
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> Matthias Labrenz <span class="em-link"><span class="em-addr">matthias.labrenz{at}io-warnemuende.de</span></span></li>
+                  </ol>
+                  <ul class="author-notes">
+                     <li class="fn-present-address" id="fn-2">
+                        <p id="p-2"><a class="rev-xref" href="#xref-fn-2-1">↵</a><span class="fn-label">‡</span> <strong>Present address:</strong> Center for Microbial Oceanography: Research and Education, SOEST, University of Hawaii at Manoa, Honolulu, HI 96822, USA.
+                        </p>
+                     </li>
+                     <li class="fn-present-address" id="fn-3">
+                        <p id="p-3"><a class="rev-xref" href="#xref-fn-3-1">↵</a><span class="fn-label">§</span> <strong>Present address:</strong> Robert Koch Institute, Berlin, Germany.
+                        </p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-6">A psychro- and aerotolerant bacterium was isolated from the sulfidic water of a pelagic redox zone of the central Baltic Sea.
+                     The slightly curved rod- or spiral-shaped cells were motile by one polar flagellum or two bipolar flagella. Growth was chemolithoautotrophic,
+                     with nitrate or nitrite as electron acceptor and either a variety of sulfur species of different oxidation states or hydrogen
+                     as electron donor. Although the bacterium was able to utilize organic substances such as acetate, pyruvate, peptone and yeast
+                     extract for growth, these compounds yielded considerably lower cell numbers than obtained with reduced sulfur or hydrogen;
+                     in addition, bicarbonate supplementation was necessary. The cells also had an absolute requirement for NaCl. Optimal growth
+                     occurred at 15 °C and at pH 6.6–8.0. The predominant fatty acid of this organism was 16 : 1ω7<em>c</em>, with 3-OH 14 : 0, 16 : 0, 16 : 1ω5<em>c</em>+<em>t</em> and 18 : 1ω7<em>c</em> present in smaller amounts. The DNA G+C content was 33.6 mol%. As determined in 16S rRNA gene sequence phylogeny analysis,
+                     the isolate belongs to the genus <span class="named-content genus" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                           href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, within the class <span class="named-content class" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                           href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span>, with 93.7 to 94.2 % similarity to the other species of the genus <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                           href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, <span class="named-content species" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                           href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span>, <span class="named-content species" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas paralvinellae"
+                           href="doi:10.1601/nm.10230"><em>Sulfurimonas paralvinellae</em></a></span> and <span class="named-content species" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                           href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span>. However, the distinct physiological and genotypic differences from these previously described taxa support the description
+                     of a novel species, <em>Sulfurimonas gotlandica</em> sp. nov. The type strain is GD1<sup>T</sup> ( = DSM 19862<sup>T</sup> = JCM 16533<sup>T</sup>). Our results also justify an emended description of the genus <span class="named-content genus" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                           href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>.
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-equal" id="fn-1">
+                        <p id="p-1"><a class="rev-xref" href="#xref-fn-1-1">↵</a><span class="fn-label">†</span> These authors contributed equally to this study.
+                        </p>
+                     </li>
+                     <li class="fn-other" id="fn-4">
+                        <p id="p-4">The GenBank/EMBL/DDBJ accession number for the 16S rRNA gene sequence of strain GD1<sup>T</sup> is AFRZ01000001 (804671..806178), locus_tag SMGD1_rRNA3.
+                        </p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="license" id="license-1">
+                  <p id="p-5">This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted
+                     use, distribution, and reproduction in any medium, provided the original work is properly cited.
+                  </p>
+               </div>
+               <p id="p-7">Deep-sea vents are among the most productive marine systems on Earth. The discovery of these primarily chemoautotrophic environments,
+                  in 1977, has been followed by an appreciation of the remarkable physiological and phylogenetic diversity of their endosymbiotic
+                  and often thermophilic inhabitants, most commonly species of the class <span class="named-content class" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                        href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span>. Moreover, deep-sea vent chemolithoautotrophs are thought to be representatives of the earliest biological communities on
+                  Earth (see the review by <a id="xref-ref-26-1" class="xref-bibr" href="#ref-26">Nakagawa &amp; Takai, 2008</a>). Indeed, many epsilonproteobacteria are globally ubiquitous in oxygen-deficient and sulfide-rich marine and terrestrial
+                  ecosystems, which accommodate their predominantly auto- to mixotrophic lifestyles (<a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Campbell <em>et al.</em>, 2006</a>). A number of studies have verified the significant role of epsilonproteobacteria in biogeochemical cycles, particularly
+                  those which are sulfur-dependent, as is the case in deep-sea hydrothermal fields (<a id="xref-ref-27-1" class="xref-bibr" href="#ref-27">Nakagawa <em>et al.</em>, 2005</a>; <a id="xref-ref-8-2" class="xref-bibr" href="#ref-8">Campbell <em>et al.</em>, 2006</a>), sulfidic cave springs (<a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">Engel <em>et al.</em>, 2004</a>) and autotrophic episymbiotic associations (<a id="xref-ref-35-1" class="xref-bibr" href="#ref-35">Suzuki <em>et al.</em>, 2006</a>). In the suboxic to sulfidic transition zones of aquatic pelagic redox zones, high dark CO<sub>2</sub> fixation rates, mainly due to the activities of epsilonproteobacterial chemolithoautotrophs, have been determined, for instance,
+                  in the Black Sea and the Baltic Sea (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Grote <em>et al.</em>, 2008</a>; <a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Glaubitz <em>et al.</em>, 2010</a>; <a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Jost <em>et al.</em>, 2008</a>).
+               </p>
+               <p id="p-8">The Baltic Sea is among the largest brackish basins of the world, with periodically anoxic conditions in its bottom waters.
+                  In the region known as the Baltic Proper there are a number of such areas, including the Gotland Deep, where at depths below
+                  50–60 m a stable halocline separates the water column into an upper oxygenated layer and underlying oxygen-deficient and anoxic/sulfidic
+                  layers (<a id="xref-ref-24-1" class="xref-bibr" href="#ref-24">Lepland &amp; Stevens, 1998</a>; <a id="xref-ref-28-1" class="xref-bibr" href="#ref-28">Neretin <em>et al.</em>, 2003</a>), in which high dark CO<sub>2</sub> fixation rates have been reported (<a id="xref-ref-20-2" class="xref-bibr" href="#ref-20">Jost <em>et al.</em>, 2010</a>).
+               </p>
+               <p id="p-9">In stimulation experiments (<a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Labrenz <em>et al.</em>, 2005</a>; <a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Brettar <em>et al.</em>, 2006</a>), quantitative 16S rRNA PCR (<a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Labrenz <em>et al.</em>, 2004</a>), catalysed reporter deposition–fluorescence <em>in situ</em> hybridization (CARD-FISH; <a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Grote <em>et al.</em>, 2007</a>) and microautoradiography (MICRO)-CARD-FISH (<a id="xref-ref-14-2" class="xref-bibr" href="#ref-14">Grote <em>et al.</em>, 2008</a>) analyses, as well as 16S rRNA stable isotope probing (RNA-SIP; <a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Glaubitz <em>et al.</em>, 2009</a>), the epsilonproteobacterial ‘Uncultured <span class="named-content family" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup was shown to account for up to 30 % of the total cell numbers in pelagic redox zones of the central
+                  Baltic Sea. The abundance of these bacteria highlights the importance of chemolithoautotrophic denitrification, which was
+                  convincingly demonstrated to be the major N-loss process in water columns with a sulfide–nitrate interface (<a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Brettar &amp; Rheinheimer, 1991</a>; <a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Hannig <em>et al.</em>, 2007</a>; <a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Jensen <em>et al.</em>, 2009</a>), catalysed by the GD17 group as potential key organisms for this process. According to its 16S rRNA phylogeny, the ‘Uncultured
+                  <span class="named-content family" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup belongs to the genus <span class="named-content genus" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span><em>,</em> which comprises mesophilic, facultatively anaerobic, chemolithoautotrophic species originating from deep-sea hydrothermal
+                  and marine sulfidic environments (<a id="xref-ref-36-1" class="xref-bibr" href="#ref-36">Takai <em>et al.</em>, 2006</a>). In previous work (<a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>) we described the isolation of strain Gotland Deep 1 (GD1<sup>T</sup>), a close phylogenetic relative (16S rRNA similarity of 95.7 %) and thus representative of the Baltic <span class="named-content genus" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> ‘Uncultured <span class="named-content family" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup. Selected genomic and physiological data suggested an ecological role for GD1<sup>T</sup>, especially with respect to its sulfide detoxification ability (<a id="xref-ref-15-2" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Here, we expand on previous work by presenting the taxonomic characteristics of GD1<sup>T</sup>. Our results form the basis of an emended description of the genus <span class="named-content genus" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>.
+               </p>
+               <p id="p-10">Strain GD1<sup>T</sup> was isolated from a pelagic redox zone of the Gotland Deep in the central Baltic Sea during a research cruise on board the
+                  RV <em>Alkor</em> in May 2005 (57° 19.2′ N 20° 03′ E). Water was collected in a free-flow bottle attached to a CTD-rosette from a depth of
+                  215 m. The <em>in situ</em> temperature was 6 °C, the salinity 13 practical salinity units (PSU), and the sulfide concentration 11 µM. Directly on board,
+                  100 µM KNO<sub>3</sub> and 100 µM Na<sub>2</sub>S<sub>2</sub>O<sub>3</sub> were added to the water samples, which were then incubated in the dark at 10 °C under anoxic conditions. For further isolation
+                  and cultivation in the laboratory, a modified version of artificial brackish water medium (ABW) (<a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Bruns <em>et al.</em>, 2002</a>) was used, consisting of 95 mM NaCl, 11.2 mM MgCl<sub>2</sub> . 6H<sub>2</sub>O, 2.3 mM CaCl<sub>2</sub> . 2H<sub>2</sub>O, 2.0 mM KCl, 6.4 mM Na<sub>2</sub>SO<sub>4</sub>, 192 µM KBr, 92 µM H<sub>3</sub>BO<sub>3</sub>, 34 µM SrCl<sub>2</sub>, 92 µM NH<sub>4</sub>Cl, 9 µM KH<sub>2</sub>PO<sub>4</sub> and 16 µM NaF, buffered with 10 mM HEPES (pH 7.3). For anaerobic cultivation, the medium was boiled, bubbled with N<sub>2</sub> for 30 min, and then autoclaved under anoxic conditions. Subsequently, anoxic and sterile-filtered 0.1 % (v/v) of the trace
+                  element solution SL10 (<a id="xref-ref-39-1" class="xref-bibr" href="#ref-39">Widdel <em>et al.</em>, 1983</a>), 0.2 % (v/v) of a 10-vitamin solution (<a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Balch <em>et al.</em>, 1979</a>), 0.02 % (v/v) of a selenite–tungstate solution (<a id="xref-ref-38-1" class="xref-bibr" href="#ref-38">Widdel &amp; Bak, 1992</a>), and 2–5 mM NaHCO<sub>3</sub> were added. The standard medium ABW+nitrate+thiosulfate (ABW+NS) was prepared by the variable addition of 10 mM KNO<sub>3</sub> and 10 mM Na<sub>2</sub>S<sub>2</sub>O<sub>3</sub>, with the final concentration depending on the experiment. A pure culture was acquired by the dilution to extinction method
+                  and was cryopreserved at −80 °C in glycerol for long-term storage.
+               </p>
+               <p id="p-11">Morphological, physiological, and metabolic characteristics were, for the most part, analysed as described earlier (<a id="xref-ref-15-3" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). For these analyses, strain GD1<sup>T</sup> was cultivated in triplicate for 7–10 days at 15 °C in the dark. Growth was usually measured by counting 4′,6-diamidino-2-phenylindole
+                  (DAPI) stained cells, observed using epifluorescence microscopy, or by flow cytometric determinations of SYBR-Green I (Molecular
+                  Probes) stained cells (<a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Labrenz <em>et al.</em>, 2007</a>) at the end of the experiment. <span class="named-content species" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> DSM 1251<sup>T</sup> was used as the reference strain in the cultivation experiments.
+               </p>
+               <p id="p-12">Isolate GD1<sup>T</sup> is a motile, Gram-reaction-negative, slightly curved or spirilla-shaped bacterium typically with one polar flagellum (<a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1a, b</a>), but in some cases two flagella at opposite poles (<a id="xref-fig-1-2" class="xref-fig" href="#F1">Fig. 1c</a>). Cell width was rather constant (mean = 0.66 µm, <span class="sc">sd</span> = 0.083 µm, <em>n</em> = 112) whereas cell length, i.e. from pole to pole, was variable (mean = 2.1 µm, <span class="sc">sd</span> = 0.54 µm, <em>n</em> = 112). The cells had a positive chemotactic response to nitrate (<a id="xref-ref-15-4" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Under optimal conditions in ABW+NS medium the cell doubling time of strain GD1<sup>T</sup> was 13 h. Cells in older cultures tended to form aggregates. Growth at temperatures in the range of 4–40 °C was investigated,
+                  with highest cell numbers obtained between 4 and 20 °C and optimal growth at 15 °C (<a id="xref-ref-15-5" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Thus, isolate GD1<sup>T</sup> is the first psychrotolerant species within the genus <span class="named-content genus" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, in which all member species at the time of writing are mesophilic (<a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>).
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4141/F1.expansion.html"><img alt="Fig. 1. " src="4141/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4141/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4141/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4141/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-13" class="first-child">Cell morphology of spirilla-shaped cells of strain GD1<sup>T</sup> cultivated on ABW+NS medium. (a) Fluorescence microscopy of 4′,6-diamidino-2-phenylindole (DAPI) stained cells. (b) Transmission
+                        electron microscopy of a bacterium with one flagellum and (c) of a bacterium with two flagella (indicated by arrows), both
+                        negatively stained with phosphotungstic acid.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4141/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4141/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Differential characteristics between strain GD1<sup>T</sup> and species of the genus <span class="named-content genus" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                              href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span></span>
+                     
+                     <p id="p-14" class="first-child">Taxa: 1, <em>Sulfurimonas gotlandica</em> sp. nov. GD1<sup>T</sup>; 2, <span class="named-content species" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                              href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> DSM 1251<sup>T</sup> (data from this study; <a id="xref-ref-37-1" class="xref-bibr" href="#ref-37">Timmer-ten Hoor, 1975</a>; <a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Brinkhoff <em>et al.</em>, 2005</a>); 3, <span class="named-content species" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas paralvinellae"
+                              href="doi:10.1601/nm.10230"><em>Sulfurimonas paralvinellae</em></a></span> GO25<sup>T</sup> (<a id="xref-ref-36-2" class="xref-bibr" href="#ref-36">Takai <em>et al.</em>, 2006</a>); 4, <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                              href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> OK10<sup>T</sup> (<a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Inagaki <em>et al.</em>, 2003</a>). <span class="sc">nd</span>, Not determined; +, positive; −, negative.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-20">To obtain media with different pH values, the pH of a 20 ml subsample from the anoxic ABW+NS was adjusted to pH 6.0, 6.5,
+                  6.7, 6.9, 7.1, 7.5, 8.0, 8.4 and 9.0 by the addition of the appropriate amount of 0.1 M HCl. For the experimental setup, the
+                  corresponding amount of 1 M HCl was added to the media preparations, which were then inoculated. After 14 days of incubation,
+                  the pH was measured. At an initial pH of 6.5–8.4, it remained constant (±0.02) throughout the experiment whereas below and
+                  above this range it decreased by about 0.18–0.25 pH units. Optimal growth occurred over a wide pH range (6.7–8.0) but no growth
+                  occurred at pH 6.0 and 8.4. The NaCl requirement was determined by cultivation in ABW+NS containing the following salt concentrations
+                  [NaCl (g l<sup>−1</sup>)/MgCl<sub>2</sub> . 6H<sub>2</sub>O (g l<sup>−1</sup>)]: 0/0, 0/0.50, 2.50/0.38, 5.00/0.75, 7.50/1.13, 10.00/1.50, 12.50/1.88, 15.00/2.25, 17.50/2.63 and 20.00/3.00. The isolate
+                  had an absolute requirement for NaCl and grew best with between 10 and 20 g NaCl l<sup>−1</sup>; the upper limit for growth was not further determined. No growth was observed in media without added NaCl, in contrast to
+                  <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> DSM 1251<sup>T</sup>, which grew equally well without NaCl and at all NaCl concentrations tested (<a id="xref-table-wrap-1-2" class="xref-table" href="#T1">Table 1</a>).
+               </p>
+               <p id="p-21">To identify the electron donors sustaining chemoautotrophic growth of isolate GD1<sup>T</sup>, ABW medium containing 5 mM nitrate was supplemented with sulfite (1 mM), sulfide (10 µM, 20 µM, 100 µM) or elemental sulfur
+                  (1 mM). Hydrogen utilization was assessed by bubbling ABW+NS with forming gas (N<sub>2</sub>/H<sub>2</sub>, 95 : 5) for several hours prior to inoculation and cultivation. Strain GD1<sup>T</sup> was able to use all of the tested electron donors as an energy source for growth although growth was inhibited by sulfide
+                  concentrations &gt;20 µM (<a id="xref-ref-15-6" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). This observation is in accordance with <em>in situ</em> activities of chemoautotrophic micro-organisms in pelagic Gotland Deep redox zones, where dark CO<sub>2</sub> fixation rates are significantly reduced at environmental sulfide concentrations &gt;20 µM (<a id="xref-ref-20-3" class="xref-bibr" href="#ref-20">Jost <em>et al.</em>, 2010</a>). As electron acceptors, nitrate (100 µM, 2 mM, 5 mM, 10 mM), nitrite (600 µM, 2 mM) (<a id="xref-ref-15-7" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>), manganese(IV) oxide (200 µM), manganese(III) acetate dihydrate (2.4 mM), iron(III) chloride hexahydrate (5 mM), fumarate
+                  (100 µM) and oxygen (4 % saturation, approx. 12 µmol O<sub>2</sub> l<sup>−1</sup>) were tested in ABW containing 5 mM thiosulfate. For the oxygen experiment, the oxygen content in fully oxygenated ABW+thiosulfate
+                  was measured with an optode (POF-PSt3; PreSens) and the appropriate amount of oxygen was then mixed with anoxic ABW+thiosulfate
+                  to achieve the desired amount of saturation. However, only nitrate and nitrite served as electron acceptors during growth
+                  of the bacterium.
+               </p>
+               <p id="p-22">Although the manganese and iron concentrations tested may have been too high and thereby suppressed cell growth, previous
+                  thiosulfate/manganese stimulation experiments with Baltic Sea water samples containing lower metal concentrations similarly
+                  failed to reveal active manganese-reducing species of the genus <span class="named-content genus" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> (<a id="xref-ref-22-2" class="xref-bibr" href="#ref-22">Labrenz <em>et al.</em>, 2005</a>). <span class="named-content species" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                        href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> is likewise unable to reduce ferrihydrite (<a id="xref-ref-17-2" class="xref-bibr" href="#ref-17">Inagaki <em>et al.</em>, 2003</a>), which further supports the lack of direct participation of strain GD1<sup>T</sup> in the Mn/Fe-shuttle (<a id="xref-ref-28-2" class="xref-bibr" href="#ref-28">Neretin <em>et al.</em>, 2003</a>) of Baltic pelagic redox zones. It also cannot be excluded that strain GD1<sup>T</sup> is able to grow in medium with an oxygen concentration below 4 %, given that the genome of this bacterium includes a gene
+                  encoding a putative cbb3-type cytochrome <em>c</em> oxidase with the potential to mediate aerobic respiration (<a id="xref-ref-15-8" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Whether aerobic respiration can occur at very low oxygen concentrations was beyond the scope of our experimental design.
+                  The oxygen sensitivity of strain GD1<sup>T</sup> was examined in detail, using ABW+NS with oxygen saturations of 0.5, 3, 5, 10, 20, 30, 40 and 50 %. Compared to oxygen-free
+                  conditions, oxygen concentrations ≥20 % reduced or inhibited the growth of this strain whereas oxygen concentrations ≤10 %
+                  had no such effect (<a id="xref-ref-15-9" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). Thus, the oxygen tolerance of strain GD1<sup>T</sup> is similar to that of aerobic <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                        href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> OK10<sup>T</sup> (<a id="xref-table-wrap-1-3" class="xref-table" href="#T1">Table 1</a>). Based on our current knowledge, we consider strain GD1<sup>T</sup> to be an aerotolerant representative of the genus <span class="named-content genus" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>.
+               </p>
+               <p id="p-23">Chemolithoautotrophic growth was directly confirmed in ABW+NS containing <sup>14</sup>C-bicarbonate followed by a combination of fluorescence <em>in situ</em> hybridization and microautoradiography (MICRO-CARD-FISH) (<a id="xref-ref-15-10" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>). As electron donor (in ABW+5 mM KNO<sub>3</sub>) alone or as electron donor and sole carbon source (in NaHCO<sub>3</sub>-free ABW+5 mM KNO<sub>3</sub>) the following compounds were tested: (a) glucose (0.1 mM), (b) a mixture of lactate, malate, fumarate, succinate, glycerine
+                  and glucose (abbreviated as mix 4) (100 µM), (c) yeast extract (0.01 mg l<sup>−1</sup>), (d) pyruvate (100 µM), (e) acetate (100 µM), (f) fumarate (100 µM), (g) alcohol mix (butanol, ethanol, methanol, propanol;
+                  100 µM) (<a id="xref-ref-15-11" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>) and (h) an amino acid mix (0.1 mM) consisting of (g l<sup>−1</sup>): β-alanine 0.466, <span class="sc">l</span>-arginine 0.872, <span class="sc">l</span>-asparagine 0.750, <span class="sc">l</span>-cysteine 0.606, <span class="sc">l</span>-glutamine 0.730, <span class="sc">l</span>-glutamic acid 0.736, glycine 0.376, isoleucine 0.656, <span class="sc">l</span>-leucine 0.656, <span class="sc">l</span>-methionine 0.746, <span class="sc">l</span>-phenylalanine 0.826, <span class="sc">l</span>-serine 0.526, <span class="sc">l</span>-threonine 0.596, <span class="sc">l</span>-valine 0.586, <span class="sc">l</span>-proline 0.576, <span class="sc">l</span>-tryptophan 1.022, <span class="sc">l</span>-histidine 0.776, <span class="sc">l</span>-lysine 0.822, <span class="sc">l</span>-tyrosine 0.906 and <span class="sc">l</span>-aspartic acid 0.666.
+               </p>
+               <p id="p-24">In the presence of 2 mM NaHCO<sub>3</sub>, the growth of isolate GD1<sup>T</sup> was promoted with formate, acetate, yeast extract, pyruvate and the amino acid mix as electron donors. However, maximal cell
+                  numbers were usually more than an order of magnitude lower than those reached with thiosulfate/nitrate-containing medium, as shown in
+                  <a id="xref-fig-2-1" class="xref-fig" href="#F2">Fig. 2(a)</a> for pyruvate, which was also used in radiotracer experiments aimed at confirming the capability of strain GD1<sup>T</sup> to use organics as electron donor. In those experiments, CO<sub>2</sub> production was measured following the addition of 16 kBq [2-<sup>14</sup>C]pyruvate (specific activity 0.6 GBq mmol<sup>−1</sup>) to cultures grown solely on pyruvate or on thiosulfate/pyruvate. After 24 h or 72 h of incubation, CO<sub>2</sub> was degassed by the acidification of cell-free medium and trapped in ethanolamine. In nitrate/pyruvate medium, the growth
+                  of strain GD1<sup>T</sup> was accompanied by elevated CO<sub>2</sub> production (<a id="xref-fig-2-2" class="xref-fig" href="#F2">Fig. 2b</a>). The simultaneous incorporation of [2-<sup>14</sup>C]pyruvate into GD1<sup>T</sup> cells was much less pronounced, but its uptake and contribution to biomass production were clearly determined
+                  in thiosulfate/nitrate/pyruvate medium, where total cell numbers were also higher than those reached in thiosulfate/nitrate
+                  medium (<a id="xref-fig-2-3" class="xref-fig" href="#F2">Fig. 2a</a>), but the difference was not statistically significant (unpublished data). By contrast, in NaHCO<sub>3</sub>-free medium strain GD1<sup>T</sup> was unable to use any of the organics offered simultaneously as electron donor and carbon source (<a id="xref-fig-2-4" class="xref-fig" href="#F2">Fig. 2a</a>). It has long been recognized that even heterotrophic bacteria may require CO<sub>2</sub> for growth (<a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Dehority, 1971</a>), e.g. in anaplerotic reactions (<a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Alonso-Sáez <em>et al.</em>, 2010</a>). Similar findings were reported for <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="Nitrobacter hamburgensis"
+                        href="doi:10.1601/nm.1487"><em>Nitrobacter hamburgensis</em></a></span>, which requires atmospheric CO<sub>2</sub> or the addition of sodium carbonate for mixotrophic growth (in the presence of NO<sub>2</sub><sup>−</sup>) on <span class="sc">d</span>-lactate (<a id="xref-ref-33-1" class="xref-bibr" href="#ref-33">Starkenburg <em>et al.</em>, 2008</a>). The authors of that study suggested that CO<sub>2</sub> fixation served as a reductant sink necessary to maintain cellular redox balance. The physiological background for the growth
+                  of isolate GD1<sup>T</sup> on organics is thus far unclear. In other species of the genus <span class="named-content genus" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, organic substance utilization is variable. For example, in a similar experiment <span class="named-content species" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> was able to use formate, fumarate, yeast extract and the alcohol mix as electron donors (<a id="xref-table-wrap-1-4" class="xref-table" href="#T1">Table 1</a>). The ability of this bacterium to oxidize formate was proposed in a genome analysis, which identified a formate dehydrogenase
+                  complex (<a id="xref-ref-31-1" class="xref-bibr" href="#ref-31">Sievert <em>et al.</em>, 2008</a>). Homologues of genes involved in glycolysis and proteolysis are also present in the genome of strain GD1<sup>T</sup> (<a id="xref-ref-15-12" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>), whereas <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                        href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> (<a id="xref-ref-17-3" class="xref-bibr" href="#ref-17">Inagaki <em>et al.</em>, 2003</a>; but tested without bicarbonate supplementation to the organic medium) and <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas paralvinellae"
+                        href="doi:10.1601/nm.10230"><em>Sulfurimonas paralvinellae</em></a></span> (<a id="xref-ref-36-3" class="xref-bibr" href="#ref-36">Takai <em>et al.</em>, 2006</a>) are unable to grow on organic compounds. In conclusion, although under specific circumstances organic compounds enhance
+                  the growth of some species of the genus <span class="named-content genus" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, members of this genus characteristically grow chemolithoautotrophically.
+               </p>
+               <div id="F2" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4141/F2.expansion.html"><img alt="Fig. 2. " src="4141/F2.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4141/F2.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4141/F2.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4141/F2">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 2. </span> 
+                     
+                     <p id="p-25" class="first-child">Impact of pyruvate on the growth of isolate GD1<sup>T</sup>. Error bars indicate the standard deviation of three independent replicates for each assay. (a) Growth on media with different
+                        substrate combinations: 1, NaHCO<sub>3</sub>, S<sub>2</sub>O<sub>3</sub><sup>2−</sup>, NO<sub>3</sub><sup>−</sup>; 2, NaHCO<sub>3</sub>, S<sub>2</sub>O<sub>3</sub><sup>2−</sup>, NO<sub>3</sub><sup>−</sup>, pyruvate; 3, NaHCO<sub>3</sub>, pyruvate; 4, pyruvate; 5, ABW without further supplements. The relative enrichment factor describes the increase of cell
+                        numbers after 7 days of incubation compared to the initial cell numbers after inoculation at day 0 (6.1×10<sup>5</sup> ml<sup>−1</sup>). (b) <sup>14</sup>CO<sub>2</sub> production and [<sup>14</sup>C]pyruvate incorporation after 24 h and 72 h of incubation. Media: 1, NaHCO<sub>3</sub>, S<sub>2</sub>O<sub>3</sub><sup>2−</sup>, NO<sub>3</sub><sup>−</sup>, [<sup>14</sup>C]pyruvate; 2, NaHCO<sub>3</sub>, NO<sub>3</sub><sup>−</sup>, [<sup>14</sup>C]pyruvate. P, pyruvate incorporation; CO<sub>2</sub>, CO<sub>2</sub> production.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-26">Total fatty acids and phospholipid-derived fatty acids were extracted as described by Sasser (1990) and <a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">Boschker (2004)</a>, respectively, and analysed by gas chromatography with a flame-ionization detector on a non-polar HP-5ms column (Agilent).
+                  The dominant cellular fatty acid of strain GD1<sup>T</sup> was 16 : 1ω7<em>c</em>, with 3-OH 14 : 0, 16 : 0, 16 : 1ω5<em>c</em>+<em>t</em>, and 18 : 1ω7<em>c</em> detected in lower amounts. This fatty acid profile is comparable to those of other species of the genus <span class="named-content genus" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> but most similar to that of <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> (<a id="xref-table-wrap-1-5" class="xref-table" href="#T1">Table 1</a>). This may reflect the fact that strain GD1<sup>T</sup> and <span class="named-content species" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas denitrificans"
+                        href="doi:10.1601/nm.9790"><em>Sulfurimonas denitrificans</em></a></span> were cultivated on ABW+NS under identical conditions. However, a high percentage of C16 : 0 and one or both of the monounsaturated
+                  C16 and C18 fatty acids has also been described in other members of the class <span class="named-content class" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                        href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span>, such as <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="Nitratifractor salsuginis"
+                        href="doi:10.1601/nm.9373"><em>Nitratifractor salsuginis</em></a></span> and <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="Sulfurovum lithotrophicum"
+                        href="doi:10.1601/nm.8874"><em>Sulfurovum lithotrophicum</em></a></span> (<a id="xref-ref-34-1" class="xref-bibr" href="#ref-34">Suzuki <em>et al.</em>, 2005</a>). Accordingly, this combination may be a general characteristic of these epsilonproteobacteria.
+               </p>
+               <p id="p-27">The DNA guanine-plus-cytosine (G+C) content of strain GD1<sup>T</sup> was determined to be 33.6 mol%, as calculated by analysis of the whole genome (<a id="xref-ref-15-13" class="xref-bibr" href="#ref-15">Grote <em>et al.</em>, 2012</a>).
+               </p>
+               <p id="p-28">To establish the closest relatives of strain GD1<sup>T</sup> based on 16S rRNA sequencing, preliminary searches in the EMBL Data Library were performed with the program <span class="sc">fasta</span> (<a id="xref-ref-29-1" class="xref-bibr" href="#ref-29">Pearson &amp; Lipman, 1988</a>). Closely related sequences were retrieved from GenBank and aligned and analysed with the newly determined sequence, within
+                  the program <span class="sc">arb</span> (<a id="xref-ref-25-1" class="xref-bibr" href="#ref-25">Ludwig <em>et al.</em>, 2004</a>). Sequences for analysis were reduced to unambiguously alignable positions using group-specific filters. For phylogenetic
+                  analyses, three different trees were calculated using the neighbour-joining, parsimony and maximum-likelihood (Phyml) algorithms
+                  based on nearly full-length 16S rRNA sequences (approx. 1400 bp). For neighbour-joining, the Jukes–Cantor correction was applied.
+                  Shorter sequences were gradually inserted into the reconstructed tree without changing the topology. Sequence searches of
+                  the EMBL database (latest: 2013-05-14) revealed that our isolate is related to the epsilon class of the phylum <span class="named-content phylum" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="Proteobacteria"
+                        href="doi:10.1601/nm.808"><em>Proteobacteria</em></a></span> (data not shown). In a pairwise analysis, it displayed highest (93.7–94.2 %) 16S rRNA gene sequence similarity to species
+                  of the genus <span class="named-content genus" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> and to the Baltic ‘Uncultured <span class="named-content family" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup (95.7 %). Lower levels of relatedness (≤91 % sequence similarity) were determined for the other examined
+                  species belonging to the epsilon class of the phylum <span class="named-content phylum" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="Proteobacteria"
+                        href="doi:10.1601/nm.808"><em>Proteobacteria</em></a></span>.
+               </p>
+               <p id="p-29">An unrooted tree reconstructed using the neighbour-joining method showed the phylogenetic position of the novel bacterium,
+                  strain GD1<sup>T</sup>, amongst the members of the class <span class="named-content class" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                        href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span> (<a id="xref-fig-3-1" class="xref-fig" href="#F3">Fig. 3</a>). Treeing analyses confirmed it to be a member of the genus <span class="named-content genus" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>, forming a stable cluster with the ‘Uncultured <span class="named-content family" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="Helicobacteraceae"
+                        href="doi:10.1601/nm.3831"><em>Helicobacteraceae</em></a></span> G138eps1/GD17’ subgroup. This cluster is specifically detected by the SUL90 16S rRNA gene probe, originally developed to
+                  be 100 % complementary to the G138eps1/GD17 target site (<a id="xref-ref-13-2" class="xref-bibr" href="#ref-13">Grote <em>et al.</em>, 2007</a>).
+               </p>
+               <div id="F3" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4141/F3.expansion.html"><img alt="Fig. 3. " src="4141/F3.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4141/F3.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4141/F3.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4141/F3">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 3. </span> 
+                     
+                     <p id="p-30" class="first-child">Unrooted tree showing phylogenetic relationships of isolate GD1<sup>T</sup> and closely related members of the class <span class="named-content class" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="Epsilonproteobacteria"
+                              href="doi:10.1601/nm.3783"><em>Epsilonproteobacteria</em></a></span>. The tree was reconstructed using the neighbour-joining method and was based on a comparison of approximately 1400 nt. Solid
+                        squares indicate that the corresponding nodes (or groups) were recovered in neighbour-joining, maximum-parsimony and maximum-likelihood
+                        methods. Branching points supported by two algorithms are marked by an open square. The following strains were used as an
+                        outgroup (not shown): <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name"
+                              title="Antarctobacter heliothermus"
+                              href="doi:10.1601/nm.1057"><em>Antarctobacter heliothermus</em></a></span> EL-219<sup>T</sup>, <span class="named-content species" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Sagittula stellata"
+                              href="doi:10.1601/nm.1149"><em>Sagittula stellata</em></a></span> E-37<sup>T</sup>, <span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="Roseovarius tolerans"
+                              href="doi:10.1601/nm.1140"><em>Roseovarius tolerans</em></a></span> EL-172<sup>T</sup>, <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="Roseovarius nubinhibens"
+                              href="doi:10.1601/nm.1141"><em>Roseovarius nubinhibens</em></a></span> ISM<sup>T</sup> and <span class="named-content species" id="named-content-50"><a class="namesforlife" rel="namesforlife-name" title="Roseovarius mucosus"
+                              href="doi:10.1601/nm.9734"><em>Roseovarius mucosus</em></a></span> DFL-24<sup>T</sup>. Bar, 1 substitution per 10 nt.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-31">There is no precise correlation between percentage 16S rRNA sequence divergence and species delineation, but it is generally
+                  recognized that divergence values ≥3 % are significant (<a id="xref-ref-32-1" class="xref-bibr" href="#ref-32">Stackebrandt &amp; Goebel, 1994</a>). However, it is pertinent to note that the phylogenetic separateness of strain GD1<sup>T</sup> is strongly supported by phenotypic considerations. For instance, this novel bacterium is distinguishable from other species
+                  of the genus <span class="named-content genus" id="named-content-51"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span> by its psychrotolerance and energy metabolism (<a id="xref-table-wrap-1-6" class="xref-table" href="#T1">Table 1</a>). Additional characteristics useful in differentiating Baltic isolate GD1<sup>T</sup> from related organisms are shown in <a id="xref-table-wrap-1-7" class="xref-table" href="#T1">Table 1</a>. Based on phenotypic and genetic evidence, we propose the classification of strain GD1<sup>T</sup> as a representative of a novel species of the genus <span class="named-content genus" id="named-content-52"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                        href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span>: <em>Sulfurimonas gotlandica</em> sp. nov.
+               </p>
+               <div class="section" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  
+                  <div id="sec-2" class="subsection">
+                     
+                     <h3>Emended description of the genus <span class="named-content genus" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas"
+                              href="doi:10.1601/nm.3856"><em>Sulfurimonas</em></a></span></h3>
+                     
+                     <p id="p-32">The description is based on that by <a id="xref-ref-36-4" class="xref-bibr" href="#ref-36">Takai <em>et al.</em> (2006)</a>. Cells are Gram-negative and morphologically variable. Straight to slightly short rods, elongated rods and spiral in different
+                        growth phases and under different growth conditions. Psychrotolerant to mesophilic and aerotolerant to facultatively anaerobic.
+                        Do not always require NaCl for growth. Optimal growth occurs chemolithoautotrophically with sulfide, S<sup>0</sup>, thiosulfate and H<sub>2</sub> as electron donors, and with nitrate, nitrite and O<sub>2</sub> as electron acceptors, using CO<sub>2</sub> as a carbon source. Supplementation of bicarbonate can enable growth on organic substances, but yields much lower cell numbers
+                        compared to growth on reduced sulfur or hydrogen. Potential ecological niches are deep-sea hydrothermal environments and benthic
+                        or pelagic marine to brackish transition zones from oxic to anoxic/sulfidic environments. The type species is <span class="named-content species" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="Sulfurimonas autotrophica"
+                              href="doi:10.1601/nm.3857"><em>Sulfurimonas autotrophica</em></a></span> (<a id="xref-ref-17-4" class="xref-bibr" href="#ref-17">Inagaki <em>et al.</em> 2003</a>).
+                     </p>
+                     
+                  </div>
+                  <div id="sec-3" class="subsection">
+                     
+                     <h3>Description of <em>Sulfurimonas gotlandica</em> sp. nov.
+                     </h3>
+                     
+                     <p id="p-33"><em>Sulfurimonas</em> <em>gotlandica</em> (got.lan′di.ca. N.L. fem. adj. <em>gotlandica</em> pertaining to the Gotland Deep, the basin in the central Baltic Sea from which the organism was first isolated).
+                     </p>
+                     
+                     <p id="p-34">Gram-negative, slightly curved or spirilla-shaped cells. Motile by one polar flagellum or two flagella at opposite poles.
+                        Cells exhibit a positive chemotactic response to nitrate. Cell sizes are 0.66±0.083×2.1±0.54 µm. Cells have a tendency to
+                        aggregate at older stages. Psychro- and aerotolerant. The temperature range for growth is 4–20 °C. Optimal growth occurs at
+                        15 °C and pH 6.7–8.0. The cells have an absolute requirement for NaCl. Chemolithoautotrophic growth occurs with H<sub>2</sub>, HS<sup>−</sup>, S<sup>0</sup> and thiosulfate. Supplementation of bicarbonate can enable growth on formate, acetate, yeast extract, pyruvate or amino acid
+                        mix, but yields much lower cell numbers compared with growth on reduced sulfur or hydrogen. Sulfide concentrations of more
+                        than 20 µM inhibit growth, but up to 10 % of oxygen in the medium does not influence it. Dominant cellular fatty acid is 16 : 1ω7<em>c</em>, with 14 : 0, 16 : 0, 16 : 1ω5<em>c</em>+<em>t</em>, and 18 : 1ω7<em>c</em> present in smaller amounts.
+                     </p>
+                     
+                     <p id="p-35">The type strain is GD1<sup>T</sup> ( = DSM 19862<sup>T</sup> = JCM 16533<sup>T</sup>), isolated from water of a pelagic redox zone of the central Baltic Sea. The G+C content of the type strain is 33.6 mol%.
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-36">We thank the captain and the crew of the RV <em>Alkor</em>. We gratefully acknowledge the skilful technical assistance of Bärbel Buuk. Michael Hannig helped during the isolation procedure.
+                     We thank the Deutsche Forschungsgemeinschaft (DFG) for grants LA 1466/4-1 and LA 1466/4-2.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.1"
+                             data-doi="10.1038/ismej.2010.69">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alonso-Sáez</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Galand</span>,  <span class="cit-name-given-names">P. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Casamayor</span>,  <span class="cit-name-given-names">E. O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pedrós-Alió</span>,  <span class="cit-name-given-names">C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bertilsson</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">High bicarbonate assimilation in the dark by Arctic bacteria</span>. <abbr class="cit-jnl-abbrev">ISME J</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">1581</span>–<span class="cit-lpage">1590</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/ismej.2010.69</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20555365</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/ismej.2010.69&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20555365&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=High%20bicarbonate%20assimilation%20in%20the%20dark%20by%20Arctic%20bacteria&amp;author=L.%20Alonso-S%C3%A1ez&amp;author=P.%20E.%20Galand&amp;author=E.%20O.%20Casamayor&amp;author=C.%20Pedr%C3%B3s-Ali%C3%B3&amp;author=S.%20Bertilsson&amp;publication_year=2010&amp;journal=ISME%20J&amp;volume=4&amp;pages=1581-1590&amp;doi=10.1038%2Fismej.2010.69&amp;pmid=20555365">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.2"
+                             data-doi="10.1080/713851165">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Balch</span>,  <span class="cit-name-given-names">W. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fox</span>,  <span class="cit-name-given-names">G. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Magrum</span>,  <span class="cit-name-given-names">L. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Woese</span>,  <span class="cit-name-given-names">C. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wolfe</span>,  <span class="cit-name-given-names">R. S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1979</span><strong>).</strong> <span class="cit-article-title">Methanogens: reevaluation of a unique biological group</span>. <abbr class="cit-jnl-abbrev">Microbiol Rev</abbr> <span class="cit-vol">43</span>, <span class="cit-fpage">260</span>–<span class="cit-lpage">296</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>390357</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=mmbr&amp;resid=43/2/260"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4141.3">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Kowalchuk</span>,  <span class="cit-name-given-names">G. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">de Bruijn</span>,  <span class="cit-name-given-names">F. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Head</span>,  <span class="cit-name-given-names">I. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Akkermans</span>,  <span class="cit-name-given-names">A. D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">van Elsas</span>,  <span class="cit-name-given-names">J. D.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Boschker</span>,  <span class="cit-name-given-names">H. T. S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Linking microbial community structure and functioning: stable isotope (13C) labeling in combination with PLFA analysis</span>. <em>In</em> <span class="cit-source">Molecular Microbial Ecology Manual II</span>, pp. <span class="cit-fpage">1673</span>–<span class="cit-lpage">1688</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Kowalchuk</span>,  <span class="cit-name-given-names">G. A.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">de Bruijn</span>,  <span class="cit-name-given-names">F. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Head</span>,  <span class="cit-name-given-names">I. M.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Akkermans</span>,  <span class="cit-name-given-names">A. D.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">van Elsas</span>,  <span class="cit-name-given-names">J. D.</span></span>
+                                 . <span class="cit-publ-loc">Dordrecht</span>: <span class="cit-publ-name">Kluwer Academic Publishers</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Linking%20microbial%20community%20structure%20and%20functioning%3A%20stable%20isotope%20%2813C%29%20labeling%20in%20combination%20with%20PLFA%20analysis&amp;author=H.%20T.%20S.%20Boschker&amp;publication_year=2004&amp;citation_inbook_title=Molecular%20Microbial%20Ecology%20Manual%20II">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.4"
+                             data-doi="10.3354/meps077157">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brettar</span>,  <span class="cit-name-given-names">I.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rheinheimer</span>,  <span class="cit-name-given-names">G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1991</span><strong>).</strong> <span class="cit-article-title">Denitrification in the central Baltic: evidence for H<sub>2</sub>S-oxidation as motor of denitrification at the oxic-anoxic interface</span>. <abbr class="cit-jnl-abbrev">Mar Ecol Prog Ser</abbr> <span class="cit-vol">77</span>, <span class="cit-fpage">157</span>–<span class="cit-lpage">169</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.3354/meps077157</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.3354/meps077157&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Denitrification%20in%20the%20central%20Baltic%3A%20evidence%20for%20H2S-oxidation%20as%20motor%20of%20denitrification%20at%20the%20oxic-anoxic%20interface&amp;author=I.%20Brettar&amp;author=G.%20Rheinheimer&amp;publication_year=1991&amp;journal=Mar%20Ecol%20Prog%20Ser&amp;volume=77&amp;pages=157-169&amp;doi=10.3354%2Fmeps077157">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.5"
+                             data-doi="10.1128/AEM.72.2.1364-1372.2006">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brettar</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Flavier</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bötel</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuosa</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Christen</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Höfle</span>,  <span class="cit-name-given-names">M. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">Identification of a <em>Thiomicrospira denitrificans</em>-like epsilonproteobacterium as a catalyst for autotrophic denitrification in the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">72</span>, <span class="cit-fpage">1364</span>–<span class="cit-lpage">1372</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.72.2.1364-1372.2006</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16461688</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=72/2/1364"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4141.6">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Staley</span>,  <span class="cit-name-given-names">J. T.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuever</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Muyzer</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jannasch</span>,  <span class="cit-name-given-names">H. W.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Genus VI. Thiomicrospira</span>. <em>In</em> <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, part B, pp. <span class="cit-fpage">193</span>–<span class="cit-lpage">199</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Staley</span>,  <span class="cit-name-given-names">J. T.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20VI.%20Thiomicrospira&amp;author=T.%20Brinkhoff&amp;author=J.%20Kuever&amp;author=G.%20Muyzer&amp;author=H.%20W.%20Jannasch&amp;publication_year=2005&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.7"
+                             data-doi="10.1128/AEM.68.8.3978-3987.2002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bruns</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cypionka</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Overmann</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title">Cyclic AMP and acyl homoserine lactones increase the cultivation efficiency of heterotrophic bacteria from the central Baltic
+                                    Sea</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">68</span>, <span class="cit-fpage">3978</span>–<span class="cit-lpage">3987</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.68.8.3978-3987.2002</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>12147499</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=68/8/3978"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.8"
+                             data-doi="10.1038/nrmicro1414">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Campbell</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Engel</span>,  <span class="cit-name-given-names">A. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Porter</span>,  <span class="cit-name-given-names">M. L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">The versatile epsilon-proteobacteria: key players in sulphidic habitats</span>. <abbr class="cit-jnl-abbrev">Nat Rev Microbiol</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">458</span>–<span class="cit-lpage">468</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/nrmicro1414</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16652138</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/nrmicro1414&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=16652138&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20versatile%20epsilon-proteobacteria%3A%20key%20players%20in%20sulphidic%20habitats&amp;author=B.%20J.%20Campbell&amp;author=A.%20S.%20Engel&amp;author=M.%20L.%20Porter&amp;author=K.%20Takai&amp;publication_year=2006&amp;journal=Nat%20Rev%20Microbiol&amp;volume=4&amp;pages=458-468&amp;doi=10.1038%2Fnrmicro1414&amp;pmid=16652138">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.9">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dehority</span>,  <span class="cit-name-given-names">B. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1971</span><strong>).</strong> <span class="cit-article-title">Carbon dioxide requirement of various species of rumen bacteria</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">105</span>, <span class="cit-fpage">70</span>–<span class="cit-lpage">76</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>5541030</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=105/1/70"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.10"
+                             data-doi="10.1016/j.femsec.2004.07.004">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Engel</span>,  <span class="cit-name-given-names">A. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Porter</span>,  <span class="cit-name-given-names">M. L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stern</span>,  <span class="cit-name-given-names">L. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Quinlan</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bennett</span>,  <span class="cit-name-given-names">P. C.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Bacterial diversity and ecosystem function of filamentous microbial mats from aphotic (cave) sulfidic springs dominated by
+                                    chemolithoautotrophic “<em>Epsilonproteobacteria</em>”</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Ecol</abbr> <span class="cit-vol">51</span>, <span class="cit-fpage">31</span>–<span class="cit-lpage">53</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.femsec.2004.07.004</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16329854</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.femsec.2004.07.004&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=16329854&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Bacterial%20diversity%20and%20ecosystem%20function%20of%20filamentous%20microbial%20mats%20from%20aphotic%20%28cave%29%20sulfidic%20springs%20dominated%20by%20chemolithoautotrophic%20%E2%80%9CEpsilonproteobacteria%E2%80%9D&amp;author=A.%20S.%20Engel&amp;author=M.%20L.%20Porter&amp;author=L.%20A.%20Stern&amp;author=S.%20Quinlan&amp;author=P.%20C.%20Bennett&amp;publication_year=2004&amp;journal=FEMS%20Microbiol%20Ecol&amp;volume=51&amp;pages=31-53&amp;doi=10.1016%2Fj.femsec.2004.07.004&amp;pmid=16329854">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.11"
+                             data-doi="10.1111/j.1462-2920.2008.01770.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Glaubitz</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lueders</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Abraham</span>,  <span class="cit-name-given-names">W.-R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title"><sup>13</sup>C-isotope analyses reveal that chemolithoautotrophic <em>Gamma</em>- and <em>Epsilonproteobacteria</em> feed a microbial food web in a pelagic redoxcline of the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Environ Microbiol</abbr> <span class="cit-vol">11</span>, <span class="cit-fpage">326</span>–<span class="cit-lpage">337</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1462-2920.2008.01770.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18793316</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1462-2920.2008.01770.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=18793316&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=13C-isotope%20analyses%20reveal%20that%20chemolithoautotrophic%20Gamma-%20and%20Epsilonproteobacteria%20feed%20a%20microbial%20food%20web%20in%20a%20pelagic%20redoxcline%20of%20the%20central%20Baltic%20Sea&amp;author=S.%20Glaubitz&amp;author=T.%20Lueders&amp;author=W.-R.%20Abraham&amp;author=G.%20Jost&amp;author=K.%20J%C3%BCrgens&amp;author=M.%20Labrenz&amp;publication_year=2009&amp;journal=Environ%20Microbiol&amp;volume=11&amp;pages=326-337&amp;doi=10.1111%2Fj.1462-2920.2008.01770.x&amp;pmid=18793316">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.12"
+                             data-doi="10.1111/j.1574-6941.2010.00944.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Glaubitz</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Diversity of active chemolithoautotrophic prokaryotes in the sulfidic zone of a Black Sea pelagic redoxcline as determined
+                                    by rRNA-based stable isotope probing</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Ecol</abbr> <span class="cit-vol">74</span>, <span class="cit-fpage">32</span>–<span class="cit-lpage">41</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6941.2010.00944.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20649907</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=femsec&amp;resid=74/1/32"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.13"
+                             data-doi="10.1128/AEM.00466-07">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grote</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pfeiffer</span>,  <span class="cit-name-given-names">B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Quantitative distributions of <em>Epsilonproteobacteria</em> and a <em>Sulfurimonas</em> subgroup in pelagic redoxclines of the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">73</span>, <span class="cit-fpage">7155</span>–<span class="cit-lpage">7161</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.00466-07</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17921285</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=73/22/7155"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.14"
+                             data-doi="10.1128/AEM.01186-08">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grote</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Herndl</span>,  <span class="cit-name-given-names">G. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><em>Epsilonproteobacteria</em> represent the major portion of chemoautotrophic bacteria in sulfidic waters of pelagic redoxclines of the Baltic and Black
+                                    Seas</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">74</span>, <span class="cit-fpage">7546</span>–<span class="cit-lpage">7551</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.01186-08</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18952879</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=74/24/7546"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.15"
+                             data-doi="10.1073/pnas.1111262109">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grote</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schott</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bruckner</span>,  <span class="cit-name-given-names">C. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Glöckner</span>,  <span class="cit-name-given-names">F. O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Teeling</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Genome and physiology of a model Epsilonproteobacterium responsible for sulfide detoxification in marine oxygen depletion
+                                    zones</span>. <abbr class="cit-jnl-abbrev">Proc Natl Acad Sci U S A</abbr> <span class="cit-vol">109</span>, <span class="cit-fpage">506</span>–<span class="cit-lpage">510</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1073/pnas.1111262109</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22203982</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=pnas&amp;resid=109/2/506"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.16"
+                             data-doi="10.4319/lo.2007.52.4.1336">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hannig</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lavik</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuypers</span>,  <span class="cit-name-given-names">M. M. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Woebken</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens-Habbena</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Shift from denitrification to anammox after inflow events in the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Limnol Oceanogr</abbr> <span class="cit-vol">52</span>, <span class="cit-fpage">1336</span>–<span class="cit-lpage">1345</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.4319/lo.2007.52.4.1336</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.4319/lo.2007.52.4.1336&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Shift%20from%20denitrification%20to%20anammox%20after%20inflow%20events%20in%20the%20central%20Baltic%20Sea&amp;author=M.%20Hannig&amp;author=G.%20Lavik&amp;author=M.%20M.%20M.%20Kuypers&amp;author=D.%20Woebken&amp;author=W.%20Martens-Habbena&amp;author=K.%20J%C3%BCrgens&amp;publication_year=2007&amp;journal=Limnol%20Oceanogr&amp;volume=52&amp;pages=1336-1345&amp;doi=10.4319%2Flo.2007.52.4.1336">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.17"
+                             data-doi="10.1099/ijs.0.02682-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Inagaki</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kobayashi</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nealson</span>,  <span class="cit-name-given-names">K. H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Horikoshi</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title"><em>Sulfurimonas autotrophica</em> gen. nov., sp. nov., a novel sulfur-oxidizing ϵ-proteobacterium isolated from hydrothermal sediments in the Mid-Okinawa Trough</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">53</span>, <span class="cit-fpage">1801</span>–<span class="cit-lpage">1805</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.02682-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14657107</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=53/6/1801"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.18"
+                             data-doi="10.1016/j.marchem.2009.01.002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jensen</span>,  <span class="cit-name-given-names">M. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Petersen</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dalsgaard</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thamdrup</span>,  <span class="cit-name-given-names">B.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Pathways, rates, and regulation of N<sub>2</sub> production in the chemocline of an anoxic basin, Mariager Fjord, Denmark</span>. <abbr class="cit-jnl-abbrev">Mar Chem</abbr> <span class="cit-vol">113</span>, <span class="cit-fpage">102</span>–<span class="cit-lpage">113</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.marchem.2009.01.002</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.marchem.2009.01.002&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Pathways%2C%20rates%2C%20and%20regulation%20of%20N2%20production%20in%20the%20chemocline%20of%20an%20anoxic%20basin%2C%20Mariager%20Fjord%2C%20Denmark&amp;author=M.%20M.%20Jensen&amp;author=J.%20Petersen&amp;author=T.%20Dalsgaard&amp;author=B.%20Thamdrup&amp;publication_year=2009&amp;journal=Mar%20Chem&amp;volume=113&amp;pages=102-113&amp;doi=10.1016%2Fj.marchem.2009.01.002">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-journal no-rev-xref" id="cit-63.Pt_11.4141.19"
+                             data-doi="10.4319/lo.2008.53.1.0014">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zubkov</span>,  <span class="cit-name-given-names">M. V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yakushev</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">High abundance and dark CO<sub>2</sub> fixation of chemolithoautotrophic prokaryotes in anoxic waters of the Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Limnol Oceanogr</abbr> <span class="cit-vol">53</span>, <span class="cit-fpage">14</span>–<span class="cit-lpage">22</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.4319/lo.2008.53.1.0014</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.4319/lo.2008.53.1.0014&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=High%20abundance%20and%20dark%20CO2%20fixation%20of%20chemolithoautotrophic%20prokaryotes%20in%20anoxic%20waters%20of%20the%20Baltic%20Sea&amp;author=G.%20Jost&amp;author=M.%20V.%20Zubkov&amp;author=E.%20Yakushev&amp;author=M.%20Labrenz&amp;author=K.%20J%C3%BCrgens&amp;publication_year=2008&amp;journal=Limnol%20Oceanogr&amp;volume=53&amp;pages=14-22&amp;doi=10.4319%2Flo.2008.53.1.0014">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.20"
+                             data-doi="10.1111/j.1574-6941.2009.00798.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens-Habbena</span>,  <span class="cit-name-given-names">W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pollehne</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schnetger</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Anaerobic sulfur oxidation in the absence of nitrate dominates microbial chemoautotrophy beneath the pelagic chemocline of
+                                    the eastern Gotland Basin, Baltic Sea</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Ecol</abbr> <span class="cit-vol">71</span>, <span class="cit-fpage">226</span>–<span class="cit-lpage">236</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6941.2009.00798.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19925634</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1574-6941.2009.00798.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=19925634&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Anaerobic%20sulfur%20oxidation%20in%20the%20absence%20of%20nitrate%20dominates%20microbial%20chemoautotrophy%20beneath%20the%20pelagic%20chemocline%20of%20the%20eastern%20Gotland%20Basin%2C%20Baltic%20Sea&amp;author=G.%20Jost&amp;author=W.%20Martens-Habbena&amp;author=F.%20Pollehne&amp;author=B.%20Schnetger&amp;author=M.%20Labrenz&amp;publication_year=2010&amp;journal=FEMS%20Microbiol%20Ecol&amp;volume=71&amp;pages=226-236&amp;doi=10.1111%2Fj.1574-6941.2009.00798.x&amp;pmid=19925634">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.21"
+                             data-doi="10.1128/AEM.70.8.4971-4979.2004">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brettar</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Christen</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Flavier</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bötel</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Höfle</span>,  <span class="cit-name-given-names">M. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Development and application of a real-time PCR approach for quantification of uncultured bacteria in the central Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">70</span>, <span class="cit-fpage">4971</span>–<span class="cit-lpage">4979</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.70.8.4971-4979.2004</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15294837</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=70/8/4971"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.22"
+                             data-doi="10.1128/AEM.71.11.6664-6672.2005">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pohl</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Beckmann</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens-Habbena</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Impact of different <em>in vitro</em> electron donor/acceptor conditions on potential chemolithoautotrophic communities from marine pelagic redoxclines</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">71</span>, <span class="cit-fpage">6664</span>–<span class="cit-lpage">6672</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.71.11.6664-6672.2005</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16269695</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=71/11/6664"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.23"
+                             data-doi="10.3354/ame046177">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Labrenz</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jürgens</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Distribution of abundant prokaryotic organisms in the water column of the central Baltic Sea with an oxic-anoxic interface</span>. <abbr class="cit-jnl-abbrev">Aquat Microb Ecol</abbr> <span class="cit-vol">46</span>, <span class="cit-fpage">177</span>–<span class="cit-lpage">190</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.3354/ame046177</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.3354/ame046177&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Distribution%20of%20abundant%20prokaryotic%20organisms%20in%20the%20water%20column%20of%20the%20central%20Baltic%20Sea%20with%20an%20oxic-anoxic%20interface&amp;author=M.%20Labrenz&amp;author=G.%20Jost&amp;author=K.%20J%C3%BCrgens&amp;publication_year=2007&amp;journal=Aquat%20Microb%20Ecol&amp;volume=46&amp;pages=177-190&amp;doi=10.3354%2Fame046177">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-24-1" title="View reference  in text"
+                           id="ref-24">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.24"
+                             data-doi="10.1016/S0025-3227(98)00046-2">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lepland</span>,  <span class="cit-name-given-names">A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stevens</span>,  <span class="cit-name-given-names">R. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1998</span><strong>).</strong> <span class="cit-article-title">Manganese authigenesis in the Landsort Deep, Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Mar Geol</abbr> <span class="cit-vol">151</span>, <span class="cit-fpage">1</span>–<span class="cit-lpage">25</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0025-3227(98)00046-2</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0025-3227(98)00046-2&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Manganese%20authigenesis%20in%20the%20Landsort%20Deep%2C%20Baltic%20Sea&amp;author=A.%20Lepland&amp;author=R.%20L.%20Stevens&amp;publication_year=1998&amp;journal=Mar%20Geol&amp;volume=151&amp;pages=1-25&amp;doi=10.1016%2FS0025-3227%2898%2900046-2">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-25-1" title="View reference  in text"
+                           id="ref-25">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.25"
+                             data-doi="10.1093/nar/gkh293">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ludwig</span>,  <span class="cit-name-given-names">W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Strunk</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Westram</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Richter</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Meier</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yadhukumar</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Buchner</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lai</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Steppi</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title"><span class="sc">arb</span>: a software environment for sequence data</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">32</span>, <span class="cit-fpage">1363</span>–<span class="cit-lpage">1371</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkh293</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14985472</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=32/4/1363"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-26-1" title="View reference  in text"
+                           id="ref-26">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.26"
+                             data-doi="10.1111/j.1574-6941.2008.00502.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nakagawa</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Deep-sea vent chemoautotrophs: diversity, biochemistry and ecological significance</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Ecol</abbr> <span class="cit-vol">65</span>, <span class="cit-fpage">1</span>–<span class="cit-lpage">14</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6941.2008.00502.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18503548</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=femsec&amp;resid=65/1/1"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-27-1" title="View reference  in text"
+                           id="ref-27">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.27"
+                             data-doi="10.1111/j.1462-2920.2005.00856.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nakagawa</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Inagaki</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hirayama</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nunoura</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Horikoshi</span>,  <span class="cit-name-given-names">K.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sako</span>,  <span class="cit-name-given-names">Y.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Distribution, phylogenetic diversity and physiological characteristics of epsilon-<em>Proteobacteria</em> in a deep-sea hydrothermal field</span>. <abbr class="cit-jnl-abbrev">Environ Microbiol</abbr> <span class="cit-vol">7</span>, <span class="cit-fpage">1619</span>–<span class="cit-lpage">1632</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1462-2920.2005.00856.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16156735</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1462-2920.2005.00856.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=16156735&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Distribution%2C%20phylogenetic%20diversity%20and%20physiological%20characteristics%20of%20epsilon-Proteobacteria%20in%20a%20deep-sea%20hydrothermal%20field&amp;author=S.%20Nakagawa&amp;author=K.%20Takai&amp;author=F.%20Inagaki&amp;author=H.%20Hirayama&amp;author=T.%20Nunoura&amp;author=K.%20Horikoshi&amp;author=Y.%20Sako&amp;publication_year=2005&amp;journal=Environ%20Microbiol&amp;volume=7&amp;pages=1619-1632&amp;doi=10.1111%2Fj.1462-2920.2005.00856.x&amp;pmid=16156735">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-28-1" title="View reference  in text"
+                           id="ref-28">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.28"
+                             data-doi="10.1016/S0304-4203(03)00048-3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Neretin</span>,  <span class="cit-name-given-names">L. N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pohl</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jost</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Leipe</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pollehne</span>,  <span class="cit-name-given-names">F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title">Manganese cycling in the Gotland Deep, Baltic Sea</span>. <abbr class="cit-jnl-abbrev">Mar Chem</abbr> <span class="cit-vol">82</span>, <span class="cit-fpage">125</span>–<span class="cit-lpage">143</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0304-4203(03)00048-3</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0304-4203(03)00048-3&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Manganese%20cycling%20in%20the%20Gotland%20Deep%2C%20Baltic%20Sea&amp;author=L.%20N.%20Neretin&amp;author=C.%20Pohl&amp;author=G.%20Jost&amp;author=T.%20Leipe&amp;author=F.%20Pollehne&amp;publication_year=2003&amp;journal=Mar%20Chem&amp;volume=82&amp;pages=125-143&amp;doi=10.1016%2FS0304-4203%2803%2900048-3">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-29-1" title="View reference  in text"
+                           id="ref-29">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.29"
+                             data-doi="10.1073/pnas.85.8.2444">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pearson</span>,  <span class="cit-name-given-names">W. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lipman</span>,  <span class="cit-name-given-names">D. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1988</span><strong>).</strong> <span class="cit-article-title">Improved tools for biological sequence comparison</span>. <abbr class="cit-jnl-abbrev">Proc Natl Acad Sci U S A</abbr> <span class="cit-vol">85</span>, <span class="cit-fpage">2444</span>–<span class="cit-lpage">2448</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1073/pnas.85.8.2444</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>3162770</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=pnas&amp;resid=85/8/2444"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-book no-rev-xref" id="cit-63.Pt_11.4141.30">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sasser</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1990</span><strong>).</strong> <span class="cit-source">Identification of bacteria by gas chromatography of cellular fatty acids</span>, MIDI Technical Note 101. <span class="cit-publ-loc">Newark, DE</span>: <span class="cit-publ-name">Microbial ID</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Identification%20of%20bacteria%20by%20gas%20chromatography%20of%20cellular%20fatty%20acids&amp;author=M.%20Sasser&amp;publication_year=1990">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-31-1" title="View reference  in text"
+                           id="ref-31">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.31"
+                             data-doi="10.1128/AEM.01844-07">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sievert</span>,  <span class="cit-name-given-names">S. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Scott</span>,  <span class="cit-name-given-names">K. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Klotz</span>,  <span class="cit-name-given-names">M. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chain</span>,  <span class="cit-name-given-names">P. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hauser</span>,  <span class="cit-name-given-names">L. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hemp</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hügler</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Land</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lapidus</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Genome of the epsilonproteobacterial chemolithoautotroph <em>Sulfurimonas denitrificans</em></span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">74</span>, <span class="cit-fpage">1145</span>–<span class="cit-lpage">1156</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.01844-07</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18065616</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=74/4/1145"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-32-1" title="View reference  in text"
+                           id="ref-32">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.32"
+                             data-doi="10.1099/00207713-44-4-846">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Goebel</span>,  <span class="cit-name-given-names">B. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Taxonomic Note: A place for DNA-DNA reassociation and 16S rRNA sequence analysis in the present species definition in Bacteriology</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">44</span>, <span class="cit-fpage">846</span>–<span class="cit-lpage">849</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-44-4-846</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=44/4/846"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-33-1" title="View reference  in text"
+                           id="ref-33">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.33"
+                             data-doi="10.1099/mic.0.2008/018085-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Starkenburg</span>,  <span class="cit-name-given-names">S. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Arp</span>,  <span class="cit-name-given-names">D. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bottomley</span>,  <span class="cit-name-given-names">P. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><span class="sc">d</span>-Lactate metabolism and the obligate requirement for CO<sub>2</sub> during growth on nitrite by the facultative lithoautotroph <em>Nitrobacter hamburgensis</em></span>. <abbr class="cit-jnl-abbrev">Microbiology</abbr> <span class="cit-vol">154</span>, <span class="cit-fpage">2473</span>–<span class="cit-lpage">2481</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/mic.0.2008/018085-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18667580</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=mic&amp;resid=154/8/2473"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-34-1" title="View reference  in text"
+                           id="ref-34">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.34"
+                             data-doi="10.1128/AEM.71.9.5440-5450.2005">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sasaki</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nogi</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miwa</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nealson</span>,  <span class="cit-name-given-names">K. H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Horikoshi</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Novel chemoautotrophic endosymbiosis between a member of the <em>Epsilonproteobacteria</em> and the hydrothermal-vent gastropod <em>Alviniconcha</em> aff. <em>hessleri</em> (Gastropoda: Provannidae) from the Indian Ocean</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">71</span>, <span class="cit-fpage">5440</span>–<span class="cit-lpage">5450</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.71.9.5440-5450.2005</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16151136</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=71/9/5440"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-35-1" title="View reference  in text"
+                           id="ref-35">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.35"
+                             data-doi="10.1128/AEM.72.2.1388-1393.2006">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kojima</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sasaki</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Utsumi</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Watanabe</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Urakawa</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tsuchida</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nunoura</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">Host-symbiont relationships in hydrothermal vent gastropods of the genus <em>Alviniconcha</em> from the Southwest Pacific</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">72</span>, <span class="cit-fpage">1388</span>–<span class="cit-lpage">1393</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.72.2.1388-1393.2006</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16461691</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=72/2/1388"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-36-1" title="View reference  in text"
+                           id="ref-36">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.36"
+                             data-doi="10.1099/ijs.0.64255-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Takai</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nakagawa</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miyazaki</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Suzuki</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Inagaki</span>,  <span class="cit-name-given-names">F.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Horikoshi</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title"><em>Sulfurimonas paralvinellae</em> sp. nov., a novel mesophilic, hydrogen- and sulfur-oxidizing chemolithoautotroph within the <em>Epsilonproteobacteria</em> isolated from a deep-sea hydrothermal vent polychaete nest, reclassification of <em>Thiomicrospira denitrificans</em> as <em>Sulfurimonas denitrificans</em> comb. nov. and emended description of the genus <em>Sulfurimonas</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">56</span>, <span class="cit-fpage">1725</span>–<span class="cit-lpage">1733</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.64255-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16901999</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=56/8/1725"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-37-1" title="View reference  in text"
+                           id="ref-37">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.37"
+                             data-doi="10.1016/0077-7579(75)90008-3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Timmer-ten Hoor</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1975</span><strong>).</strong> <span class="cit-article-title">A new type of thiosulphate oxidizing, nitrate reducing microorganism: <em>Thiomicrospira denitrificans</em> sp. nov.</span>. <abbr class="cit-jnl-abbrev">Neth J Sea Res</abbr> <span class="cit-vol">9</span>, <span class="cit-fpage">344</span>–<span class="cit-lpage">350</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/0077-7579(75)90008-3</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/0077-7579(75)90008-3&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20new%20type%20of%20thiosulphate%20oxidizing%2C%20nitrate%20reducing%20microorganism%3A%20Thiomicrospira%20denitrificans%20sp.%20nov.&amp;author=A.%20Timmer-ten%20Hoor&amp;publication_year=1975&amp;journal=Neth%20J%20Sea%20Res&amp;volume=9&amp;pages=344-350&amp;doi=10.1016%2F0077-7579%2875%2990008-3">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-38-1" title="View reference  in text"
+                           id="ref-38">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4141.38">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Balows</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Trüper</span>,  <span class="cit-name-given-names">H. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Dworkin</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Harder</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K.-H.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Widdel</span>,  <span class="cit-name-given-names">F.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bak</span>,  <span class="cit-name-given-names">F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1992</span><strong>).</strong> <span class="cit-article-title">Chapter 183. Gram-negative mesophilic sulfate-reducing bacteria</span>. In <span class="cit-source">The Prokaryotes</span>. <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. IV</span>, pp, <span class="cit-fpage">3352</span>–<span class="cit-lpage">3378</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Balows</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Trüper</span>,  <span class="cit-name-given-names">H. G.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Dworkin</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Harder</span>,  <span class="cit-name-given-names">W.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K.-H.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Chapter%20183.%20Gram-negative%20mesophilic%20sulfate-reducing%20bacteria&amp;author=F.%20Widdel&amp;author=F.%20Bak&amp;publication_year=1992&amp;citation_inbook_title=The%20Prokaryotes">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-39-1" title="View reference  in text"
+                           id="ref-39">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4141.39"
+                             data-doi="10.1007/BF00407804">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Widdel</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kohring</span>,  <span class="cit-name-given-names">G. W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mayer</span>,  <span class="cit-name-given-names">F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1983</span><strong>).</strong> <span class="cit-article-title">Studies on dissimilatory sulfate-reducing bacteria that decompose fatty acids. III. Characterization of the filamentous gliding
+                                    <em>Desulfonema limicola</em> gen. nov. sp. nov., and <em>Desulfonema magnum</em> sp. nov.</span> <abbr class="cit-jnl-abbrev">Arch Microbiol</abbr> <span class="cit-vol">134</span>, <span class="cit-fpage">286</span>–<span class="cit-lpage">294</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/BF00407804</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/BF00407804&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7283636&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Studies%20on%20dissimilatory%20sulfate-reducing%20bacteria%20that%20decompose%20fatty%20acids.%20III.%20Characterization%20of%20the%20filamentous%20gliding%20Desulfonema%20limicola%20gen.%20nov.%20sp.%20nov.%2C%20and%20Desulfonema%20magnum%20sp.%20nov.&amp;author=F.%20Widdel&amp;author=G.%20W.%20Kohring&amp;author=F.%20Mayer&amp;publication_year=1983&amp;journal=Arch%20Microbiol&amp;volume=134&amp;pages=286-294&amp;doi=10.1007%2FBF00407804">Google Scholar</a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4136.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4149.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="open-access-note">
+               <span class="open-access-note">OPEN ACCESS ARTICLE</span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    <span class="slug-metadata-note ahead-of-print">
+                                 	
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">June 7, 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.048827-0" class="slug-doi">10.1099/ijs.0.048827-0
+                                    </span>
+                                 </span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4141-4148
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li><span class="creative-commons-article">Free via Creative Commons: <span>CC</span></span></li>
+                        <li><span class="ccv cc-version-by/2.5/"></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4141.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4141.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/powerpoint/63/Pt_11/4141">PPT Slides of All Figures</a></li>
+                        <li class="cb-versions">
+                           <div><span id="pap-all-versions-label">All Versions of this Article:</span><ol class="version-list">
+                                 <li><a href="/content/early/2013/06/04/ijs.0.048827-0">ijs.0.048827-0v1</a></li>
+                                 <li class="current-li"><span>63/Pt_11/4141</span> <span class="current-version">most recent</span></li>
+                              </ol>
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings">
+                              <li>New Taxa
+                                 <ul class="subject-sub-headings last-child">
+                                    <li><a class="tocsection-search"
+                                          href="/search?tocsectionid=Proteobacteria&amp;sortspec=date&amp;submit=Submit">Proteobacteria</a></li>
+                                 </ul>
+                              </li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4141&amp;current-view-path=/content/63/Pt_11/4141.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4141&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4141.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4141&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4141.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.048827-0&amp;citation=Labrenz%20et%20al.%2063%20%28Pt%2011%29:%204141&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4141&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=23749282&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4141">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" alt="Permissions" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4141.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4141#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4141" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4141&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4141.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ALabrenz%20author%3AM.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Labrenz, M.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AJ%C3%BCrgens%20author%3AK.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Jürgens, K.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4141.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=23749282&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Labrenz%20M&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Labrenz, M.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=J%C3%BCrgens%20K&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Jürgens, K.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/23749282"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4141.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4141#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4141&amp;title=Sulfurimonas%20gotlandica%20sp.%20nov.%2C%20a%20chemoautotrophic%20and%20psychrotolerant%20epsilonproteobacterium%20isolated%20from%20a%20pelagic%20redoxcline%2C%20and%20an%20emended%20description%20of%20the%20genus%20Sulfurimonas+--+Labrenz%20et%20al.%2063%20%28Pt%2011%29%3A%204141+--+IJSEM&amp;doi=10.1099/ijs.0.048827-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.pdf
new file mode 100644
index 00000000..07da41b7
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4141.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.html b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.html
new file mode 100644
index 00000000..e837245e
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.html
@@ -0,0 +1,23 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Arthrobacter siccitolerans sp. nov., a highly desiccation-tolerant, xeroprotectant-producing strain isolated from dry soil
+         
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4174" />
+      <meta content="/ijs/63/Pt_11/4174.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Arthrobacter siccitolerans sp. nov., a highly desiccation-tolerant, xeroprotectant-producing strain isolated from dry soil"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.052902-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="L. SantaCruz-Calvo" name="DC.Contributor" />
+      <meta content="J. González-López" name="DC.C
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.pdf
new file mode 100644
index 00000000..ed8bb19a
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4174.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F2.large.jpg b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F2.large.jpg
new file mode 100644
index 00000000..5062af48
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/F2.large.jpg differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.html b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.html
new file mode 100644
index 00000000..313ba305
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.html
@@ -0,0 +1,1390 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Prevotella jejuni sp. nov., isolated from the small intestine of a child with coeliac disease </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4218" />
+      <meta content="/ijs/63/Pt_11/4218.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Prevotella jejuni sp. nov., isolated from the small intestine of a child with coeliac disease"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.052647-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Maria E. Hedberg" name="DC.Contributor" />
+      <meta content="Anne Israelsson" name="DC.Contributor" />
+      <meta content="Edward R. B. Moore" name="DC.Contributor" />
+      <meta content="Liselott Svensson-Stadler" name="DC.Contributor" />
+      <meta content="Sun Nyunt Wai" name="DC.Contributor" />
+      <meta content="Grzegorz Pietz" name="DC.Contributor" />
+      <meta content="Olof Sandström" name="DC.Contributor" />
+      <meta content="Olle Hernell" name="DC.Contributor" />
+      <meta content="Marie-Louise Hammarström" name="DC.Contributor" />
+      <meta content="Sten Hammarström" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Maria E. Hedberg" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Anne Israelsson" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Edward R. B. Moore" />
+      <meta name="citation_author_institution"
+            content="2CCUG – Culture Collection University of Gothenburg, Department of Clinical Bacteriology, Sahlgrenska University Hospital, SE-41345 Göteborg, Sweden" />
+      <meta name="citation_author_institution"
+            content="3Department of Infectious Diseases, Sahlgrenska Academy of the University of Gothenburg, SE-40530 Göteborg, Sweden" />
+      <meta name="citation_author" content="Liselott Svensson-Stadler" />
+      <meta name="citation_author_institution"
+            content="2CCUG – Culture Collection University of Gothenburg, Department of Clinical Bacteriology, Sahlgrenska University Hospital, SE-41345 Göteborg, Sweden" />
+      <meta name="citation_author" content="Sun Nyunt Wai" />
+      <meta name="citation_author_institution"
+            content="4Department of Molecular Biology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Grzegorz Pietz" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Olof Sandström" />
+      <meta name="citation_author_institution"
+            content="5Department of Clinical Sciences, Pediatrics, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Olle Hernell" />
+      <meta name="citation_author_institution"
+            content="5Department of Clinical Sciences, Pediatrics, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Marie-Louise Hammarström" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta name="citation_author" content="Sten Hammarström" />
+      <meta name="citation_author_institution"
+            content="1Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden" />
+      <meta content="Prevotella jejuni sp. nov., isolated from the small intestine of a child with coeliac disease"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4218" name="citation_firstpage" />
+      <meta content="4223" name="citation_lastpage" />
+      <meta content="63/Pt_11/4218" name="citation_id" />
+      <meta content="63/Pt 11/4218" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4218" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.052647-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4218.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4218.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4218.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4218"
+            name="citation_public_url" />
+      <meta content="23793857" name="citation_pmid" />
+      <meta name="citation_access" content="all" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Bacteroidetes" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4207.short" rel="prev" />
+      <link href="/content/63/Pt_11/4224.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d6344287e1">var callbackToken='563D232F73E9C85';</script><script type="text/javascript" id="session-d6344287e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4218.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline"><em>Prevotella jejuni</em> sp. nov., isolated from the small intestine of a child with coeliac disease
+               </h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Maria+E.+Hedberg&amp;sortspec=date&amp;submit=Submit">Maria E. Hedberg</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Anne+Israelsson&amp;sortspec=date&amp;submit=Submit">Anne Israelsson</a></span><a id="xref-aff-1-2" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Edward+R.+B.+Moore&amp;sortspec=date&amp;submit=Submit">Edward R. B. Moore</a></span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a><span class="xref-sep">,</span><a id="xref-aff-3-1" class="xref-aff" href="#aff-3"><sup>3</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-4" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Liselott+Svensson-Stadler&amp;sortspec=date&amp;submit=Submit">Liselott Svensson-Stadler</a></span><a id="xref-aff-2-2" class="xref-aff" href="#aff-2"><sup>2</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-5" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Sun+Nyunt+Wai&amp;sortspec=date&amp;submit=Submit">Sun Nyunt Wai</a></span><a id="xref-aff-4-1" class="xref-aff" href="#aff-4"><sup>4</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-6" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Grzegorz+Pietz&amp;sortspec=date&amp;submit=Submit">Grzegorz Pietz</a></span><a id="xref-aff-1-3" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-7" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Olof+Sandstr%C3%B6m&amp;sortspec=date&amp;submit=Submit">Olof Sandström</a></span><a id="xref-aff-5-1" class="xref-aff" href="#aff-5"><sup>5</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-8" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Olle+Hernell&amp;sortspec=date&amp;submit=Submit">Olle Hernell</a></span><a id="xref-aff-5-2" class="xref-aff" href="#aff-5"><sup>5</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-9" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Marie-Louise+Hammarstr%C3%B6m&amp;sortspec=date&amp;submit=Submit">Marie-Louise Hammarström</a></span><a id="xref-aff-1-4" class="xref-aff" href="#aff-1"><sup>1</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-10"><span class="name"><a class="name-search"
+                              href="/search?author1=Sten+Hammarstr%C3%B6m&amp;sortspec=date&amp;submit=Submit">Sten Hammarström</a></span><a id="xref-aff-1-5" class="xref-aff" href="#aff-1"><sup>1</sup></a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>Department of Clinical Microbiology, Immunology, Umeå University, SE-90187 Umeå, Sweden
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>CCUG – Culture Collection University of Gothenburg, Department of Clinical Bacteriology, Sahlgrenska University Hospital,
+                           SE-41345 Göteborg, Sweden
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-3" name="aff-3"></a><address><sup>3</sup>Department of Infectious Diseases, Sahlgrenska Academy of the University of Gothenburg, SE-40530 Göteborg, Sweden
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-4" name="aff-4"></a><address><sup>4</sup>Department of Molecular Biology, Umeå University, SE-90187 Umeå, Sweden
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-5" name="aff-5"></a><address><sup>5</sup>Department of Clinical Sciences, Pediatrics, Umeå University, SE-90187 Umeå, Sweden
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> Maria E. Hedberg <span class="em-link"><span class="em-addr">maria.hedberg{at}climi.umu.se</span></span> Sten Hammarström <span class="em-link"><span class="em-addr">sten.hammarstrom{at}climi.umu.se</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-4">Five obligately anaerobic, Gram-stain-negative, saccharolytic and proteolytic, non-spore-forming bacilli (strains CD3 : 27,
+                     CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32 and CD3 : 34) are described. All five strains were isolated from the small intestine of a female child
+                     with coeliac disease. Cells of the five strains were short rods or coccoid cells with longer filamentous forms seen sporadically.
+                     The organisms produced acetic acid and succinic acid as major metabolic end products. Phylogenetic analysis based on comparative
+                     16S rRNA gene sequence analysis revealed close relationships between CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33, between CD3 : 32 and <span class="named-content species" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Prevotella histicola"
+                           href="doi:10.1601/nm.13539"><em>Prevotella histicola</em></a></span> CCUG 55407<sup>T</sup>, and between CD3 : 34 and <span class="named-content species" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Prevotella melaninogenica"
+                           href="doi:10.1601/nm.8043"><em>Prevotella melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>. Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 were clearly different from all recognized species within the genus <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                           href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> and related most closely to but distinct from <span class="named-content species" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                           href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span>. Based on 16S rRNA, RNA polymerase β-subunit (<em>rpoB</em>) and 60 kDa chaperonin protein subunit (<em>cpn60</em>) gene sequencing, and phenotypic, chemical and biochemical properties, strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 are considered to represent a novel species within the genus <span class="named-content genus" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                           href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span>, for which the name <em>Prevotella jejuni</em> sp. nov. is proposed. Strain CD3 : 28<sup>T</sup> ( = CCUG 60371<sup>T</sup> = DSM 26989<sup>T</sup>) is the type strain of the proposed novel species. All five strains were able to form homologous aggregates, in which tube-like
+                     structures were connecting individual bacterial cells. The five strains were able to bind to human intestinal carcinoma cell
+                     lines at 37 °C.
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-other" id="fn-1">
+                        <p id="p-1">The GenBank/EMBL/DDBJ accession number for the 16S rRNA gene sequence of strain CD3 : 28<sup>T</sup> is JQ778983.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-2">
+                        <p id="p-2">One supplementary figure and three supplementary tables are available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="license" id="license-1">
+                  <p id="p-3">This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted
+                     use, distribution, and reproduction in any medium, provided the original work is properly cited.
+                  </p>
+               </div>
+               <p id="p-12">Coeliac disease (CD) is an immune-mediated enteropathy with a multifactorial aetiology. Early childhood infections have been
+                  shown to be a risk factor for CD (<a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Myléus <em>et al.</em>, 2012</a>). Also, the jejunal microbiota is considered to play a role in the pathogenesis of CD (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Olivares <em>et al.</em>, 2013</a>). This is supported by epidemiological data from Sweden showing that childhood CD has features of an infectious disease with
+                  a peak incidence between 1985 and 1996 in children younger than 2 years of age, a period referred to as ‘the Swedish CD epidemic’
+                  (<a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">Ivarsson <em>et al.</em>, 2000</a>). A similar increase in incidence was seen later, during 2001–2004 (<a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Olsson <em>et al.</em>, 2008</a>; Namatovu, F. <em>et</em> <em>al.</em>, unpublished data). After both peaks, incidence returned to normal. We have shown that CD patients born during ‘the Swedish
+                  CD epidemic’ had a significant enrichment of mucosa-associated rod-shaped bacteria of the order <span class="named-content order" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Clostridiales"
+                        href="doi:10.1601/nm.3876"><em>Clostridiales</em></a></span>, and genera <span class="named-content genus" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> and <span class="named-content genus" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Actinomyces"
+                        href="doi:10.1601/nm.5771"><em>Actinomyces</em></a></span> in the jejunum (<a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Forsberg <em>et al.</em>, 2004</a>; <a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Ou <em>et al.</em>, 2009</a>). Recently, we characterized a novel species of a new genus, <span class="named-content species" id="named-content-9"><a class="namesforlife" rel="namesforlife-name"
+                        title="Lachnoanaerobaculum umeaense"
+                        href="doi:10.1601/nm.23523"><em>Lachnoanaerobaculum umeaense</em></a></span>, that had been isolated from the jejunal mucosa of a child born during ‘the Swedish CD epidemic’ (<a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Hedberg <em>et al.</em>, 2012</a>). We assumed that this bacterium corresponded to the prevalent bacteria of the order <span class="named-content order" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Clostridiales"
+                        href="doi:10.1601/nm.3876"><em>Clostridiales</em></a></span> we had previously reported (<a id="xref-ref-16-2" class="xref-bibr" href="#ref-16">Ou <em>et al.</em>, 2009</a>). To further characterize the microbiota of the small intestine of children with CD born during the first epidemic we have
+                  now studied isolates of the genus <span class="named-content genus" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span>.
+               </p>
+               <p id="p-13">At the time of writing, 48 species of the genus <span class="named-content genus" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> have been described (<a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Euzéby, 2013</a>). The vast majority were isolated from humans, with the oral cavity being the main source (<a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Dewhirst <em>et al.</em>, 2010</a>). However, <span class="named-content genus" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> species have also been isolated from faeces (<a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Hayashi <em>et al.</em>, 2007</a>), the female genital tract, skin and respiratory tract, and from the rumen and hindgut of non-human mammals (<a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Alauzet <em>et al.</em>, 2010</a>). Until now, no species of the genus <span class="named-content genus" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> from the human small intestine had been characterized. Species of the genus <span class="named-content genus" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> are generally considered to be non-pathogenic or opportunistic pathogens. However, they have been shown to be involved in
+                  serious infections, and virulence factors such as haemolysins, haemagglutinins, fimbrial adhesins, proteases and phospholipases
+                  have been demonstrated in strains of several species (<a id="xref-ref-1-2" class="xref-bibr" href="#ref-1">Alauzet <em>et al.</em>, 2010</a>).
+               </p>
+               <p id="p-14">This study describes the phenotypic and genotypic characterization of strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33, representing isolates of a novel species, CD3 : 32, probably a strain of <span class="named-content species" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Prevotella histicola"
+                        href="doi:10.1601/nm.13539"><em>Prevotella histicola</em></a></span> (<a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">Downes <em>et al.</em>, 2008</a>), and CD3 : 34, probably a strain of <span class="named-content species" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Prevotella melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>Prevotella melaninogenica</em></a></span> (<a id="xref-ref-19-1" class="xref-bibr" href="#ref-19">Shah &amp; Collins, 1990</a>). Additionally, we describe the phylogenetic relationships between the five isolates and other members of the genus <span class="named-content genus" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span>, based upon comparative 16S rRNA gene sequence analyses. Moreover, the five isolates have been subjected to whole genome
+                  sequencing (WGS) using 454 pyro-sequencing technology (GS Junior; Roche Diagnostics), and the sequences of the genes encoding
+                  chaperonin 60 (<em>cpn60</em>) and DNA-directed RNA polymerase subunit-β (<em>rpoB</em>) have also been compared.
+               </p>
+               <p id="p-15">The five strains were isolated from a biopsy of the proximal small intestine of a girl with CD, born in 1995, i.e. during
+                  the 1985–1996 Swedish CD epidemic. She was on a gluten-free diet when the biopsy was taken at the Department of Paediatrics,
+                  Umeå University Hospital, Umeå, in 2007. Informed consent was obtained from her parents. The study was approved by the local
+                  Research Ethics Committee of the Faculty of Medicine (Um dnr: 96-304 and 04-156). The biopsy was weighed, homogenized and
+                  serially diluted ten-fold in Fastidious Anaerobe Broth medium (Lab M) and immediately plated onto selective and non-selective
+                  agar media. All <span class="named-content genus" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> strains were primarily isolated on blood agar plates [Columbia Blood Agar Base (Acumedia), supplemented with 5 % defibrinated
+                  horse blood]. <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup>, <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> and <span class="named-content species" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="Prevotella stercorea"
+                        href="doi:10.1601/nm.10959"><em>Prevotella stercorea</em></a></span> CCUG 55595<sup>T</sup> were obtained from the Culture Collection University of Gothenburg (CCUG; <a href="http://www.ccug.se">http://www.ccug.se</a>).
+               </p>
+               <p id="p-16">Pure cultures of the five strains grew well on blood agar plates and in Brucella broth (BBL) supplemented with vitamin K (1
+                  µg ml<sup>−1</sup>) and haemin (5 µg ml<sup>−1</sup>) under an anaerobic atmosphere (10 % H<sub>2</sub>, 5 % CO<sub>2</sub> in N<sub>2</sub>) at 37 °C.
+               </p>
+               <p id="p-17">Colony morphologies and the results of presumptive identification tests by diagnostic discs (<a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Jousimies-Somer <em>et al.</em>, 2002</a>) were examined on blood agar plates after incubation for 3–5 days. None of the five strains grew in the presence of oxygen
+                  and they should be considered strictly anaerobic. Growth was improved and pigmentation and haemolytic activity increased if
+                  the atmosphere contained 10 % CO<sub>2</sub> and 5 % H<sub>2</sub> as compared with standard conditions. The appearance of the colonies of the five strains differed: isolate CD3 : 27 had circular,
+                  raised, convex, weakly to moderately pigmented and strongly haemolytic colonies; CD3 : 28<sup>T</sup> and CD3 : 33 had circular, convex, weakly pigmented, weakly haemolytic colonies; CD3 : 32 had circular, slightly raised and
+                  brown-reddish pigmented colonies with a shiny ‘wet’ appearance. Moreover, the centres of the colonies of CD3 : 32 were darker
+                  than the outer part. Colonies of CD3 : 34 were similar to those of CD3 : 28<sup>T</sup> and CD3 : 33, but with a surface appearing ‘drier’ (Fig. S1 available in IJSEM Online).
+               </p>
+               <p id="p-18">Light microscopy after Gram staining, dark field microscopy, scanning electron microscopy (SEM) and transmission electron
+                  microscopy (TEM) were used to investigate cell morphologies. Cells of the five strains were rod-shaped, 0.7×0.8–2 µm in size,
+                  occurring most often as short rods or as coccoid cells, with longer filamentous forms (&gt;10 µm) seen sporadically. All five
+                  strains were Gram-stain-negative and lacked spores. SEM revealed that all five strains, particularly if grown on agar medium,
+                  as opposed to in liquid culture, formed large aggregates of bacterial cells connected to each other by multiple, thin, straight,
+                  rod-shaped structures (<a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1a–c</a>). Cells of strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 showed a similar degree of interconnectivity. Outer membrane vesicles were frequently observed. Analysis of
+                  thin sections of the aggregates by TEM suggested that the rod-shaped structures were hollow, characterized as tubes connecting
+                  cells to each other (<a id="xref-fig-1-2" class="xref-fig" href="#F1">Fig. 1d</a>).
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4218/F1.expansion.html"><img alt="Fig. 1. " src="4218/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4218/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4218/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4218/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-19" class="first-child">Scanning electron micrographs showing surface structures of cells of <em>P. jejuni</em>, strains CD3 : 27 (a) and CD3 : 28<sup>T</sup> (b) and <em>P. histicola</em> strain CD3 : 32 (c). (d) Transmission electron micrograph of a cell of strain <em>P. jejuni</em> CD3 : 33; arrows indicate cross-section of the tube-like structures shown in (a)–(c) and arrowheads indicate outer membrane
+                        vesicles. Bars, 0.2 µm (a, b, d); 1 µm (c).
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-20">All five strains exhibited a temperature optimum for growth at 37 °C. The optimal pH for growth was 6–7 with reduced growth
+                  at pH 5.5 and 7.5. Motility was not observed. All five strains were haemolytic and produced NH<sub>3</sub>. Growth on glucose as the sole carbon source yielded acetic acid, succinic acid and small amounts of isovaleric acid for
+                  strains CD3 : 27, CD3 : 32 and CD3 : 34, and acetic acid and succinic acid for strains CD3 : 28<sup>T</sup> and CD3 : 33.
+               </p>
+               <p id="p-21">The nucleotide sequences of the 16S rRNA genes of strains CD3 : 27, CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32 and CD3 : 34 were determined by primer walking, covering the gene, and by cloning and sequencing of PCR
+                  amplification fragments also covering the gene (<a id="xref-ref-9-2" class="xref-bibr" href="#ref-9">Hedberg <em>et al.</em>, 2012</a>). These sequences were subsequently confirmed by genomic sequencing, allowing us to establish that there was only one copy
+                  of the 16S rRNA gene per genome. Other 16S rRNA gene sequences for comparative analyses were retrieved from the NCBI database
+                  (<a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Sayers <em>et al.</em>, 2010</a>). Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 shared &gt;99.8 % 16S rRNA gene sequence similarity with each other and 98.1–98.3 % similarity with <span class="named-content species" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> (AY323525), <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> (AB547685), N 12-20 (EU126662), CD3 : 34 and CD3 : 32, and 97.3–97.7 % similarity with <span class="named-content species" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="Prevotella veroralis"
+                        href="doi:10.1601/nm.8066"><em>Prevotella veroralis</em></a></span> CCUG 15422<sup>T</sup> (AY836507). Strain CD3 : 32 was related most closely to <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> (AB547685 and EU126662) showing &gt;99.6 % sequence similarity. Strain CD3 : 34 showed 99.8 % sequence similarity to <span class="named-content species" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> (AY323525 and NC-014370). <a id="xref-fig-2-1" class="xref-fig" href="#F2">Fig. 2</a> shows the phylogenetic tree reconstructed using the maximum composite likelihood model based on 16S rRNA gene sequences.
+                  Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 formed a separate group distinct from recognized species of the genus <span class="named-content genus" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> while strain CD3 : 32 clustered with <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> and strain CD3 : 34 with <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span>.
+               </p>
+               <div id="F2" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4218/F2.expansion.html"><img alt="Fig. 2. " src="4218/F2.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4218/F2.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4218/F2.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4218/F2">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 2. </span> 
+                     
+                     <p id="p-22" class="first-child">Phylogenetic tree based on 16S rRNA gene sequences showing the relationships between strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 and related species. The 16S rRNA gene sequence of <span class="named-content species" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="Porphyromonas gingivalis"
+                              href="doi:10.1601/nm.8029"><em>Porphyromonas gingivalis</em></a></span> ATCC 33277<sup>T</sup> served as an outgroup. Bar, 0.02 substitutions per nucleotide position.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-23">Genomic DNA–DNA reassociation analysis was carried out using the hybridization protocols described by <a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Urdiain <em>et al.</em> (2008)</a>. Strain CD3 : 28<sup>T</sup> hybridized to a high level (95–112 %) with strains CD3 : 27 and CD3 : 33, confirming that these three strains belong to the
+                  same species. The level of hybridization between strain CD3 : 28<sup>T</sup> and <span class="named-content species" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup>, <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>, <span class="named-content species" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="Prevotella scopos"
+                        href="doi:10.1601/nm.21331"><em>Prevotella scopos</em></a></span> CCUG 57945<sup>T</sup> and <span class="named-content species" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="P. veroralis"
+                        href="doi:10.1601/nm.8066"><em>P. veroralis</em></a></span> CCUG 15422<sup>T</sup> was below 43 %. Levels of hybridization between strain CD3 : 28<sup>T</sup> and strains CD3 : 32 and CD3 : 34 were 49 and 59 % respectively. The level of hybridization between <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> and strain CD3 : 34 was high (104 %), while that between strain CD3 : 34 and strain CD3 : 28<sup>T</sup> was 51 %. <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> hybridized to a low level (30 %) with <span class="named-content species" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup>. The coefficient of variation was less than 5.5 %. As the genomic DNA hybridization values were well below 70 % for strains
+                  CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 on the one hand and strains CD3 : 32 or CD3 : 34 on the other, the strains can be considered to represent different
+                  species (<a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Stackebrandt &amp; Goebel, 1994</a>).
+               </p>
+               <p id="p-24">To shed further light on whether CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 should be considered as strains of the same novel species we compared the nucleotide sequences of the <em>rpoB</em> and <em>cpn60</em> genes (<a id="xref-ref-1-3" class="xref-bibr" href="#ref-1">Alauzet <em>et al.</em>, 2010</a>; <a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Sakamoto &amp; Ohkuma, 2010</a>). Similarly, we compared strain CD3 : 32 with <span class="named-content species" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> and strain CD3 : 34 with <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span>. The <em>rpoB</em> and <em>cpn60</em> (3810 and 1626 nt respectively) gene sequences were 100.0 % identical between strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33. Sequence similarity between CD3 : 32 and <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> F0411 was 99.3 % for <em>rpoB</em> and 98.7 % for <em>cpn60</em>. Strain CD3 : 34 and <span class="named-content species" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> shared 98.3 % <em>rpoB</em> gene sequence similarity and 97.7 % <em>cpn60</em> gene sequence similarity.
+               </p>
+               <p id="p-25">The sizes of the genomes and the DNA G+C contents of the five strains were determined from WGS data (<a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>). Strains CD3 : 28<sup>T</sup> and CD3 : 33 had almost the same genome size, 3.81×10<sup>6</sup> and 3.80×10<sup>6</sup> bp, respectively, while CD3 : 27 had a size of 3.68×10<sup>6</sup> bp. The genome of strain CD3 : 32 had a size of 3.20×10<sup>6</sup> bp, larger than that of the closely related <span class="named-content species" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> F0411 (2.99×10<sup>6</sup> bp). The genome size of strain CD3 : 34 was 3.27×10<sup>6</sup> bp, about 102×10<sup>3</sup> bp larger than that of <span class="named-content species" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>. The DNA G+C contents of the strains grouped together, in that strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 had values of 41.7–41.8 mol%, CD3 : 32 and <span class="named-content species" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> F0411 had values of 41.1 and 41.2 mol%, respectively, and CD3 : 34 and <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> values of 40.7 and 41.0 mol%, respectively.
+               </p>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4218/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4218/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Genome size and DNA G+C content of <em>Prevotella jejuni</em> sp. nov., and the other two <span class="named-content genus" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                              href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span> isolates from human small intestine compared with <span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                              href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> and <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                              href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span></span>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-28">Cellular fatty acid (CFA) methyl ester analyses were performed using a standardized protocol (<a href="http://www.ccug.se/pages/CFA_method_2008">http://www.ccug.se/pages/CFA_method_2008</a> and as detailed by <a id="xref-ref-9-3" class="xref-bibr" href="#ref-9">Hedberg <em>et al.</em>, 2012</a>). Strains were grown anaerobically (10 % H<sub>2</sub>, 5 % CO<sub>2</sub> in N<sub>2</sub>), using chocolate agar as culture medium at 37 °C, and harvested after 48 h. CFAs were extracted and saponified by mild alkaline
+                  methanolysis and released fatty acids were methylated. CFAs were identified and quantified by GC (Hewlett Packard HP 5890).
+                  Retention times of CFA peaks were converted to equivalent chain-length values and the relative amount (w/w) of each fatty
+                  acid was expressed as a percentage of the total fatty acids in the profile of the respective strain (Table S1). The major
+                  CFAs detected in strains CD3 : 27, CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32 and CD3 : 34 were iso-C<sub>15 : 0</sub>, anteiso-C<sub>15 : 0</sub>, C<sub>16 : 0</sub>, C<sub>18 : 2</sub>ω6,9<em>c</em>/anteiso-C<sub>18 : 0</sub> and iso-C<sub>17 : 0</sub> 3-OH. These five CFAs occurred in approximately the same relative amounts in the five strains with anteiso-C<sub>15 : 0</sub> accounting for 38.5–42.5 % of the total CFAs. Interestingly, strains CD3 : 27, CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32 and CD3 : 34 were more similar to each other than were CD3 : 32 to <span class="named-content species" id="named-content-52"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> or CD3 : 34 to <span class="named-content species" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> (Table S1). The similarities between the five jejunal isolates, although representing three different species, are perhaps
+                  a reflection of the fact that they were isolated from the same organ of one individual.
+               </p>
+               <p id="p-29">Analysis of metabolic and biochemical characteristics (rapid ID 32A, API 20A and APIZYM; bioMérieux) showed that the five
+                  strains are saccharolytic and proteolytic (Table S2). Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 demonstrated an almost identical pattern of biochemical characteristics. The only difference observed was that
+                  strain CD3 : 33 had α-galactosidase activity, while the other two strains did not. CD3 : 32 and <span class="named-content species" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> showed an identical pattern of biochemical characteristics and the same was true for the comparison between CD3 : 34 and
+                  <span class="named-content species" id="named-content-55"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>. Sialidase activity was detected using 2′-(4-methylumbelliferyl)α-<span class="sc">d</span>-<em>N</em>-acetylneuraminic acid as substrate (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Moncla &amp; Braham, 1989</a>). All strains produced sialidase except CD3 : 32 and <span class="named-content species" id="named-content-56"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup>.
+               </p>
+               <p id="p-30">By disc diffusion it was shown that all five isolates and <span class="named-content species" id="named-content-57"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> were resistant to vancomycin (5 µg) but susceptible to kanamycin (1 mg), colistin (10 µg) (Oxoid) and bile (1000 µg) (Oxgall
+                  tablets; Rosco Diagnostica), whereas <span class="named-content species" id="named-content-58"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> was resistant to vancomycin and kanamycin but susceptible to colistin and bile. <span class="named-content species" id="named-content-59"><a class="namesforlife" rel="namesforlife-name" title="P. stercorea"
+                        href="doi:10.1601/nm.10959"><em>P. stercorea</em></a></span> CCUG 55595<sup>T</sup> was resistant to kanamycin and colistin but susceptible to bile and unexpectedly also susceptible to vancomycin (<a id="xref-ref-11-2" class="xref-bibr" href="#ref-11">Jousimies-Somer <em>et al.</em>, 2002</a>). Because the bacteria were isolated from the small intestine adjacent to the bile duct, susceptibility to bile was investigated
+                  further using an agar dilution technique. A stock solution containing 320 mM synthetic bile acids (taurocholate, 134.4 mM;
+                  taurochenodeoxycholate, 83.2 mM; glycocholate, 70.4 mM; glycochenodeoxycholate, 32 mM) yielded final concentrations of 0.125–16
+                  mM bile acids in the assay. Interestingly, growth and haemolytic activity of all five jejunal isolates were stimulated at
+                  low concentrations of bile (0.5–1.5 mM) compared with medium without bile, while growth was inhibited at higher bile concentrations
+                  (2–8 mM).
+               </p>
+               <p id="p-31">Susceptibility to penicillin G was tested using MIC Evaluator Strips (Oxoid). Strains CD3 : 32, CD3 : 34 and <span class="named-content species" id="named-content-60"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> were resistant (MIC &gt;32 µg ml<sup>−1</sup>). The other strains were susceptible to penicillin G, with MICs ranging from 0.003 to 0.015 µg ml<sup>−1</sup>. According to the nitrocefin disc test (Remel), strains CD3 : 32, CD3 : 34 and <span class="named-content species" id="named-content-61"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> produce β-lactamase. WGS revealed the presence of the <em>cfxA</em> β-lactamase gene in strains CD3 : 32 and CD3 : 34, but not in <span class="named-content species" id="named-content-62"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> F0411, the only other <span class="named-content species" id="named-content-63"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> isolate that has been sequenced so far, or <span class="named-content species" id="named-content-64"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup>. Strains CD3 : 32 and CD3 : 34 shared 100 and 99 % <em>cfxA</em> gene sequence similarity with <span class="named-content species" id="named-content-65"><a class="namesforlife" rel="namesforlife-name" title="Prevotella marshii"
+                        href="doi:10.1601/nm.9557"><em>Prevotella marshii</em></a></span> CCUG 50419<sup>T</sup>, respectively.
+               </p>
+               <p id="p-32">The abilities of strains CD3 : 27, CD3 : 28<sup>T</sup>, CD3 : 33, CD3 : 32, CD3 : 34, <span class="named-content species" id="named-content-66"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> and <span class="named-content species" id="named-content-67"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> to agglutinate human erythrocytes were investigated. Strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 strongly agglutinated human O and AB erythrocytes; there was no difference in the strength of the agglutination
+                  reaction between the three strains, nor was there a difference in their ability to agglutinate AB versus O red blood cells.
+                  Strain CD3 : 34 showed a weak agglutination reaction while strains CD3 : 32, <span class="named-content species" id="named-content-68"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> CCUG 55407<sup>T</sup> and <span class="named-content species" id="named-content-69"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> CCUG 4944B<sup>T</sup> were negative. The finding that some strains of <span class="named-content species" id="named-content-70"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span> are able to weakly agglutinate red blood cells (<a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Haraldsson <em>et al.</em>, 2005</a>) is in agreement with our results.
+               </p>
+               <p id="p-33">To confirm that the five jejunal isolates were able to bind to intestinal epithelial cells, binding of PKH-2 fluorescence
+                  dye-labelled bacteria to PKH-26 fluorescence dye-labelled intestinal epithelial cells was studied by flow cytometry (<a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Hara-Kaonga &amp; Pistole, 2007</a>). Binding was evaluated after incubation at 37 °C and at 4 °C for 1 h. The cell lines were T84 (colon carcinoma), LS174T
+                  (colon carcinoma), HT29 (small intestine-like carcinoma) and Int407 (fetal small intestine epithelial cells), all obtained
+                  from the American Type Culture Collection (Rockville, MD). At 37 °C, all five isolates were able to bind to the four cell
+                  lines with two exceptions: strains CD3 : 27 and CD3 : 28<sup>T</sup> did not bind to LS174T cells (Table S3).
+               </p>
+               <p id="p-34">We conclude that strains CD3 : 27, CD3 : 28<sup>T</sup> and CD3 : 33 represent a novel species of the genus <span class="named-content genus" id="named-content-71"><a class="namesforlife" rel="namesforlife-name" title="Prevotella"
+                        href="doi:10.1601/nm.8042"><em>Prevotella</em></a></span>, for which the name <em>Prevotella jejuni</em> sp. nov. is proposed, that CD3 : 32 is a strain of <span class="named-content species" id="named-content-72"><a class="namesforlife" rel="namesforlife-name" title="P. histicola"
+                        href="doi:10.1601/nm.13539"><em>P. histicola</em></a></span> and that CD3 : 34 is a strain of <span class="named-content species" id="named-content-73"><a class="namesforlife" rel="namesforlife-name" title="P. melaninogenica"
+                        href="doi:10.1601/nm.8043"><em>P. melaninogenica</em></a></span>. The latter two jejunal isolates have larger genome sizes than the corresponding previously characterized strains. All five
+                  jejunal isolates are able to bind to human intestinal epithelial cells.
+               </p>
+               <div class="section" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  
+                  <div id="sec-2" class="subsection">
+                     
+                     <h3>Description of <em>Prevotella jejuni</em> sp. nov.
+                     </h3>
+                     
+                     <p id="p-35"><em>Prevotella jejuni</em> (je.ju′ni. L. gen. n. <em>jejuni</em> of or from the jejunum, referring to the isolation of the type strain from the jejunum).
+                     </p>
+                     
+                     <p id="p-36">The description is based on three strains isolated from the human jejunum. Cells are obligately anaerobic, non-motile, Gram-stain-negative
+                        bacilli (0.7×0.8–2 µm). After 3–5 days of incubation on blood agar plates, colonies are 1–2 mm in diameter, circular, convex,
+                        weakly to moderately pigmented and weakly to strongly haemolytic. The optimum conditions for growth are 37 °C and pH 6–7.
+                        Acetic acid, succinic acid and small amounts of isovaleric acid are produced from glucose. NH<sub>3</sub> is produced. Cells are saccharolytic and proteolytic and are able to ferment glucose, lactose, maltose, mannose, raffinose
+                        and sucrose, but not arabinose, cellobiose, mannitol, melezitose, rhamnose, salicin, sorbitol, trehalose or xylose. Positive
+                        for activity of β-galactosidase, β-galactosidase-6-phosphate, α-glucosidase, <em>N</em>-acetyl-β-glucosaminidase, α-fucosidase, sialidase, acid phosphatase, alkaline phosphatase, naphthol-AS-BI-phosphate, arginine
+                        arylamidase, alanine arylamidase, leucine arylamidase and leucyl glycine arylamidase (Table S2). Gelatin is hydrolysed but
+                        aesculin is not. Cells agglutinate human AB and O erythrocytes and bind to several human intestinal cell lines. The predominant
+                        CFA is anteiso-C<sub>15 : 0</sub>, accounting for 42.5 % of the total CFA profile. 
+                     </p>
+                     
+                     <p id="p-37">The type strain is CD3 : 28<sup>T</sup> ( = CCUG 60371<sup>T</sup> = DSM 26989<sup>T</sup>), which was isolated from a biopsy of the small intestine of a child with CD. Strains CD3 : 27 ( = CCUG 60308) and CD3 : 33
+                        ( = CCUG 60311) are additional strains of this species. The DNA G+C content of the type strain is 41.7 mol%.
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-38">Funding was provided by: the Swedish Research Council, Natural Sciences and Engineering Sciences (no. 2010-5669); the TORNADO-project
+                     within the 7th framework program theme (grant agreement no. 222720-2); the Fund for Biotechnology-oriented Basic Science at
+                     Umeå University; the County of Västerbotten; and the Medical Faculty of Umeå University. The funders had no role in study
+                     design, data collection and analysis, decision to publish, or preparation of the manuscript.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.1"
+                             data-doi="10.2217/fmb.10.126">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alauzet</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Marchandin</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lozniewski</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">New insights into <em>Prevotella</em> diversity and medical microbiology</span>. <abbr class="cit-jnl-abbrev">Future Microbiol</abbr> <span class="cit-vol">5</span>, <span class="cit-fpage">1695</span>–<span class="cit-lpage">1718</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.2217/fmb.10.126</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21133690</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.2217/fmb.10.126&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=21133690&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=New%20insights%20into%20Prevotella%20diversity%20and%20medical%20microbiology&amp;author=C.%20Alauzet&amp;author=H.%20Marchandin&amp;author=A.%20Lozniewski&amp;publication_year=2010&amp;journal=Future%20Microbiol&amp;volume=5&amp;pages=1695-1718&amp;doi=10.2217%2Ffmb.10.126&amp;pmid=21133690">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.2"
+                             data-doi="10.1128/JB.00542-10">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dewhirst</span>,  <span class="cit-name-given-names">F. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chen</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Izard</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Paster</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tanner</span>,  <span class="cit-name-given-names">A. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yu</span>,  <span class="cit-name-given-names">W. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lakshmanan</span>,  <span class="cit-name-given-names">A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wade</span>,  <span class="cit-name-given-names">W. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">The human oral microbiome</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">192</span>, <span class="cit-fpage">5002</span>–<span class="cit-lpage">5017</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JB.00542-10</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20656903</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=192/19/5002"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.3"
+                             data-doi="10.1099/ijs.0.65656-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Downes</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hooper</span>,  <span class="cit-name-given-names">S. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wilson</span>,  <span class="cit-name-given-names">M. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wade</span>,  <span class="cit-name-given-names">W. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><em>Prevotella histicola</em> sp. nov., isolated from the human oral cavity</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">58</span>, <span class="cit-fpage">1788</span>–<span class="cit-lpage">1791</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.65656-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18676457</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=58/8/1788"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-other" id="cit-63.Pt_11.4218.4">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Euzéby</span>,  <span class="cit-name-given-names">J. P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title">List of prokaryotic names with standing in nomenclature</span>. <a href="http://www.bacterio.cict.fr/classifgenerafamilies.html">www.bacterio.cict.fr/classifgenerafamilies.html</a></cite></div>
+                           <div class="cit-extra"></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.5"
+                             data-doi="10.1111/j.1572-0241.2004.04157.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Forsberg</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fahlgren</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hörstedt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hernell</span>,  <span class="cit-name-given-names">O.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">M.-L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Presence of bacteria and innate immunity of intestinal epithelium in childhood celiac disease</span>. <abbr class="cit-jnl-abbrev">Am J Gastroenterol</abbr> <span class="cit-vol">99</span>, <span class="cit-fpage">894</span>–<span class="cit-lpage">904</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1572-0241.2004.04157.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15128357</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1572-0241.2004.04157.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=15128357&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Presence%20of%20bacteria%20and%20innate%20immunity%20of%20intestinal%20epithelium%20in%20childhood%20celiac%20disease&amp;author=G.%20Forsberg&amp;author=A.%20Fahlgren&amp;author=P.%20H%C3%B6rstedt&amp;author=S.%20Hammarstr%C3%B6m&amp;author=O.%20Hernell&amp;author=M.-L.%20Hammarstr%C3%B6m&amp;publication_year=2004&amp;journal=Am%20J%20Gastroenterol&amp;volume=99&amp;pages=894-904&amp;doi=10.1111%2Fj.1572-0241.2004.04157.x&amp;pmid=15128357">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.6"
+                             data-doi="10.1016/j.mimet.2006.11.017">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hara-Kaonga</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pistole</span>,  <span class="cit-name-given-names">T. G.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">A dual fluorescence flow cytometric analysis of bacterial adherence to mammalian host cells</span>. <abbr class="cit-jnl-abbrev">J Microbiol Methods</abbr> <span class="cit-vol">69</span>, <span class="cit-fpage">37</span>–<span class="cit-lpage">43</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.mimet.2006.11.017</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17222473</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.mimet.2006.11.017&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=17222473&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20dual%20fluorescence%20flow%20cytometric%20analysis%20of%20bacterial%20adherence%20to%20mammalian%20host%20cells&amp;author=B.%20Hara-Kaonga&amp;author=T.%20G.%20Pistole&amp;publication_year=2007&amp;journal=J%20Microbiol%20Methods&amp;volume=69&amp;pages=37-43&amp;doi=10.1016%2Fj.mimet.2006.11.017&amp;pmid=17222473">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.7"
+                             data-doi="10.1016/j.anaerobe.2005.02.004">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Haraldsson</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Meurman</span>,  <span class="cit-name-given-names">J. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Könönen</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Holbrook</span>,  <span class="cit-name-given-names">W. P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Properties of hemagglutination by <em>Prevotella melaninogenica</em></span>. <abbr class="cit-jnl-abbrev">Anaerobe</abbr> <span class="cit-vol">11</span>, <span class="cit-fpage">285</span>–<span class="cit-lpage">289</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.anaerobe.2005.02.004</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16701585</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.anaerobe.2005.02.004&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=16701585&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Properties%20of%20hemagglutination%20by%20Prevotella%20melaninogenica&amp;author=G.%20Haraldsson&amp;author=J.%20H.%20Meurman&amp;author=E.%20K%C3%B6n%C3%B6nen&amp;author=W.%20P.%20Holbrook&amp;publication_year=2005&amp;journal=Anaerobe&amp;volume=11&amp;pages=285-289&amp;doi=10.1016%2Fj.anaerobe.2005.02.004&amp;pmid=16701585">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.8"
+                             data-doi="10.1099/ijs.0.64778-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hayashi</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Shibata</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sakamoto</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tomita</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Benno</span>,  <span class="cit-name-given-names">Y.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title"><em>Prevotella copri</em> sp. nov. and <em>Prevotella stercorea</em> sp. nov., isolated from human faeces</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">57</span>, <span class="cit-fpage">941</span>–<span class="cit-lpage">946</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.64778-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17473237</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=57/5/941"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.9"
+                             data-doi="10.1099/ijs.0.033613-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hedberg</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">E. R. B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Svensson-Stadler</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hörstedt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baranov</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hernell</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nyunt Wai</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">M.-L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title"><em>Lachnoanaerobaculum</em> gen. nov., a new genus in the <em>Lachnospiraceae</em>; characterization of <em>Lachnoanaerobaculum umeaense</em> gen. nov., sp. nov., isolated from the human small intestine, <em>Lachnoanaerobaculum orale</em> sp. nov., isolated from saliva and reclassification of <em>Eubacterium saburreum</em> (Prévot) Holdeman and Moore 1970 as <em>Lachnoanaerobaculum saburreum</em> comb. nov.</span> <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">62</span>, <span class="cit-fpage">2685</span>–<span class="cit-lpage">2690</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.033613-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22228654</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=62/Pt_11/2685"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.10"
+                             data-doi="10.1080/080352500750028771">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ivarsson</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Persson</span>,  <span class="cit-name-given-names">L.-Å.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nyström</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ascher</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cavell</span>,  <span class="cit-name-given-names">B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Danielsson</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dannaeus</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lindberg</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lindquist</span>,  <span class="cit-name-given-names">B.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2000</span><strong>).</strong> <span class="cit-article-title">Epidemic of coeliac disease in Swedish children</span>. <abbr class="cit-jnl-abbrev">Acta Paediatr</abbr> <span class="cit-vol">89</span>, <span class="cit-fpage">165</span>–<span class="cit-lpage">171</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1651-2227.2000.tb01210.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>10709885</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1080/080352500750028771&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=10709885&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Epidemic%20of%20coeliac%20disease%20in%20Swedish%20children&amp;author=A.%20Ivarsson&amp;author=L.-%C3%85.%20Persson&amp;author=L.%20Nystr%C3%B6m&amp;author=H.%20Ascher&amp;author=B.%20Cavell&amp;author=L.%20Danielsson&amp;author=A.%20Dannaeus&amp;author=T.%20Lindberg&amp;author=B.%20Lindquist&amp;publication_year=2000&amp;journal=Acta%20Paediatr&amp;volume=89&amp;pages=165-171&amp;doi=10.1111%2Fj.1651-2227.2000.tb01210.x&amp;pmid=10709885">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4218.11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jousimies-Somer</span>,  <span class="cit-name-given-names">H. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Summanen</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Citron</span>,  <span class="cit-name-given-names">D. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baron</span>,  <span class="cit-name-given-names">E. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wexler</span>,  <span class="cit-name-given-names">H. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Finegold</span>,  <span class="cit-name-given-names">S. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-source">Wadsworth-KTL anaerobic bacteriology manual</span>, <span class="cit-edition">6th edn</span>. <span class="cit-publ-loc">Belmont, CA</span>: <span class="cit-publ-name">Star Publishing Company</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Wadsworth-KTL%20anaerobic%20bacteriology%20manual&amp;author=H.%20R.%20Jousimies-Somer&amp;author=P.%20Summanen&amp;author=D.%20M.%20Citron&amp;author=E.%20J.%20Baron&amp;author=H.%20M.%20Wexler&amp;author=S.%20M.%20Finegold&amp;publication_year=2002">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.12">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moncla</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Braham</span>,  <span class="cit-name-given-names">P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989</span><strong>).</strong> <span class="cit-article-title">Detection of sialidase (neuraminidase) by using 2′-(4-methylumbelliferyl)α-<span class="sc">d</span>-<em>N</em>-acetylneuraminic acid in a filter paper spot test</span>. <abbr class="cit-jnl-abbrev">J Clin Microbiol</abbr> <span class="cit-vol">27</span>, <span class="cit-fpage">182</span>–<span class="cit-lpage">184</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>2643620</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jcm&amp;resid=27/1/182"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.13"
+                             data-doi="10.1186/1471-2431-12-194">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Myléus</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hernell</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gothefors</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hammarström</span>,  <span class="cit-name-given-names">M.-L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Persson</span>,  <span class="cit-name-given-names">L.-Å.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stenlund</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ivarsson</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Early infections are associated with increased risk for celiac disease: an incident case-referent study</span>. <abbr class="cit-jnl-abbrev">BMC Pediatr</abbr> <span class="cit-vol">12</span>, <span class="cit-fpage">194</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1186/1471-2431-12-194</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23249321</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1186/1471-2431-12-194&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23249321&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Early%20infections%20are%20associated%20with%20increased%20risk%20for%20celiac%20disease%3A%20an%20incident%20case-referent%20study&amp;author=A.%20Myl%C3%A9us&amp;author=O.%20Hernell&amp;author=L.%20Gothefors&amp;author=M.-L.%20Hammarstr%C3%B6m&amp;author=L.-%C3%85.%20Persson&amp;author=H.%20Stenlund&amp;author=A.%20Ivarsson&amp;publication_year=2012&amp;journal=BMC%20Pediatr&amp;volume=12&amp;pages=194&amp;doi=10.1186%2F1471-2431-12-194&amp;pmid=23249321">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.14"
+                             data-doi="10.1017/S0007114512005521">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Olivares</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Laparra</span>,  <span class="cit-name-given-names">J. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sanz</span>,  <span class="cit-name-given-names">Y.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title">Host genotype, intestinal microbiota and inflammatory disorders</span>. <abbr class="cit-jnl-abbrev">Br J Nutr</abbr> <span class="cit-vol">109</span> (<span class="cit-supplement">Suppl 2</span>), <span class="cit-fpage">S76</span>–<span class="cit-lpage">S80</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1017/S0007114512005521</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23360883</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1017/S0007114512005521&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23360883&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Host%20genotype%2C%20intestinal%20microbiota%20and%20inflammatory%20disorders&amp;author=M.%20Olivares&amp;author=J.%20M.%20Laparra&amp;author=Y.%20Sanz&amp;publication_year=2013&amp;journal=Br%20J%20Nutr&amp;volume=109&amp;pages=S76-S80&amp;doi=10.1017%2FS0007114512005521&amp;pmid=23360883">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.15"
+                             data-doi="10.1542/peds.2007-2989">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Olsson</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hernell</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hörnell</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lönnberg</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ivarsson</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Difference in celiac disease risk between Swedish birth cohorts suggests an opportunity for primary prevention</span>. <abbr class="cit-jnl-abbrev">Pediatrics</abbr> <span class="cit-vol">122</span>, <span class="cit-fpage">528</span>–<span class="cit-lpage">534</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1542/peds.2007-2989</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18762522</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=pediatrics&amp;resid=122/3/528"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.16"
+                             data-doi="10.1038/ajg.2009.524">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ou</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hedberg</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hörstedt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baranov</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Forsberg</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Drobni</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sandström</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wai</span>,  <span class="cit-name-given-names">S. N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Johansson</span>,  <span class="cit-name-given-names">I.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Proximal small intestinal microbiota and identification of rod-shaped bacteria associated with childhood celiac disease</span>. <abbr class="cit-jnl-abbrev">Am J Gastroenterol</abbr> <span class="cit-vol">104</span>, <span class="cit-fpage">3058</span>–<span class="cit-lpage">3067</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/ajg.2009.524</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19755974</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/ajg.2009.524&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=19755974&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Proximal%20small%20intestinal%20microbiota%20and%20identification%20of%20rod-shaped%20bacteria%20associated%20with%20childhood%20celiac%20disease&amp;author=G.%20Ou&amp;author=M.%20Hedberg&amp;author=P.%20H%C3%B6rstedt&amp;author=V.%20Baranov&amp;author=G.%20Forsberg&amp;author=M.%20Drobni&amp;author=O.%20Sandstr%C3%B6m&amp;author=S.%20N.%20Wai&amp;author=I.%20Johansson&amp;publication_year=2009&amp;journal=Am%20J%20Gastroenterol&amp;volume=104&amp;pages=3058-3067&amp;doi=10.1038%2Fajg.2009.524&amp;pmid=19755974">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.17"
+                             data-doi="10.1099/jmm.0.020420-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sakamoto</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ohkuma</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Usefulness of the <em>hsp60</em> gene for the identification and classification of Gram-negative anaerobic rods</span>. <abbr class="cit-jnl-abbrev">J Med Microbiol</abbr> <span class="cit-vol">59</span>, <span class="cit-fpage">1293</span>–<span class="cit-lpage">1302</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/jmm.0.020420-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20671088</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=medmicro&amp;resid=59/11/1293"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.18"
+                             data-doi="10.1093/nar/gkp967">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sayers</span>,  <span class="cit-name-given-names">E. W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Barrett</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Benson</span>,  <span class="cit-name-given-names">D. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bolton</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bryant</span>,  <span class="cit-name-given-names">S. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Canese</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chetvernin</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Church</span>,  <span class="cit-name-given-names">D. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dicuccio</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Database resources of the National Center for Biotechnology Information</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">38</span> (<span class="cit-supplement">Database issue</span>), <span class="cit-fpage">D5</span>–<span class="cit-lpage">D16</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkp967</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19910364</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=38/suppl_1/D5"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-19-1" title="View reference  in text"
+                           id="ref-19">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.19"
+                             data-doi="10.1099/00207713-40-2-205">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Shah</span>,  <span class="cit-name-given-names">H. N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Collins</span>,  <span class="cit-name-given-names">D. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1990</span><strong>).</strong> <span class="cit-article-title"><em>Prevotella</em>, a new genus to include <em>Bacteroides melaninogenicus</em> and related species formerly classified in the genus <em>Bacteroides</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">40</span>, <span class="cit-fpage">205</span>–<span class="cit-lpage">208</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-40-2-205</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>2223612</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=40/2/205"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.20"
+                             data-doi="10.1099/00207713-44-4-846">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Goebel</span>,  <span class="cit-name-given-names">B. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Taxonomic note: a place for DNA-DNA reassociation and 16S rRNA sequence analysis in the present species definition in bacteriology</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">44</span>, <span class="cit-fpage">846</span>–<span class="cit-lpage">849</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-44-4-846</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=44/4/846"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4218.21"
+                             data-doi="10.1016/j.syapm.2008.07.002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Urdiain</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">López-López</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gonzalo</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Busse</span>,  <span class="cit-name-given-names">H. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Langer</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kämpfer</span>,  <span class="cit-name-given-names">P.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rosselló-Móra</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Reclassification of <em>Rhodobium marinum</em> and <em>Rhodobium pfennigii</em> as <em>Afifella marina</em> gen. nov. comb. nov. and <em>Afifella pfennigii</em> comb. nov., a new genus of photoheterotrophic <em>Alphaproteobacteria</em> and emended descriptions of <em>Rhodobium</em>, <em>Rhodobium orientis</em> and <em>Rhodobium gokarnense</em></span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">31</span>, <span class="cit-fpage">339</span>–<span class="cit-lpage">351</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.syapm.2008.07.002</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18774253</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.syapm.2008.07.002&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=18774253&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Reclassification%20of%20Rhodobium%20marinum%20and%20Rhodobium%20pfennigii%20as%20Afifella%20marina%20gen.%20nov.%20comb.%20nov.%20and%20Afifella%20pfennigii%20comb.%20nov.%2C%20a%20new%20genus%20of%20photoheterotrophic%20Alphaproteobacteria%20and%20emended%20descriptions%20of%20Rhodobium%2C%20Rhodobium%20orientis%20and%20Rhodobium%20gokarnense&amp;author=M.%20Urdiain&amp;author=A.%20L%C3%B3pez-L%C3%B3pez&amp;author=C.%20Gonzalo&amp;author=H.%20J.%20Busse&amp;author=S.%20Langer&amp;author=P.%20K%C3%A4mpfer&amp;author=R.%20Rossell%C3%B3-M%C3%B3ra&amp;publication_year=2008&amp;journal=Syst%20Appl%20Microbiol&amp;volume=31&amp;pages=339-351&amp;doi=10.1016%2Fj.syapm.2008.07.002&amp;pmid=18774253">Google Scholar</a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4207.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4224.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="open-access-note">
+               <span class="open-access-note">OPEN ACCESS ARTICLE</span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    <span class="slug-metadata-note ahead-of-print">
+                                 	
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">June 21, 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.052647-0" class="slug-doi">10.1099/ijs.0.052647-0
+                                    </span>
+                                 </span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4218-4223
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li><span class="creative-commons-article">Free via Creative Commons: <span>CC</span></span></li>
+                        <li><span class="ccv cc-version-by/2.5/"></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_11/4218.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4218.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_11/4218/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_11/4218">PPT Slides of All Figures</a></li>
+                        <li class="cb-versions">
+                           <div><span id="pap-all-versions-label">All Versions of this Article:</span><ol class="version-list">
+                                 <li><a href="/content/early/2013/06/18/ijs.0.052647-0">ijs.0.052647-0v1</a></li>
+                                 <li class="current-li"><span>63/Pt_11/4218</span> <span class="current-version">most recent</span></li>
+                              </ol>
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings">
+                              <li>New Taxa
+                                 <ul class="subject-sub-headings last-child">
+                                    <li><a class="tocsection-search"
+                                          href="/search?tocsectionid=Bacteroidetes&amp;sortspec=date&amp;submit=Submit">Bacteroidetes</a></li>
+                                 </ul>
+                              </li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4218&amp;current-view-path=/content/63/Pt_11/4218.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4218&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4218.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4218&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4218.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.052647-0&amp;citation=Hedberg%20et%20al.%2063%20%28Pt%2011%29:%204218&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4218&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=23793857&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4218">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4218.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4218#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4218" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4218&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4218.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AHedberg%20author%3AM.E.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Hedberg, M. E.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AHammarstr%C3%B6m%20author%3AS.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Hammarström, S.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4218.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=23793857&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Hedberg%20ME&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Hedberg, M. E.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Hammarstr%C3%B6m%20S&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Hammarström, S.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/23793857"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4218.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4218#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4218&amp;title=Prevotella%20jejuni%20sp.%20nov.%2C%20isolated%20from%20the%20small%20intestine%20of%20a%20child%20with%20coeliac%20disease+--+Hedberg%20et%20al.%2063%20%28Pt%2011%29%3A%204218+--+IJSEM&amp;doi=10.1099/ijs.0.052647-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org">Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.pdf
new file mode 100644
index 00000000..8cc6e132
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/ijs052647_forPAP.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/ijs052647_forPAP.pdf
new file mode 100644
index 00000000..258deb4f
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4218.full/ijs052647_forPAP.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F5.large.jpg b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F5.large.jpg
new file mode 100644
index 00000000..a272e3c4
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/F5.large.jpg differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.html b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.html
new file mode 100644
index 00000000..f411ba32
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.html
@@ -0,0 +1,2072 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Molecular and phenotypic analyses reveal the non-identity of the Phaeobacter gallaeciensis type strain deposits CIP 105210T
+         and DSM 17395 
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4340" />
+      <meta content="/ijs/63/Pt_11/4340.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Molecular and phenotypic analyses reveal the non-identity of the Phaeobacter gallaeciensis type strain deposits CIP 105210T and DSM 17395"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.053900-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Nora Buddruhs" name="DC.Contributor" />
+      <meta content="Silke Pradella" name="DC.Contributor" />
+      <meta content="Markus Göker" name="DC.Contributor" />
+      <meta content="Orsola Päuker" name="DC.Contributor" />
+      <meta content="Rüdiger Pukall" name="DC.Contributor" />
+      <meta content="Cathrin Spröer" name="DC.Contributor" />
+      <meta content="Peter Schumann" name="DC.Contributor" />
+      <meta content="Jörn Petersen" name="DC.Contributor" />
+      <meta content="Thorsten Brinkhoff" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Nora Buddruhs" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Silke Pradella" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Markus Göker" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Orsola Päuker" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Rüdiger Pukall" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Cathrin Spröer" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Peter Schumann" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Jörn Petersen" />
+      <meta name="citation_author_institution"
+            content="1Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany" />
+      <meta name="citation_author" content="Thorsten Brinkhoff" />
+      <meta name="citation_author_institution"
+            content="2Institute for Chemistry and Biology of the Marine Environment, University of Oldenburg, Oldenburg, Germany" />
+      <meta content="Molecular and phenotypic analyses reveal the non-identity of the Phaeobacter gallaeciensis type strain deposits CIP 105210T and DSM 17395"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4340" name="citation_firstpage" />
+      <meta content="4349" name="citation_lastpage" />
+      <meta content="63/Pt_11/4340" name="citation_id" />
+      <meta content="63/Pt 11/4340" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4340" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.053900-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4340.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4340.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4340.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4340"
+            name="citation_public_url" />
+      <meta content="24187021" name="citation_pmid" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Taxonomic Note" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4330.short" rel="prev" />
+      <link href="/content/63/Pt_11/4350.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d7496846e1">var callbackToken='5634D5117134042';</script><script type="text/javascript" id="session-d7496846e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search-go" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4340.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline">Molecular and phenotypic analyses reveal the non-identity of the <em>Phaeobacter gallaeciensis</em> type strain deposits CIP 105210<sup>T</sup> and DSM 17395
+               </h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Nora+Buddruhs&amp;sortspec=date&amp;submit=Submit">Nora Buddruhs</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-1" class="xref-fn" href="#fn-1">†</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Silke+Pradella&amp;sortspec=date&amp;submit=Submit">Silke Pradella</a></span><a id="xref-aff-1-2" class="xref-aff" href="#aff-1"><sup>1</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-2" class="xref-fn" href="#fn-1">†</a>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Markus+G%C3%B6ker&amp;sortspec=date&amp;submit=Submit">Markus Göker</a></span><a id="xref-aff-1-3" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-4" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Orsola+P%C3%A4uker&amp;sortspec=date&amp;submit=Submit">Orsola Päuker</a></span><a id="xref-aff-1-4" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-5" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=R%C3%BCdiger+Pukall&amp;sortspec=date&amp;submit=Submit">Rüdiger Pukall</a></span><a id="xref-aff-1-5" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-6" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Cathrin+Spr%C3%B6er&amp;sortspec=date&amp;submit=Submit">Cathrin Spröer</a></span><a id="xref-aff-1-6" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-7" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Peter+Schumann&amp;sortspec=date&amp;submit=Submit">Peter Schumann</a></span><a id="xref-aff-1-7" class="xref-aff" href="#aff-1"><sup>1</sup></a>, 
+                     </li>
+                     <li class="contributor" id="contrib-8" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=J%C3%B6rn+Petersen&amp;sortspec=date&amp;submit=Submit">Jörn Petersen</a></span><a id="xref-aff-1-8" class="xref-aff" href="#aff-1"><sup>1</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-9"><span class="name"><a class="name-search"
+                              href="/search?author1=Thorsten+Brinkhoff&amp;sortspec=date&amp;submit=Submit">Thorsten Brinkhoff</a></span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures, Braunschweig, Germany
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>Institute for Chemistry and Biology of the Marine Environment, University of Oldenburg, Oldenburg, Germany
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> Jörn Petersen <span class="em-link"><span class="em-addr">joern.petersen{at}dsmz.de</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-4">The marine genus <span class="named-content genus" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> currently comprises six species, some of which were intensively studied mainly due to their ability to produce secondary
+                     metabolites. The type strain of the type species, <span class="named-content species" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>Phaeobacter gallaeciensis</em></a></span> BS107<sup>T</sup>, has been deposited at several public culture collections worldwide. Based on differences in plasmid profiles, we detected
+                     that the alleged <span class="named-content species" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> type strains deposited at the Collection Institute Pasteur (CIP; Paris, France) as CIP 105210 and at the German Collection
+                     of Microorganisms and Cell Cultures (DSMZ; Braunschweig, Germany) as DSM 17395 are not identical. To determine the identity
+                     of these strains, we conducted DNA–DNA hybridization, matrix-assisted laser desorption/ionization time-of-flight mass spectrometry
+                     (MALDI-TOF), 16S rRNA gene and internal transcribed spacer (ITS) sequence analyses, as well as physiological experiments.
+                     Based on the detailed 16S rRNA gene reanalysis we showed that strain CIP 105210 most likely corresponds to the original <span class="named-content species" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> type strain BS107<sup>T</sup>. In contrast, the <span class="named-content genus" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain DSM 17395 exhibits a much closer affiliation to <span class="named-content species" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter inhibens"
+                           href="doi:10.1601/nm.10132"><em>Phaeobacter inhibens</em></a></span> DSM 16374<sup>T</sup> ( = T5<sup>T</sup>) and should thus be allocated to this species. The detection of the dissimilarity of strains CIP 105210<sup>T</sup> and DSM 17395 will influence future comparative studies within the genus <span class="named-content genus" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span>.
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Introduction" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-equal" id="fn-1">
+                        <p id="p-1"><a class="rev-xref" href="#xref-fn-1-1">↵</a><span class="fn-label">†</span> These authors contributed equally to this work.
+                        </p>
+                     </li>
+                     <li class="fn-other" id="fn-2">
+                        <p id="p-2">The GenBank/EMBL/DDBJ accession numbers for the 16S rRNA gene sequences of the <span class="named-content genus" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup>, DSM 16374<sup>T</sup>, DSM 17395 and DSM 24564<sup>T</sup> are KC176239, KC176240, KC176241 and KC176242, respectively. The GenBank/EMBL/DDBJ accession numbers for the 16S–23S rRNA
+                           gene internal transcribed spacer of the <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup>, DSM 16374<sup>T</sup>, DSM 17395, DSM 23529<sup>T</sup>, DSM 23566<sup>T</sup>, DSM 24564<sup>T</sup> and DSM 25627<sup>T</sup> are KC176233, KC176234, KC176235, KC176236, KC176237, KC176238 and KC907729, respectively.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-3">
+                        <p id="p-3">Four supplementary figures and four supplementary tables are available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="section intro" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-2" title="Methods" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  <h2>Introduction</h2>
+                  
+                  <p id="p-13">The genus <span class="named-content genus" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span><em>,</em> currently comprising the species <span class="named-content species" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>Phaeobacter gallaeciensis</em></a></span>, <span class="named-content species" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>, <span class="named-content species" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                           href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span><em>,</em> <span class="named-content species" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="P. caeruleus"
+                           href="doi:10.1601/nm.14301"><em>P. caeruleus</em></a></span>, <span class="named-content species" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="P. arcticus"
+                           href="doi:10.1601/nm.14057"><em>P. arcticus</em></a></span> and <span class="named-content species" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                           href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> (<a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Gaboyer <em>et al.</em>, 2013</a>), belongs to the marine <span class="named-content genus" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter"
+                           href="doi:10.1601/nm.1134"><em>Roseobacter</em></a></span> clade. It was established by <a id="xref-ref-25-1" class="xref-bibr" href="#ref-25">Martens <em>et al.</em> (2006)</a> after reclassification of <span class="named-content species" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter gallaeciensis"
+                           href="doi:10.1601/nm.1138"><em>Roseobacter gallaeciensis</em></a></span> (<a id="xref-ref-34-1" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em>, 1998</a>) as <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>, which is the type species of the genus, and description of <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> as a new species. During recent years, <span class="named-content genus" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains have received a lot of interest due to the production of various secondary metabolites (e.g. <a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Berger <em>et al.</em>, 2011</a>, <a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">2012</a>; <a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Brinkhoff <em>et al.</em>, 2004</a>; <a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Bruhn <em>et al.</em>, 2007</a>; <a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Geng <em>et al.</em>, 2008</a>; <a id="xref-ref-26-1" class="xref-bibr" href="#ref-26">Martens <em>et al.</em>, 2007</a>; <a id="xref-ref-35-1" class="xref-bibr" href="#ref-35">Seyedsayamdost <em>et al.</em>, 2011a</a>, <a id="xref-ref-36-1" class="xref-bibr" href="#ref-36">b</a>).
+                  </p>
+                  
+                  <p id="p-14">Recently the genomes of three <span class="named-content genus" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains have been published, <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> DSM 17395, <span class="named-content species" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> 2.10 (<a id="xref-ref-40-1" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>) and <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> ANG1 (<a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Collins &amp; Nyholm, 2011</a>). However, evidence already indicated that strain ANG1 is more similar to <span class="named-content species" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                           href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> DSM 23529<sup>T</sup> ( = TF-218<sup>T</sup>) than to either DSM 17395 or DSM 24588 ( = 2.10) (unpublished results). Strain 2.10 was previously used in competition experiments
+                     of bacterial biofilms on the thalloid green alga <em>Ulva australis</em> (<a id="xref-ref-32-1" class="xref-bibr" href="#ref-32">Rao <em>et al.</em>, 2005</a>). Various physiological and genetic aspects of <span class="named-content species" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> DSM 17395 have also been studied, such as the pathway and substrate specificity of the algal metabolite dimethylsulfoniopropionate
+                     (DMSP) catabolism (<a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Dickschat <em>et al.</em>, 2010</a>), the compatibility of the plasmids (<a id="xref-ref-28-1" class="xref-bibr" href="#ref-28">Petersen, 2011</a>), and the primary metabolism by proteome analyses (<a id="xref-ref-44-1" class="xref-bibr" href="#ref-44">Zech <em>et al.</em>, 2009</a>).
+                  </p>
+                  
+                  <p id="p-15">With the description of the species <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> (basonym <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="R. gallaeciensis"
+                           href="doi:10.1601/nm.1138"><em>R. gallaeciensis</em></a></span>) in 1998, the type strain BS107<sup>T</sup> was primarily deposited at the Collection Institute Pasteur (CIP; Paris, France) as CIP 105210 (<a id="xref-ref-34-2" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em>, 1998</a>). According to the strain history (<a href="http://www.straininfo.net/strains/620650">http://www.straininfo.net/strains/620650</a>), the CIP referred the strain to the Colección Española de Cultivos Tipo (CECT; Burjassot, Spain) and to the American Type
+                     Culture Collection (ATCC; Manassas, USA), which in turn referred it to the Japan Collection of Micro-organisms at the RIKEN
+                     Bioscience Center (Tsukuba, Japan) followed by a transfer to the NITE (National Institute of Technology and Evaluation) Biological
+                     Resource Center (Kisarazu, Japan). At these culture collections the derivatives of strain CIP 105210 were designated CECT
+                     7277<sup>T</sup>, ATCC 700781<sup>T</sup>, JCM 21319<sup>T</sup> and NBRC 16654<sup>T</sup>, respectively. The Leibniz Institute DSMZ – German Collection of Microorganisms and Cell Cultures (DSMZ; Braunschweig, Germany)
+                     independently requested <span class="named-content species" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup> from the laboratory of the original depositor in 2005 and included it as DSM 17395 in the strain collection. Strain DSM 17395
+                     was subsequently collected by the Laboratorium voor Microbiologie (LMG; Gent, Belgium) and deposited as LMG 24391<sup>T</sup>. When investigating plasmid profiles of various <span class="named-content genus" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, we observed differences between the strains CIP 105210 and DSM 17395 even though both were considered identical
+                     with the type strain BS107<sup>T</sup>. This is critical, as due to the broad scientific interest in the <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> type strain, it was either obtained from the public culture collections or retrieved from other sources several times. For
+                     example, <a id="xref-ref-36-2" class="xref-bibr" href="#ref-36">Seyedsayamdost <em>et al.</em> (2011b)</a> allegedly used strain BS107<sup>T</sup> to investigate the mutualistic or pathogenic symbioses between <span class="named-content species" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> and the unicellular haptophycean alga <em>Emiliania huxleyi</em>. It was indicated that these authors received the strain BS107<sup>T</sup> from a collaborating laboratory; hence the biological identity of the strain used is ultimately unclear.
+                  </p>
+                  
+                  <p id="p-16">In this study, we consequently reassessed the biological identity of these strains. We compared in detail the characteristics
+                     of the strains CIP 105210 and DSM 17395 with those of the description of BS107<sup>T</sup> given by <a id="xref-ref-34-3" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em> (1998)</a> and with those of other closely related <span class="named-content genus" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, i.e. <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> DSM 24588 ( = 2.10; <a id="xref-ref-40-2" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>) and <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> ( = T5<sup>T</sup>; <a id="xref-ref-25-2" class="xref-bibr" href="#ref-25">Martens <em>et al.</em>, 2006</a>). Based on our results, corresponding reclassifications are proposed.
+                  </p>
+                  
+               </div>
+               <div class="section methods" id="sec-2">
+                  <div class="section-nav"><a href="#sec-1" title="Introduction" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-11" title="Results" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  <h2>Methods</h2>
+                  
+                  <div id="sec-3" class="subsection">
+                     
+                     
+                     <div id="sec-4" class="subsection">
+                        
+                        <h4>Source of bacteria and culturing.</h4>
+                        
+                        <p id="p-17">The <span class="named-content genus" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 16374<sup>T</sup> ( = T5<sup>T</sup>), DSM 17395, DSM 23529<sup>T</sup> ( = TF-218<sup>T</sup>), DSM 23566<sup>T</sup> ( = 20188<sup>T</sup>), DSM 24564<sup>T</sup>, DSM 24588 ( = 2.10) and DSM 25627<sup>T</sup> ( = 306<sup>T</sup>) as well as <span class="named-content species" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter litoralis"
+                                 href="doi:10.1601/nm.1135"><em>Roseobacter litoralis</em></a></span> DSM 6996<sup>T</sup>, <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="Marinovum algicola"
+                                 href="doi:10.1601/nm.9794"><em>Marinovum algicola</em></a></span> DSM 10251<sup>T</sup> and <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter denitrificans"
+                                 href="doi:10.1601/nm.1137"><em>Roseobacter denitrificans</em></a></span> DSM 7001<sup>T</sup> were obtained from the DSMZ. The <span class="named-content genus" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain CIP 105210 was obtained from the CIP. Unless otherwise stated, cells were grown in marine broth 2216 (MB; Difco) or
+                           on MB agar at 28 °C (and at 25 °C in case of <span class="named-content species" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                                 href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> DSM 25627<sup>T</sup>).
+                        </p>
+                        
+                     </div>
+                     <div id="sec-5" class="subsection">
+                        
+                        <h4>Profiles of the extrachromosomal elements.</h4>
+                        
+                        <p id="p-18">To analyse the plasmid content of the <span class="named-content genus" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, their high-molecular-mass total genomic DNA was prepared within agarose plugs as previously described and subjected
+                           to pulsed-field gel electrophoresis (PFGE; <a id="xref-ref-30-1" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em>, 2010</a>). PFGE was performed in a contour-clamped homogeneous electric field (CHEF) system on a CHEF-DR III device (Bio-Rad) with
+                           1 % or 1.2 % agarose gels and modified 0.5× TBE buffer (45 mM Tris, 45 mM boric acid, 0.1 mM EDTA) at 14 °C. PFGE parameters,
+                           namely pulse time ramps and run times, were varied both to resolve chromosomal and extrachromosomal DNA and to identify different
+                           plasmid conformations (<a id="xref-ref-33-1" class="xref-bibr" href="#ref-33">Römling <em>et al.</em>, 1996</a>). Two PFGE parameter sets were applied to assess plasmid topology: (i) set A, 1 % (w/v) agarose gel with pulse times of 1
+                           to 48 s for 24 h at 200 V (6 V cm<sup>−1</sup>) and (ii) set B, 1 % (w/v) agarose gel with pulse times of 1 to 20 s for 22 h at 200 V (6 V cm<sup>−1</sup>). At least two PFGE gels were evaluated to determine plasmid sizes. The resulting plasmid profiles were interpreted as described
+                           by <a id="xref-ref-30-2" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em> (2010)</a>. Conventional unidirectional gel electrophoresis of DNA was in 0.8 % agarose gels and 1× TBE (89 mM Tris, 89 mM boric acid,
+                           2 mM EDTA) at 10 °C and 70 mA for 8.5 h. The BAC Tracker supercoiled DNA ladder (from 38 to 120 kb; Epicentre) was used to
+                           size plasmids with covalently closed circular (ccc) DNA topology.
+                        </p>
+                        
+                     </div>
+                     <div id="sec-6" class="subsection">
+                        
+                        <h4>16S rRNA gene and 16S–23S rRNA gene internal transcribed spacer (ITS) analysis.</h4>
+                        
+                        <p id="p-19">The PCR amplification of 16S rRNA genes from the genomic DNA of the <span class="named-content genus" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains was done as described by <a id="xref-ref-31-1" class="xref-bibr" href="#ref-31">Rainey <em>et al.</em> (1996)</a>. For the PCR amplification of the ITS region, the primer pair 16S_1401f 5′-GRGCCTTGYACACACCG-3′ (<a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Lane, 1991</a>) and 23S_130r 5′-GGTTBCCCCATTCRG-3′ (<a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Gürtler &amp; Stanisich, 1996</a>) was used. Resulting PCR products were cycle sequenced with the primers mentioned above in ‘Extended Hot Shot’ reactions
+                           as offered by the Seqlab company, Germany. The sequence analysis tool BioEdit 7.0.1 (<a href="http://www.mbio.ncsu.edu/BioEdit/bioedit.html">http://www.mbio.ncsu.edu/BioEdit/bioedit.html</a>) was utilized for 16S rRNA gene and ITS sequence editing. The accession numbers of retrieved 16S rRNA gene sequences from
+                           <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup> (<a id="xref-ref-34-4" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em>, 1998</a>), <span class="named-content species" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> T5<sup>T</sup> (<a id="xref-ref-25-3" class="xref-bibr" href="#ref-25">Martens <em>et al.</em>, 2006</a>), <span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                                 href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> TF-218<sup>T</sup>, <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="P. arcticus"
+                                 href="doi:10.1601/nm.14057"><em>P. arcticus</em></a></span> 20188<sup>T</sup>, <span class="named-content species" id="named-content-50"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> LSS9 and <span class="named-content species" id="named-content-51"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                                 href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> 306<sup>T</sup> were Y13244, AY177712, NR_044026, NR_043888, GQ906799 and HE661585, respectively. Further 16S rRNA gene or ITS sequences
+                           used in this study were extracted from the genome sequences of <span class="named-content genus" id="named-content-52"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 17395 (ABIF01000000), DSM 24588 ( = 2.10; CP002972–CP002975) and ANG1 (AFCF01000000) using the Integrated Microbial
+                           Genomes (IMG) system (<a href="http://img.jgi.doe.gov/cgi-bin/w/main.cgi">http://img.jgi.doe.gov/cgi-bin/w/main.cgi</a>; <a id="xref-ref-24-1" class="xref-bibr" href="#ref-24">Markowitz <em>et al.</em>, 2012</a>).
+                        </p>
+                        
+                        <p id="p-20">Sequences were aligned with <span class="sc">mafft</span> version 6.850b, using the ‘--<em>genafpair</em>’ option but default settings otherwise (<a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Katoh <em>et al.</em>, 2005</a>). Phylogenetic analysis under the maximum-likelihood (ML) criterion (<a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Felsenstein, 1981</a>) was conducted with RAxML version 7.2.8, using its novel rapid bootstrap option combined with the autoMRE bootstrapping criterion
+                           (<a id="xref-ref-27-1" class="xref-bibr" href="#ref-27">Pattengale <em>et al.</em>, 2010</a>) with subsequent search for the best tree under the GTRMIX approach (<a id="xref-ref-38-1" class="xref-bibr" href="#ref-38">Stamatakis <em>et al.</em>, 2008</a>). Branch-and-bound search for the best trees under the maximum-parsimony (MP) criterion (<a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Fitch, 1971</a>) was done with <span class="sc">paup</span>* version 4.0b10 (<a id="xref-ref-39-1" class="xref-bibr" href="#ref-39">Swofford, 2002</a>), treating gaps as missing data and collapsing branches of zero minimum length; 1000 bootstrap replicates were conducted
+                           in the same manner. The resulting best trees were rooted using the midpoint-rooting method (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Farris, 1972</a>; <a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Hess &amp; De Moraes Russo, 2007</a>).
+                        </p>
+                        
+                     </div>
+                     <div id="sec-7" class="subsection">
+                        
+                        <h4>MALDI-TOF MS protein analysis.</h4>
+                        
+                        <p id="p-21">Whole-cell protein extracts of the <span class="named-content genus" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210, DSM 17395, DSM 24588, DSM 16374<sup>T</sup>, DSM 23529<sup>T</sup>, DSM 23566<sup>T</sup>, DSM 24564<sup>T</sup> and DSM 25627<sup>T</sup> were analysed by matrix-assisted laser desorption/ionization time-of-flight mass spectrometry (MALDI-TOF MS) using a Microflex
+                           L20 mass spectrometer (Bruker Daltonics) equipped with a N<sub>2</sub> laser. Sample preparation for MALDI-TOF MS protein analysis was carried out according to the ethanol/formic acid extraction
+                           protocol recommended by Bruker Daltonics as described in detail by <a id="xref-ref-41-1" class="xref-bibr" href="#ref-41">Tóth <em>et al.</em> (2008)</a>. The MALDI-TOF mass spectra were analysed with the BioTyper software (version 3.0; Bruker Daltonics).
+                        </p>
+                        
+                     </div>
+                     <div id="sec-8" class="subsection">
+                        
+                        <h4>DNA–DNA hybridization (DDH).</h4>
+                        
+                        <p id="p-22">Cells of the <span class="named-content genus" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210, DSM 17395, DSM 16374<sup>T</sup> and DSM 24588 were disrupted by using a Constant Systems TS 0.75 kW (IUL Instruments) and the DNA in the crude lysate was
+                           purified by chromatography on hydroxyapatite as described by <a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Cashion <em>et al.</em> (1977)</a>. DNA–DNA hybridization was carried out as described by <a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">De Ley <em>et al.</em> (1970)</a> and modified by <a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Huß <em>et al.</em> (1983)</a> using a model Cary 100 Bio UV/VIS-spectrophotometer equipped with a Peltier-thermostatted 6×6 multi-cell changer and a temperature
+                           controller with <em>in situ</em> temperature probe (Varian). Each strain was measured in two technical replicates and the mean result was taken.
+                        </p>
+                        
+                     </div>
+                     <div id="sec-9" class="subsection">
+                        
+                        <h4>Growth and hydrolysis experiments.</h4>
+                        
+                        <p id="p-23">To determine the substrate spectrum of the <span class="named-content genus" id="named-content-55"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210 and DSM 17395, cells were grown in artificial seawater (ASW; solution of Sigma sea salts: S9883) supplemented
+                           with 10 mg casein hydrolysate l<sup>−1</sup> (CAS: 65072-00-6; Merck) to avoid auxotrophy and with different carbon sources at a concentration of 0.1 % each, including
+                           2-ketoglutarate, acetate, <span class="sc">l</span>-arabinose, butyrate, cellobiose, citrate, <span class="sc">d</span>-fucose, glucosamine, glycerol, <span class="sc">l</span>-leucine, maltose, <span class="sc">l</span>-rhamnose, <span class="sc">l</span>-serine, <span class="sc">d</span>-sorbitol, succinate, sucrose, trehalose, Tween 20, Tween 40 and Tween 80. The tests were performed in the 24-well microtitre-plate
+                           format. In detail, cells were grown on MB agar for 2 days at 28 °C, then harvested with a sterile swab and inoculated in ASW
+                           medium. The cell suspension was thereby adjusted to a turbidity of 80 % transmittance using a turbidimeter (AES Chemunex BLG
+                           3531). Afterwards, 2 ml of each suspension was pipetted into a 24-well microtitre plate (Greiner). A sample lacking any carbon
+                           source was included as negative control. Cells were incubated in a microtitre plate reader (Infinite F200 pro; Tecan) at 23
+                           °C and with shaking at 88 r.p.m. for 7 days. Growth was automatically measured every 15 min with the Infinite F200 system
+                           as increase of the OD<sub>600</sub>. Growth at temperatures of 4 °C and 37 °C was determined in 200 ml MB within Erlenmeyer flasks for one month and measured
+                           photometrically as increase of the OD<sub>600</sub> using an Ultrospec II spectrophotometer (LKB-Biochrom).
+                        </p>
+                        
+                        <p id="p-24">Exoenzyme activities (hydrolysis of gelatin, starch and Tween 80) were analysed using MB solidified with 4 % (w/v) gelatin
+                           or 1.5 % (w/v) agarose and supplemented with 0.2 % (w/v) starch and 1 % (v/v) Tween 80, respectively, as described by <a id="xref-ref-37-1" class="xref-bibr" href="#ref-37">Smibert &amp; Krieg (1981)</a>. As a positive control, <span class="named-content species" id="named-content-56"><a class="namesforlife" rel="namesforlife-name" title="R. litoralis"
+                                 href="doi:10.1601/nm.1135"><em>R. litoralis</em></a></span> DSM 6996<sup>T</sup> was used for gelatin and Tween 80 hydrolysis and <span class="named-content species" id="named-content-57"><a class="namesforlife" rel="namesforlife-name" title="M. algicola"
+                                 href="doi:10.1601/nm.9794"><em>M. algicola</em></a></span> DSM 10251<sup>T</sup> for starch hydrolysis. Reduction of nitrate was tested according to <a id="xref-ref-37-2" class="xref-bibr" href="#ref-37">Smibert &amp; Krieg (1981)</a> in MB supplemented with 0.1 % (w/v) potassium nitrate; <span class="named-content species" id="named-content-58"><a class="namesforlife" rel="namesforlife-name" title="R. denitrificans"
+                                 href="doi:10.1601/nm.1137"><em>R. denitrificans</em></a></span> DSM 7001<sup>T</sup> served as a negative control. The assays were incubated for 7 days at 28 °C, except for the hydrolysis of starch, conducted
+                           at 20 °C. The growth and hydrolysis tests described above were all performed in three technical replicates.
+                        </p>
+                        
+                     </div>
+                     <div id="sec-10" class="subsection">
+                        
+                        <h4>Phenotype MicroArray (PM) experiments.</h4>
+                        
+                        <p id="p-25">To determine the metabolic properties of the <span class="named-content genus" id="named-content-59"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210, DSM 17395, DSM 24588 and DSM 16374<sup>T</sup> we used the PM technology (Biolog; <a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Bochner, 2009</a>). The <span class="named-content genus" id="named-content-60"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains were grown on MB agar for 48 h and subsequently analysed using the Phenotype MicroArray MicroPlate PM01 and PM02-A
+                           (AES Chemunex BLG 12111, BLG 12112) over 70 h; thus 190 different carbon sources were tested. Each strain was measured in
+                           three biological replicates. The inoculation medium was modified according to the requirements of marine bacteria, i.e. 10
+                           ml of the inoculation fluid IF-0a (AES Chemunex BLG 72268) was supplemented with 1200 µl artificial seawater stock solution,
+                           120 µl vitamin stock solution, 12 µl trace element stock solution, 120 µl NaHCO<sub>3</sub> buffer, 428 µl ultrapure H<sub>2</sub>O and 120 µl DyeD (AES Chemunex BLG 74224). The stock solutions had the following composition (l<sup>−1</sup>): (i) artificial seawater stock solution: 200 g NaCl, 40 g Na<sub>2</sub>SO<sub>4</sub>, 30 g MgCl<sub>2</sub> . 6H<sub>2</sub>O, 5 g KCl, 2.5 g NH<sub>4</sub>Cl, 2 g KH<sub>2</sub>PO<sub>4</sub>, 1.5 g CaCl<sub>2</sub> . 2H<sub>2</sub>O; (ii) trace element stock solution: 2.1 g FeSO<sub>4</sub> . 7H<sub>2</sub>O, 13 ml 25 % HCl, 5.2 g Titriplex III (Na<sub>2</sub>EDTA; adjust pH to 6.0–6.5 to resolve), 190 mg CoCl<sub>2</sub> . 6H<sub>2</sub>O, 144 mg ZnSO<sub>4</sub> . 7H<sub>2</sub>O, 100 mg MnCl<sub>2</sub> . 4H<sub>2</sub>O, 36 mg Na<sub>2</sub>MoO<sub>4</sub> . 2H<sub>2</sub>O, 30 mg H<sub>3</sub>BO<sub>3</sub>, 24 mg NiCl<sub>2</sub> . 6H<sub>2</sub>O, 2 mg CuCl<sub>2</sub> . 2H<sub>2</sub>O; (iii) vitamin stock solution: 100 mg thiamine, 20 mg niacin, 8 mg 4-aminobenzoic acid, 2 mg biotin; and (iv) buffer stock
+                           solution: 19 g NaHCO<sub>3</sub>.
+                        </p>
+                        
+                        <p id="p-26">The cells were suspended in the modified inoculation medium using a sterile swab. The turbidity was adjusted to a cell density
+                           of 85 % transmittance using a turbidimeter (AES Chemunex BLG 3531) and 100 µl of the cell suspension was pipetted into each
+                           of the wells. The MicroPlates were sealed with Parafilm, incubated at 28 °C and measured in the Omnilog unit (Biolog). The
+                           results were analysed using the R package ‘<em>opm</em>’ (<a id="xref-ref-42-1" class="xref-bibr" href="#ref-42">Vaas <em>et al.</em>, 2012</a>). The curve parameter maximum height (A) was estimated for each substrate, differences were visualized using heat maps, and
+                           the data were discretized into negative, ambiguous and positive reactions using the built-in functions of ‘<em>opm</em>’ under default settings.
+                        </p>
+                        
+                     </div>
+                  </div>
+               </div>
+               <div class="section results" id="sec-11">
+                  <div class="section-nav"><a href="#sec-2" title="Methods" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-19" title="Discussion" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  <h2>Results</h2>
+                  
+                  <div id="sec-12" class="subsection">
+                     
+                     <h3>Profiles of the extrachromosomal elements</h3>
+                     
+                     <p id="p-27">The high-molecular-mass genomic DNA of different <span class="named-content genus" id="named-content-61"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains was separated with PFGE. A representative PFGE gel resolving linear DNA molecules in the size range from 23 to 533
+                        kb is shown in <a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1(a)</a>. In addition to the chromosomes (<a id="xref-fig-1-2" class="xref-fig" href="#F1">Fig. 1a</a>, Chr) a distinct number of extrachromosomal bands was revealed for each of the strains CIP 105210, DSM 17395, DSM 24588 and
+                        DSM 16374<sup>T</sup>. To determine the conformation of the detected extrachromosomal DNA (ccc versus linear; <a id="xref-ref-30-3" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em>, 2010</a>; <a id="xref-ref-33-2" class="xref-bibr" href="#ref-33">Römling <em>et al.</em>, 1996</a>), we varied the PFGE conditions (PFGE parameter set A and B) in different gel runs. Using PFGE parameter set A, the fuzzy,
+                        faint bands within the lanes of strains CIP 105210 and DSM 17395 (<a id="xref-fig-1-3" class="xref-fig" href="#F1">Fig. 1a</a>, marked a, b and c, respectively) ran at approximately 319 (a) and 380 (b, c) kb (<a id="xref-fig-1-4" class="xref-fig" href="#F1">Fig. 1a</a>). With PFGE parameter set B (data not shown) band (a) ran at 184 kb and bands (b) and (c) ran at approximately 210 kb indicating
+                        that the respective bands migrated independently of the PFGE parameters applied. From this anomalous migration behaviour we
+                        concluded that the inherent DNA had a circular conformation. The sizes of the detected ccc DNA were estimated as 66 (a) and
+                        79 (b, c) kb by conventional electrophoresis using the BAC Tracker as ccc size marker (data not shown). As these sizes were
+                        close to those estimated for the linearized plasmids of 64 and 77 kb in <span class="named-content genus" id="named-content-62"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain CIP 105210 and 75 kb in strain DSM 17395 (see below), it is most likely that they represent the same plasmids in different
+                        conformations.
+                     </p>
+                     
+                     <div id="F1" class="fig pos-float type-figure  odd">
+                        <div class="fig-inline"><a href="4340/F1.expansion.html"><img alt="Fig. 1. " src="4340/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                 <li><a href="4340/F1.expansion.html">In this window</a></li>
+                                 <li><a class="in-nw" href="4340/F1.expansion.html">In a new window</a></li>
+                              </ul>
+                              <ul class="fig-services">
+                                 <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F1">Download as PowerPoint Slide</a></li>
+                              </ul>
+                           </div>
+                        </div>
+                        <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                           
+                           <p id="p-28" class="first-child">(a) PFGE plasmid profiles of the <span class="named-content genus" id="named-content-63"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                    href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup>, DSM 17395, DSM 24588 and DSM 16374<sup>T</sup> based on uncut high-molecular-mass genomic DNA. (b) Calculated plasmid sizes as mean values taken from at least two different
+                              gel runs. The PFGE conditions were: 1 % (w/v) agarose gel with pulse times of 1 to 48 s for 24 h at 200 V (6 V cm<sup>−1</sup>). Chr, chromosomal DNA; λ, lambda phage concatemers as molecular-mass PFGE markers (New England Biolabs); li, linear. <sup>(*)</sup>, The two largest plasmids (linearized forms) of <span class="named-content genus" id="named-content-64"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                    href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup> and DSM 17395 migrated about the same distance in the gel and thus seemed to have an identical size. In contrast, both bands
+                              could be clearly distinguished by their size in other PFGE runs (data not shown) using different DNA sample preparations.
+                              DNA mobility is largely influenced by the DNA concentration of the sample. The observed discrepancy can thus be explained
+                              by the relatively high DNA concentration in CIP 105210<sup>T</sup> (compared to DSM 17395<sup>T</sup>), which retards band migration (<a id="xref-ref-33-3" class="xref-bibr" href="#ref-33">Römling <em>et al.</em>, 1996</a>). <sup>(†) (‡)</sup>, The PFGE-based plasmid size estimations of 75 and 63 kb of DSM 17395 correspond to the plasmid sizes of 78 and 65 kb, respectively,
+                              determined by genome sequencing (<a id="xref-ref-40-3" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>; NC_018287.1, NC_018288.1). <sup>(§)</sup>, The 36 kb plasmid of <span class="named-content species" id="named-content-65"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                    href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup> had a very low fluorescence intensity and is thus hardly visible on the gel image. ++, The 77 kb band of strain CIP 105210<sup>T</sup> showed increased fluorescence intensity and presumably represents a double band (plasmid duplet).
+                           </p>
+                           
+                           <div class="sb-div caption-clear"></div>
+                        </div>
+                     </div>
+                     
+                     <p id="p-29">By contrast, the sharp bands between 23 kb and 262 kb were separated strictly in accordance with their size when PFGE parameter
+                        sets A and B were used. They were thus assumed to be linear (li, <a id="xref-fig-1-5" class="xref-fig" href="#F1">Fig. 1a</a>), most probably originating from randomly linearized ccc plasmids (<a id="xref-ref-30-4" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em>, 2010</a>).
+                     </p>
+                     
+                     <p id="p-30">Regarding the linearized plasmid fraction of the <span class="named-content genus" id="named-content-66"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, which was very well suited to determine the plasmid complement of the strains and their sizes (<a id="xref-ref-30-5" class="xref-bibr" href="#ref-30">Pradella <em>et al.</em>, 2010</a>), seven extrachromosomal replicons were evident in <span class="named-content species" id="named-content-67"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                              href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210, four in <span class="named-content species" id="named-content-68"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                              href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> and three in the strains DSM 17395 and DSM 24588. The estimated sizes of the detected plasmids (17 altogether) ranged from
+                        36 to 262 kb (<a id="xref-fig-1-6" class="xref-fig" href="#F1">Fig. 1b</a>). They were all different, but their size distribution in the individual strains showed some similarity, i.e. all <span class="named-content genus" id="named-content-69"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains have one large plasmid (262, 253, 239 and 227 kb in strains DSM 17395, CIP 105210, DSM 24588 and DSM 16374<sup>T</sup>, respectively) and two or three smaller ones in the size range between 63 and 77 kb. Our PFGE analysis thus indicated that
+                        the <span class="named-content genus" id="named-content-70"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210 and DSM 17395 – both deposited as type strain of <span class="named-content species" id="named-content-71"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter gallaeciensis"
+                              href="doi:10.1601/nm.9798"><em>Phaeobacter gallaeciensis</em></a></span> – are not identical.
+                     </p>
+                     
+                  </div>
+                  <div id="sec-13" class="subsection">
+                     
+                     <h3>Classification of the <span class="named-content genus" id="named-content-72"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains using 16S rRNA gene sequence, MALDI-TOF MS protein and 16S–23S rRNA gene ITS analyses
+                     </h3>
+                     
+                     <div id="sec-14" class="subsection">
+                        
+                        <h4>16S rRNA gene sequence analysis.</h4>
+                        
+                        <p id="p-31">We re-evaluated the phylogenetic relationships of the <span class="named-content genus" id="named-content-73"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains and therefore resequenced the PCR-amplified 16S rRNA genes of strains DSM 17395, DSM 16374<sup>T</sup> and CIP 105210. In the phylogenetic tree inferred from 16S rRNA gene sequences of representative members of the genus <span class="named-content genus" id="named-content-74"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span>, as well as strains DSM 24588 ( = 2.10), ANG1 and LSS9, for which finished or draft genome sequences exist (<a id="xref-ref-9-2" class="xref-bibr" href="#ref-9">Collins &amp; Nyholm, 2011</a>; <a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Fernandes <em>et al.</em>, 2011</a>; <a id="xref-ref-40-4" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>; <a id="xref-fig-2-1" class="xref-fig" href="#F2">Fig. 2</a>), the <span class="named-content genus" id="named-content-75"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 17395, DSM 24588 ( = 2.10), DSM 16374<sup>T</sup> and CIP 105210 clustered together (<span class="named-content species" id="named-content-76"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>/<span class="named-content species" id="named-content-77"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> cluster) and were well separated from the <span class="named-content species" id="named-content-78"><a class="namesforlife" rel="namesforlife-name" title="P. arcticus"
+                                 href="doi:10.1601/nm.14057"><em>P. arcticus</em></a></span><em>/</em><span class="named-content species" id="named-content-79"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                                 href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> lineage and the branch formed by <span class="named-content species" id="named-content-80"><a class="namesforlife" rel="namesforlife-name" title="P. caeruleus"
+                                 href="doi:10.1601/nm.14301"><em>P. caeruleus</em></a></span>, <span class="named-content species" id="named-content-81"><em>Phaeobacter</em> sp.</span> ANG1 and <span class="named-content species" id="named-content-82"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                                 href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> (16S rRNA gene identity ≥97.8 %). Within the <span class="named-content species" id="named-content-83"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>/<span class="named-content species" id="named-content-84"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> cluster, the 16S rRNA gene of strain CIP 105210 (KC176239) grouped together with the originally deposited BS107<sup>T</sup> sequence (Y13244), exhibiting 72 % and 91 % support from MP and ML bootstrapping, respectively. The 16S rRNA gene sequences
+                           of the <span class="named-content genus" id="named-content-85"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 17395, DSM 24588 and DSM 16374<sup>T</sup> (KC176240) were identical and differed by four bases from the <span class="named-content species" id="named-content-86"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210 sequence KC176239 (16S rRNA gene identity of 99.7 %; see below).
+                        </p>
+                        
+                        <div id="F2" class="fig pos-float type-figure  odd">
+                           <div class="fig-inline"><a href="4340/F2.expansion.html"><img alt="Fig. 2. " src="4340/F2.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                    <li><a href="4340/F2.expansion.html">In this window</a></li>
+                                    <li><a class="in-nw" href="4340/F2.expansion.html">In a new window</a></li>
+                                 </ul>
+                                 <ul class="fig-services">
+                                    <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F2">Download as PowerPoint Slide</a></li>
+                                 </ul>
+                              </div>
+                           </div>
+                           <div class="fig-caption"><span class="fig-label">Fig. 2. </span> 
+                              
+                              <p id="p-32" class="first-child">Midpoint-rooted MP phylogeny inferred from 16S rRNA gene sequences of <span class="named-content genus" id="named-content-87"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                       href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains closely related to <span class="named-content species" id="named-content-88"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                       href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> and <span class="named-content species" id="named-content-89"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                       href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>. Branches are scaled in terms of the minimum number of substitutions (using <span class="sc">deltran</span> optimization; <a id="xref-ref-38-2" class="xref-bibr" href="#ref-38">Stamatakis <em>et al.</em>, 2008</a>). Numbers above branches are support values from MP (left) and ML (right) bootstrapping. Original designation of strains
+                                 that are deposited at culture collections is indicated in parentheses; square brackets give the respective accession number.
+                              </p>
+                              
+                              <div class="sb-div caption-clear"></div>
+                           </div>
+                        </div>
+                        
+                        <p id="p-33">Neither the 16S rRNA gene sequence of <span class="named-content species" id="named-content-90"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210 (KC176239) nor the sequence of <span class="named-content species" id="named-content-91"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> (KC176240) was exactly identical to that of the original deposit, <span class="named-content species" id="named-content-92"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup> (Y13244) or <span class="named-content species" id="named-content-93"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> T5<sup>T</sup> (AY177712), respectively (<a id="xref-fig-2-2" class="xref-fig" href="#F2">Fig. 2</a>, Fig. S1 available in IJSEM Online). More precisely, the 16S rRNA gene sequences of the alleged <span class="named-content species" id="named-content-94"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> type strains differed at the base positions (<span class="named-content species" id="named-content-95"><a class="namesforlife" rel="namesforlife-name" title="Escherichia coli"
+                                 href="doi:10.1601/nm.3093"><em>Escherichia coli</em></a></span> numbering; <a id="xref-ref-19-1" class="xref-bibr" href="#ref-19">Gutell <em>et al.</em>, 1994</a>) 47, 260, 777, 928, 930, 1030, 1210 and 1387 (Fig. S1; Table S1); and those of the alleged <span class="named-content species" id="named-content-96"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> type strains at the positions 29, 1210, 1387, 1436, 1459, 1466 and 1480 (Fig. S1; Table S2). We assessed in detail whether
+                           these discrepancies could be caused by sequencing errors, as is already indicated by the long-terminal branches leading to
+                           BS107<sup>T</sup> and T5<sup>T</sup> (<a id="xref-fig-2-3" class="xref-fig" href="#F2">Fig. 2</a>). We thus compared the respective sequences with the bacterial 16S rRNA variability map (<a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Baker <em>et al.</em>, 2003</a>) and/or the 16S rRNA secondary structure model (<a id="xref-ref-19-2" class="xref-bibr" href="#ref-19">Gutell <em>et al.</em>, 1994</a>) and showed that the 16S rRNA gene sequences provided in this study were all in accordance with bases categorized as conserved
+                           by <a id="xref-ref-1-2" class="xref-bibr" href="#ref-1">Baker <em>et al.</em> (2003)</a> or the proposed rRNA secondary structure (Tables S1 and S2), whereas the previously determined 16S rRNA gene sequences Y13244
+                           and AY177712 were flawed.
+                        </p>
+                        
+                        <p id="p-34">Furthermore, we examined whether the four differences in the 16S rRNA gene sequences of <span class="named-content species" id="named-content-97"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210 (KC176239) and <span class="named-content species" id="named-content-98"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> (KC176240) were genuine. They were localized at the base positions 614 (<span class="named-content species" id="named-content-99"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>: G; <span class="named-content species" id="named-content-100"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>: A) and 626 (<span class="named-content species" id="named-content-101"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>: C; <span class="named-content species" id="named-content-102"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>: U) within the 16S rRNA variable region V4 (<a id="xref-ref-1-3" class="xref-bibr" href="#ref-1">Baker <em>et al.</em>, 2003</a>) and at the positions 835 (<span class="named-content species" id="named-content-103"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>: G; <span class="named-content species" id="named-content-104"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>: A) and 851 (<span class="named-content species" id="named-content-105"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>: C; <span class="named-content species" id="named-content-106"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>: U) within the variable V5 region, respectively (<span class="named-content species" id="named-content-107"><a class="namesforlife" rel="namesforlife-name" title="E. coli"
+                                 href="doi:10.1601/nm.3093"><em>E. coli</em></a></span> numbering; Fig. S1; Table S3). Comparison with the secondary 16S rRNA structure model (<a id="xref-ref-19-3" class="xref-bibr" href="#ref-19">Gutell <em>et al.</em>, 1994</a>) and a simulation of the rRNA folding using the Mfold web server (<a id="xref-ref-45-1" class="xref-bibr" href="#ref-45">Zuker, 2003</a>) indicated that bases 614 and 626 paired in the variable region V4 stem–loop (<a id="xref-fig-3-1" class="xref-fig" href="#F3">Fig. 3</a>); similarly, bases 835 and 851 matched in the V5 stem–loop (Fig. S2). We thus assumed that the present transitions of G and
+                           C in <span class="named-content species" id="named-content-108"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> to A and U in <span class="named-content species" id="named-content-109"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>, respectively, reflect genuine and characteristic mutations in the 16S rRNA genes of these species. Considering these bases,
+                           the 16S rRNA gene sequence of <span class="named-content genus" id="named-content-110"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain CIP 105210 resembled the original one of BS107<sup>T</sup> (Y13244), which would indicate that strain CIP 105210 is the type strain of <span class="named-content species" id="named-content-111"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>.
+                        </p>
+                        
+                        <div id="F3" class="fig pos-float type-figure  odd">
+                           <div class="fig-inline"><a href="4340/F3.expansion.html"><img alt="Fig. 3. " src="4340/F3.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                    <li><a href="4340/F3.expansion.html">In this window</a></li>
+                                    <li><a class="in-nw" href="4340/F3.expansion.html">In a new window</a></li>
+                                 </ul>
+                                 <ul class="fig-services">
+                                    <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F3">Download as PowerPoint Slide</a></li>
+                                 </ul>
+                              </div>
+                           </div>
+                           <div class="fig-caption"><span class="fig-label">Fig. 3. </span> 
+                              
+                              <p id="p-35" class="first-child">Secondary structure of the 16S rRNA variable region V4 of <span class="named-content species" id="named-content-112"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                       href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup> (a) and <span class="named-content species" id="named-content-113"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                       href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 17395 (b) demonstrating transition of bases 614 and 626 (<span class="named-content species" id="named-content-114"><a class="namesforlife" rel="namesforlife-name" title="E. coli"
+                                       href="doi:10.1601/nm.3093"><em>E. coli</em></a></span> numbering; bases 529 and 541 according to the CIP 105210<sup>T</sup> numbering). RNA folding was simulated using the Mfold web server for nucleic acid folding and hybridization prediction (<a id="xref-ref-45-2" class="xref-bibr" href="#ref-45">Zuker, 2003</a>; <a href="http://mfold.rna.albany.edu/?q=mfold/RNA-Folding-Form">http://mfold.rna.albany.edu/?q=mfold/RNA-Folding-Form</a>).
+                              </p>
+                              
+                              <div class="sb-div caption-clear"></div>
+                           </div>
+                        </div>
+                     </div>
+                     <div id="sec-15" class="subsection">
+                        
+                        <h4>MALDI-TOF MS analysis.</h4>
+                        
+                        <p id="p-36">In the MALDI-TOF MS dendrogram (<a id="xref-fig-4-1" class="xref-fig" href="#F4">Fig. 4</a>), the <span class="named-content genus" id="named-content-115"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 16374<sup>T</sup>, DSM 24588 and DSM 17395 not only formed a cluster but were virtually indistinguishable from each other. Strain CIP 105210
+                           appeared as the sister group of those three strains, whereas <span class="named-content species" id="named-content-116"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                                 href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> and <span class="named-content species" id="named-content-117"><a class="namesforlife" rel="namesforlife-name" title="P. caeruleus"
+                                 href="doi:10.1601/nm.14301"><em>P. caeruleus</em></a></span> as well as <span class="named-content species" id="named-content-118"><a class="namesforlife" rel="namesforlife-name" title="P. arcticus"
+                                 href="doi:10.1601/nm.14057"><em>P. arcticus</em></a></span> and <span class="named-content species" id="named-content-119"><a class="namesforlife" rel="namesforlife-name" title="P. leonis"
+                                 href="doi:10.1601/nm.24496"><em>P. leonis</em></a></span> were well set apart.
+                        </p>
+                        
+                        <div id="F4" class="fig pos-float type-figure  odd">
+                           <div class="fig-inline"><a href="4340/F4.expansion.html"><img alt="Fig. 4. " src="4340/F4.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                    <li><a href="4340/F4.expansion.html">In this window</a></li>
+                                    <li><a class="in-nw" href="4340/F4.expansion.html">In a new window</a></li>
+                                 </ul>
+                                 <ul class="fig-services">
+                                    <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F4">Download as PowerPoint Slide</a></li>
+                                 </ul>
+                              </div>
+                           </div>
+                           <div class="fig-caption"><span class="fig-label">Fig. 4. </span> 
+                              
+                              <p id="p-37" class="first-child">Score-oriented dendrogram showing the similarity of MALDI-TOF mass spectra from cell extracts of selected <span class="named-content genus" id="named-content-120"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                       href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains. The dendrogram was generated by the BioTyper software (version 3.0; Bruker Daltonics).
+                              </p>
+                              
+                              <div class="sb-div caption-clear"></div>
+                           </div>
+                        </div>
+                     </div>
+                     <div id="sec-16" class="subsection">
+                        
+                        <h4>ITS analysis.</h4>
+                        
+                        <p id="p-38">A comparable picture was observed in the ITS analysis (<a id="xref-fig-5-1" class="xref-fig" href="#F5">Fig. 5</a>). <span class="named-content genus" id="named-content-121"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                 href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strain DSM 17395 appeared as sister strain of <span class="named-content species" id="named-content-122"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                 href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> with 93 % support under ML and 99 % support under MP. The sister-group relationship of these and strain DSM 24588 was supported
+                           with 70 % and 88 % bootstrap values, respectively, to the exclusion of <span class="named-content species" id="named-content-123"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                 href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210. <span class="named-content species" id="named-content-124"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter sp."
+                                 href="doi:10.1601/nm.17585"><em>Phaeobacter</em> sp.</a></span> ANG1 was placed in a distinct cluster together with the type strains of <span class="named-content species" id="named-content-125"><a class="namesforlife" rel="namesforlife-name" title="P. daeponensis"
+                                 href="doi:10.1601/nm.10944"><em>P. daeponensis</em></a></span> and <span class="named-content species" id="named-content-126"><a class="namesforlife" rel="namesforlife-name" title="P. caeruleus"
+                                 href="doi:10.1601/nm.14301"><em>P. caeruleus</em></a></span> (100 % support).
+                        </p>
+                        
+                        <div id="F5" class="fig pos-float type-figure  odd">
+                           <div class="fig-inline"><a href="4340/F5.expansion.html"><img alt="Fig. 5. " src="4340/F5.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                                    <li><a href="4340/F5.expansion.html">In this window</a></li>
+                                    <li><a class="in-nw" href="4340/F5.expansion.html">In a new window</a></li>
+                                 </ul>
+                                 <ul class="fig-services">
+                                    <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4340/F5">Download as PowerPoint Slide</a></li>
+                                 </ul>
+                              </div>
+                           </div>
+                           <div class="fig-caption"><span class="fig-label">Fig. 5. </span> 
+                              
+                              <p id="p-39" class="first-child">Midpoint-rooted ML phylogeny inferred from ITS sequences of <span class="named-content genus" id="named-content-127"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                       href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains closely related to <span class="named-content species" id="named-content-128"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                                       href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> and <span class="named-content species" id="named-content-129"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                                       href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>. Branches are scaled in terms of the expected number of substitutions per site. Numbers above branches are support values
+                                 from ML (left) and MP (right) bootstrapping. Original designation of strains that are deposited at culture collections is
+                                 indicated in parentheses; square brackets give the respective accession number.
+                              </p>
+                              
+                              <div class="sb-div caption-clear"></div>
+                           </div>
+                        </div>
+                     </div>
+                  </div>
+                  <div id="sec-17" class="subsection">
+                     
+                     <h3>DNA–DNA hybridization.</h3>
+                     
+                     <p id="p-40">In contrast to the highly similar genomic DNA between the strains DSM 17395 and DSM 16374<sup>T</sup> (82 %) as well as between the strains DSM 16374<sup>T</sup> and DSM 24588 (83 %), strain CIP 105210 shared only 62 % and 63 % DNA–DNA relatedness to the strains DSM 17395 and DSM 16374<sup>T</sup>, respectively (<a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>). This is below the threshold of 70 % recommended by <a id="xref-ref-43-1" class="xref-bibr" href="#ref-43">Wayne <em>et al.</em> (1987)</a> hence indicating the status of strain CIP 105210 in a separate species. Conversely, the values clearly above 70 % indicate
+                        that strains DSM 17395, DSM 16374<sup>T</sup> and DSM 24588 belong to the same species.
+                     </p>
+                     
+                     <div id="T1" class="table pos-float">
+                        <div class="table-inline">
+                           <div class="callout"><span>View this table:</span><ul class="callout-links">
+                                 <li><a href="4340/T1.expansion.html">In this window</a></li>
+                                 <li><a class="in-nw" href="4340/T1.expansion.html">In a new window</a></li>
+                              </ul>
+                           </div>
+                        </div>
+                        <div class="table-caption"><span class="table-label">Table 1. </span> 
+                           <span class="caption-title">Mean DNA–DNA similarity values (<em>n</em> = 2) between the <span class="named-content genus" id="named-content-130"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                                    href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210<sup>T</sup>, DSM 17395, DSM 16374<sup>T</sup> and DSM 24588</span>
+                           
+                           <div class="sb-div caption-clear"></div>
+                        </div>
+                     </div>
+                  </div>
+                  <div id="sec-18" class="subsection">
+                     
+                     <h3>Growth, hydrolysis and PM experiments</h3>
+                     
+                     <p id="p-42">The growth and hydrolysis experiments for <span class="named-content genus" id="named-content-132"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210 and DSM 17395 could only partially reproduce those conducted by <a id="xref-ref-34-5" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em> (1998)</a> (Table S4). The results for strain CIP 105210 differed from all other series of measurements by growth of this strain on
+                        <span class="sc">l</span>-arabinose and hydrolysis of Tween 80. Strain DSM 17395 showed no specific characteristics, but it – as well as CIP 105210
+                        – differed from strain BS107<sup>T</sup> (<a id="xref-ref-34-6" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em>, 1998</a>) as they grew on serine (like T5<sup>T</sup>; <a id="xref-ref-25-4" class="xref-bibr" href="#ref-25">Martens <em>et al.</em>, 2006</a>) and showed slow growth on <span class="sc">l</span>-rhamnose and 2-ketoglutarate (Table S4). The overall number of specific differences of all other strains to T5<sup>T</sup> (<a id="xref-ref-25-5" class="xref-bibr" href="#ref-25">Martens <em>et al.</em>, 2006</a>) was four (growth on citrate, glucosamine and on MB at 4 °C or 37 °C).
+                     </p>
+                     
+                     <p id="p-43">In contrast, the PM experiments, which are more sensitive than bacterial growth tests because they monitor substrate respiration
+                        (<a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Bochner <em>et al.</em>, 2001</a>), yielded significant physiological differences between all four tested <span class="named-content genus" id="named-content-133"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                              href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains, DSM 24588, DSM 16374<sup>T</sup>, DSM 17395 and CIP 105210 (Figs S3 and S4). The physiological similarity between strains CIP 105210 and DSM 17395 was high,
+                        but the differences between the two were clearly reproducible. According to the discretization approach implemented in ‘<em>opm</em>’ (<a id="xref-ref-42-2" class="xref-bibr" href="#ref-42">Vaas <em>et al.</em>, 2012</a>), respiration on tyramine (PM01-H04; blue box Fig. S3) was positive in DSM 17395 and DSM 16374, weak in DSM 24588 but negative
+                        in CIP 105210. Respiration on butyrate (PM02A-D12; Fig. S4) was positive in CIP 105210 and DSM 24588, weak in DSM 16374<sup>T</sup>, but negative in DSM 17395.
+                     </p>
+                     
+                     <p id="p-44">Regarding the common subset of growth or hydrolysis experiments on the one hand and PM experiments on the other hand, the
+                        results were identical with a few exceptions. Expectedly, no substrate was detected on which growth (or hydrolysis) was measurable
+                        but respiration was not observed, whereas on some substrates respiration was detected by PM analysis even though these substrates
+                        sustained no growth. Accordingly, a weak PM reaction on <span class="sc">l</span>-arabinose (PM01-A02) and a positive PM reaction on citrate (PM01-F02) were observed for all four tested strains. A positive
+                        PM reaction to Tween 80 (PM01-E05) was observed for strains DSM 24588 and CIP 105210, whereas strains DSM 17395 and DSM 16374<sup>T</sup> showed a weak reaction (compare red boxes in Fig. S3 with Table S4).
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section discussion" id="sec-19">
+                  <div class="section-nav"><a href="#sec-11" title="Results" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  <h2>Discussion</h2>
+                  
+                  <p id="p-45">According to the PFGE profiles of the extrachromosomal elements – which are largely supported by the complete genome sequences
+                     of the <span class="named-content genus" id="named-content-134"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains DSM 17395, DSM 24588 (<a id="xref-ref-40-5" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>), DSM 16374<sup>T</sup> (Dogs, M. and others, unpublished) and CIP 105210 (Frank, O. and others, unpublished) – DDH similarities, 16S rRNA gene sequence
+                     analysis, 16S–23S rRNA gene ITS sequence analysis, MALDI-TOF MS protein analysis, and high-throughput phenotyping using the
+                     PM technology, the <span class="named-content genus" id="named-content-135"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter"
+                           href="doi:10.1601/nm.10131"><em>Phaeobacter</em></a></span> strains CIP 105210 and DSM 17395, both supposed to be deposits of the type strain of <span class="named-content species" id="named-content-136"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup>, are biologically clearly distinct. ITS sequence and MALDI-TOF analysis additionally showed that DSM 17395 (and DSM 24588)
+                     group together with <span class="named-content species" id="named-content-137"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> DSM 16374<sup>T</sup> to the exclusion of CIP 105210. As confirmed by DDH (≥76 % similarity), DSM 16374<sup>T</sup>, DSM 17395 and DSM 24588 are conspecific, i.e. all belong to the species <span class="named-content species" id="named-content-138"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>. Analysis of 16S rRNA gene sequences was in accordance with this finding, too, because the sequences of these strains were
+                     identical (if the resequenced 16S rRNA gene sequence of DSM 16374<sup>T</sup> was considered). Our sequence analyses confirmed the finding of <a id="xref-ref-40-6" class="xref-bibr" href="#ref-40">Thole <em>et al.</em> (2012)</a> that the <span class="named-content species" id="named-content-139"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter sp."
+                           href="doi:10.1601/nm.17585"><em>Phaeobacter</em> sp.</a></span> ANG1 does not belong to the species <span class="named-content species" id="named-content-140"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>.
+                  </p>
+                  
+                  <p id="p-46">Because DSM 17395 must hence be excluded from the species <span class="named-content species" id="named-content-141"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span>, the question arises whether the alternative type strain deposit, CIP 105210, represents <span class="named-content species" id="named-content-142"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> BS107<sup>T</sup>. DDH analysis (&lt;70 % similarity) indicates that CIP 105210 is not conspecific with <span class="named-content species" id="named-content-143"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>. Analysis of growth behaviours and enzymic activities could not fully reproduce the findings of <a id="xref-ref-34-7" class="xref-bibr" href="#ref-34">Ruiz-Ponte <em>et al.</em> (1998)</a>, but given the overall low number of characters tested, the low number of known differences to the type strain of the sister
+                     species, <span class="named-content species" id="named-content-144"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span>, and the well-known difficulties in reproducing physiological tests in distinct laboratories in general, the significance
+                     of these discrepancies is unclear. Essentially, based on the newly generated CIP 105210 16S rRNA gene sequence that is identical
+                     to the one from BS107<sup>T</sup>, except for deviations that were likely to be sequencing errors, we could clearly document the type strain status of <span class="named-content species" id="named-content-145"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup>. As the strains CIP 105210<sup>T</sup> and DSM 17395 have been independently deposited at the CIP and the DSMZ, respectively, it is the most probable explanation
+                     that the latter strain has been mixed up prior to deposition.
+                  </p>
+                  
+                  <p id="p-47">Research laboratories are usually not equipped with sufficient resources to verify the biological identity of their cultures.
+                     Moreover, culture collections have to cope with the deposition of interchanged or contaminated strains and the quality of
+                     incoming material will presumably even deteriorate due to the decline of basic microbiological methodology in the era of molecular
+                     biology. Problems are expected particularly if confusion with closely related strains has occurred, as in the case of DSM
+                     17395, which apparently belongs to the sister species of the correct strain. Hence, it is advisable that researchers working
+                     on a certain strain exactly denote the source from which it was received. Providing the accession numbers of culture-collection
+                     deposits (such as ‘CIP 105210<sup>T</sup>’ or ‘DSM 17395’) should thus be preferred over just stating the original strain designator (such as ‘BS107<sup>T</sup>’) irrespective of the source from which the strain has been received. In any case, with respect to cultivatable microbes,
+                     only strains with a demonstrable history should be considered in serious research.
+                  </p>
+                  
+                  <p id="p-48">The three homologous plasmids of the completely sequenced <span class="named-content species" id="named-content-146"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> strains DSM 17395 and DSM 24588 exhibit a long-range synteny (<a id="xref-ref-40-7" class="xref-bibr" href="#ref-40">Thole <em>et al.</em>, 2012</a>), but several indels (insertions/deletions) are responsible for the deviating plasmid sizes [262 versus 238 kb (DnaA-like
+                     replicon; <a id="xref-ref-28-2" class="xref-bibr" href="#ref-28">Petersen, 2011</a>), 75(78)  versus 94 kb (RepB-I), 65(63) versus 70 kb (RepA-I); <a id="xref-fig-1-7" class="xref-fig" href="#F1">Fig. 1</a>]. Homologues of these replicons may also be present in the sister species <span class="named-content species" id="named-content-147"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup> e.g. represented by the 253, 77 and 64 kb replicons. However, the conspicuously different plasmid profiles in <span class="named-content species" id="named-content-148"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> and <span class="named-content species" id="named-content-149"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> (<a id="xref-fig-1-8" class="xref-fig" href="#F1">Fig. 1</a>) may reflect horizontal recruitment of four additional replicons in <span class="named-content species" id="named-content-150"><a class="namesforlife" rel="namesforlife-name" title="P. gallaeciensis"
+                           href="doi:10.1601/nm.9798"><em>P. gallaeciensis</em></a></span> CIP 105210<sup>T</sup>. The same explanation is supported by the presence of a type IV secretion system on the fourth 86 kb plasmid of the <span class="named-content species" id="named-content-151"><a class="namesforlife" rel="namesforlife-name" title="P. inhibens"
+                           href="doi:10.1601/nm.10132"><em>P. inhibens</em></a></span> type strain DSM 16374<sup>T</sup> (Dogs, M. and others, unpublished), which may be responsible for plasmid mobilization via conjugation (<a id="xref-ref-29-1" class="xref-bibr" href="#ref-29">Petersen <em>et al.</em>, 2013</a>). In the near future, genome sequencing and comparative genomics of more distantly related strains, such as <span class="named-content species" id="named-content-152"><a class="namesforlife" rel="namesforlife-name" title="Phaeobacter arcticus"
+                           href="doi:10.1601/nm.14057"><em>Phaeobacter arcticus</em></a></span>, will help to reveal the extent of horizontal exchange and vertical evolution within the <span class="named-content genus" id="named-content-153"><a class="namesforlife" rel="namesforlife-name" title="Roseobacter"
+                           href="doi:10.1601/nm.1134"><em>Roseobacter</em></a></span> clade.
+                  </p>
+                  
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-19" title="Discussion" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-49">This work, including a PhD stipend for N. B., was supported by the Transregional Collaborative Research Center ‘<em>Roseobacter</em>’ of the Deutsche Forschungsgemeinschaft (Transregio TRR 51) and the MICROME project, EU Framework Program 7 Collaborative
+                     Project (222886-2). We thank Victoria Michael, Bettina Sträubler and Ulrike Steiner for excellent technical assistance, Brian
+                     Tindall and Sabine Gronow for their helpful discussions, as well as the two anonymous reviewers for their constructive criticism.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.1"
+                             data-doi="10.1016/j.mimet.2003.08.009">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baker</span>,  <span class="cit-name-given-names">G. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smith</span>,  <span class="cit-name-given-names">J. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cowan</span>,  <span class="cit-name-given-names">D. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title">Review and re-analysis of domain-specific 16S primers</span>. <abbr class="cit-jnl-abbrev">J Microbiol Methods</abbr> <span class="cit-vol">55</span>, <span class="cit-fpage">541</span>–<span class="cit-lpage">555</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.mimet.2003.08.009</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14607398</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.mimet.2003.08.009&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=14607398&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Review%20and%20re-analysis%20of%20domain-specific%2016S%20primers&amp;author=G.%20C.%20Baker&amp;author=J.%20J.%20Smith&amp;author=D.%20A.%20Cowan&amp;publication_year=2003&amp;journal=J%20Microbiol%20Methods&amp;volume=55&amp;pages=541-555&amp;doi=10.1016%2Fj.mimet.2003.08.009&amp;pmid=14607398">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.2"
+                             data-doi="10.1128/JB.05818-11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berger</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Neumann</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schulz</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Tropodithietic acid production in <em>Phaeobacter gallaeciensis</em> is regulated by <em>N</em>-acyl homoserine lactone-mediated quorum sensing</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">193</span>, <span class="cit-fpage">6576</span>–<span class="cit-lpage">6585</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JB.05818-11</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21949069</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=193/23/6576"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.3"
+                             data-doi="10.1128/AEM.07657-11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berger</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brock</span>,  <span class="cit-name-given-names">N. L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Liesegang</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dogs</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Preuth</span>,  <span class="cit-name-given-names">I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dickschat</span>,  <span class="cit-name-given-names">J. S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Genetic analysis of the upper phenylacetate catabolic pathway in the production of tropodithietic acid by <em>Phaeobacter gallaeciensis</em></span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">78</span>, <span class="cit-fpage">3539</span>–<span class="cit-lpage">3551</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.07657-11</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22407685</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=78/10/3539"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.4"
+                             data-doi="10.1111/j.1574-6976.2008.00149.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bochner</span>,  <span class="cit-name-given-names">B. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Global phenotypic characterization of bacteria</span>. <abbr class="cit-jnl-abbrev">FEMS Microbiol Rev</abbr> <span class="cit-vol">33</span>, <span class="cit-fpage">191</span>–<span class="cit-lpage">205</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1574-6976.2008.00149.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19054113</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=femsre&amp;resid=33/1/191"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.5"
+                             data-doi="10.1101/gr.186501">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bochner</span>,  <span class="cit-name-given-names">B. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gadzinski</span>,  <span class="cit-name-given-names">P.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Panomitros</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2001</span><strong>).</strong> <span class="cit-article-title">Phenotype microarrays for high-throughput phenotypic testing and assay of gene function</span>. <abbr class="cit-jnl-abbrev">Genome Res</abbr> <span class="cit-vol">11</span>, <span class="cit-fpage">1246</span>–<span class="cit-lpage">1255</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1101/gr.186501</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>11435407</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=genome&amp;resid=11/7/1246"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.6"
+                             data-doi="10.1128/AEM.70.4.2560-2565.2003">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bach</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Heidorn</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Liang</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schlingloff</span>,  <span class="cit-name-given-names">A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title">Antibiotic production by a <em>Roseobacter</em> clade-affiliated species from the German Wadden Sea and its antagonistic effects on indigenous isolates</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">70</span>, <span class="cit-fpage">2560</span>–<span class="cit-lpage">2565</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.70.4.2560-2565.2003</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15066861</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=70/4/2560"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.7"
+                             data-doi="10.1128/AEM.02238-06">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bruhn</span>,  <span class="cit-name-given-names">J. B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gram</span>,  <span class="cit-name-given-names">L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Belas</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Production of antibacterial compounds and biofilm formation by <em>Roseobacter</em> species are influenced by culture conditions</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">73</span>, <span class="cit-fpage">442</span>–<span class="cit-lpage">450</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.02238-06</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17098910</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=73/2/442"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.8"
+                             data-doi="10.1016/0003-2697(77)90720-5">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cashion</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Holder-Franklin</span>,  <span class="cit-name-given-names">M. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McCully</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Franklin</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1977</span><strong>).</strong> <span class="cit-article-title">A rapid method for the base ratio determination of bacterial DNA</span>. <abbr class="cit-jnl-abbrev">Anal Biochem</abbr> <span class="cit-vol">81</span>, <span class="cit-fpage">461</span>–<span class="cit-lpage">466</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/0003-2697(77)90720-5</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>907108</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/0003-2697(77)90720-5&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=907108&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=A%20rapid%20method%20for%20the%20base%20ratio%20determination%20of%20bacterial%20DNA&amp;author=P.%20Cashion&amp;author=M.%20A.%20Holder-Franklin&amp;author=J.%20McCully&amp;author=M.%20Franklin&amp;publication_year=1977&amp;journal=Anal%20Biochem&amp;volume=81&amp;pages=461-466&amp;doi=10.1016%2F0003-2697%2877%2990720-5&amp;pmid=907108">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.9"
+                             data-doi="10.1128/JB.05139-11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Collins</span>,  <span class="cit-name-given-names">A. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nyholm</span>,  <span class="cit-name-given-names">S. V.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Draft genome of <em>Phaeobacter gallaeciensis</em> ANG1, a dominant member of the accessory nidamental gland of <em>Euprymna scolopes</em></span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">193</span>, <span class="cit-fpage">3397</span>–<span class="cit-lpage">3398</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JB.05139-11</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21551313</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=193/13/3397"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.10"
+                             data-doi="10.1111/j.1432-1033.1970.tb00830.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">De Ley</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cattoir</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reynaerts</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1970</span><strong>).</strong> <span class="cit-article-title">The quantitative measurement of DNA hybridization from renaturation rates</span>. <abbr class="cit-jnl-abbrev">Eur J Biochem</abbr> <span class="cit-vol">12</span>, <span class="cit-fpage">133</span>–<span class="cit-lpage">142</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1432-1033.1970.tb00830.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4984993</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1432-1033.1970.tb00830.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=4984993&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20quantitative%20measurement%20of%20DNA%20hybridization%20from%20renaturation%20rates&amp;author=J.%20De%20Ley&amp;author=H.%20Cattoir&amp;author=A.%20Reynaerts&amp;publication_year=1970&amp;journal=Eur%20J%20Biochem&amp;volume=12&amp;pages=133-142&amp;doi=10.1111%2Fj.1432-1033.1970.tb00830.x&amp;pmid=4984993">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.11"
+                             data-doi="10.1002/cbic.200900668">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Dickschat</span>,  <span class="cit-name-given-names">J. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zell</span>,  <span class="cit-name-given-names">C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brock</span>,  <span class="cit-name-given-names">N. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Pathways and substrate specificity of DMSP catabolism in marine bacteria of the <em>Roseobacter</em> clade</span>. <abbr class="cit-jnl-abbrev">ChemBioChem</abbr> <span class="cit-vol">11</span>, <span class="cit-fpage">417</span>–<span class="cit-lpage">425</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1002/cbic.200900668</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20043308</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1002/cbic.200900668&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20043308&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Pathways%20and%20substrate%20specificity%20of%20DMSP%20catabolism%20in%20marine%20bacteria%20of%20the%20Roseobacter%20clade&amp;author=J.%20S.%20Dickschat&amp;author=C.%20Zell&amp;author=N.%20L.%20Brock&amp;publication_year=2010&amp;journal=ChemBioChem&amp;volume=11&amp;pages=417-425&amp;doi=10.1002%2Fcbic.200900668&amp;pmid=20043308">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.12"
+                             data-doi="10.1086/282802">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Farris</span>,  <span class="cit-name-given-names">J. S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1972</span><strong>).</strong> <span class="cit-article-title">Estimating phylogenetic trees from distance matrices</span>. <abbr class="cit-jnl-abbrev">Am Nat</abbr> <span class="cit-vol">106</span>, <span class="cit-fpage">645</span>–<span class="cit-lpage">668</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1086/282802</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1086/282802&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Estimating%20phylogenetic%20trees%20from%20distance%20matrices&amp;author=J.%20S.%20Farris&amp;publication_year=1972&amp;journal=Am%20Nat&amp;volume=106&amp;pages=645-668&amp;doi=10.1086%2F282802">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.13"
+                             data-doi="10.1007/BF01734359">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Felsenstein</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1981</span><strong>).</strong> <span class="cit-article-title">Evolutionary trees from DNA sequences: a maximum likelihood approach</span>. <abbr class="cit-jnl-abbrev">J Mol Evol</abbr> <span class="cit-vol">17</span>, <span class="cit-fpage">368</span>–<span class="cit-lpage">376</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/BF01734359</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>7288891</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/BF01734359&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7288891&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Evolutionary%20trees%20from%20DNA%20sequences%3A%20a%20maximum%20likelihood%20approach&amp;author=J.%20Felsenstein&amp;publication_year=1981&amp;journal=J%20Mol%20Evol&amp;volume=17&amp;pages=368-376&amp;doi=10.1007%2FBF01734359&amp;pmid=7288891">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.14"
+                             data-doi="10.1371/journal.pone.0027387">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fernandes</span>,  <span class="cit-name-given-names">N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Case</span>,  <span class="cit-name-given-names">R. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Longford</span>,  <span class="cit-name-given-names">S. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Seyedsayamdost</span>,  <span class="cit-name-given-names">M. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Steinberg</span>,  <span class="cit-name-given-names">P. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kjelleberg</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thomas</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Genomes and virulence factors of novel bacterial pathogens causing bleaching disease in the marine red alga <em>Delisea pulchra</em></span>. <abbr class="cit-jnl-abbrev">PLoS ONE</abbr> <span class="cit-vol">6</span>, <span class="cit-fpage">e27387</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1371/journal.pone.0027387</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22162749</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1371/journal.pone.0027387&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=22162749&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genomes%20and%20virulence%20factors%20of%20novel%20bacterial%20pathogens%20causing%20bleaching%20disease%20in%20the%20marine%20red%20alga%20Delisea%20pulchra&amp;author=N.%20Fernandes&amp;author=R.%20J.%20Case&amp;author=S.%20R.%20Longford&amp;author=M.%20R.%20Seyedsayamdost&amp;author=P.%20D.%20Steinberg&amp;author=S.%20Kjelleberg&amp;author=T.%20Thomas&amp;publication_year=2011&amp;journal=PLoS%20ONE&amp;volume=6&amp;pages=e27387&amp;doi=10.1371%2Fjournal.pone.0027387&amp;pmid=22162749">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.15"
+                             data-doi="10.1093/sysbio/20.4.406">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fitch</span>,  <span class="cit-name-given-names">W. M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1971</span><strong>).</strong> <span class="cit-article-title">Towards defining the course of evolution: minimal change for a specified tree topology</span>. <abbr class="cit-jnl-abbrev">Syst Zool</abbr> <span class="cit-vol">20</span>, <span class="cit-fpage">406</span>–<span class="cit-lpage">416</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.2307/2412116</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=sysbio&amp;resid=20/4/406"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.16"
+                             data-doi="10.1099/ijs.0.046128-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gaboyer</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ciobanu</span>,  <span class="cit-name-given-names">M.-C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Duthoit</span>,  <span class="cit-name-given-names">F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Le Romancer</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alain</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title"><em>Phaeobacter leonis</em> sp. nov., an alphaproteobacterium from Mediterranean Sea sediments</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">63</span>, <span class="cit-fpage">3301</span>–<span class="cit-lpage">3306</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.046128-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23475346</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=63/Pt_9/3301"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.17"
+                             data-doi="10.1128/AEM.02339-07">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Geng</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bruhn</span>,  <span class="cit-name-given-names">J. B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nielsen</span>,  <span class="cit-name-given-names">K. F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gram</span>,  <span class="cit-name-given-names">L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Belas</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Genetic dissection of tropodithietic acid biosynthesis by marine roseobacters</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">74</span>, <span class="cit-fpage">1535</span>–<span class="cit-lpage">1545</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.02339-07</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18192410</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=74/5/1535"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.18"
+                             data-doi="10.1099/13500872-142-1-3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gürtler</span>,  <span class="cit-name-given-names">V.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stanisich</span>,  <span class="cit-name-given-names">V. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1996</span><strong>).</strong> <span class="cit-article-title">New approaches to typing and identification of bacteria using the 16S–23S rDNA spacer region</span>. <abbr class="cit-jnl-abbrev">Microbiology</abbr> <span class="cit-vol">142</span>, <span class="cit-fpage">3</span>–<span class="cit-lpage">16</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/13500872-142-1-3</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>8581168</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=mic&amp;resid=142/1/3"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-19-1" title="View reference  in text"
+                           id="ref-19">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.19">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gutell</span>,  <span class="cit-name-given-names">R. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Larsen</span>,  <span class="cit-name-given-names">N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Woese</span>,  <span class="cit-name-given-names">C. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Lessons from an evolving rRNA: 16S and 23S rRNA structures from a comparative perspective</span>. <abbr class="cit-jnl-abbrev">Microbiol Rev</abbr> <span class="cit-vol">58</span>, <span class="cit-fpage">10</span>–<span class="cit-lpage">26</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>8177168</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=mmbr&amp;resid=58/1/10"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.20"
+                             data-doi="10.1111/j.1095-8312.2007.00864.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hess</span>,  <span class="cit-name-given-names">P. N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">De Moraes Russo</span>,  <span class="cit-name-given-names">C. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">An empirical test of the midpoint rooting method</span>. <abbr class="cit-jnl-abbrev">Biol J Linn Soc Lond</abbr> <span class="cit-vol">92</span>, <span class="cit-fpage">669</span>–<span class="cit-lpage">674</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1095-8312.2007.00864.x</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1095-8312.2007.00864.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=An%20empirical%20test%20of%20the%20midpoint%20rooting%20method&amp;author=P.%20N.%20Hess&amp;author=C.%20A.%20De%20Moraes%20Russo&amp;publication_year=2007&amp;journal=Biol%20J%20Linn%20Soc%20Lond&amp;volume=92&amp;pages=669-674&amp;doi=10.1111%2Fj.1095-8312.2007.00864.x">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.21"
+                             data-doi="10.1016/S0723-2020(83)80048-4">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Huß</span>,  <span class="cit-name-given-names">V. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Festl</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schleifer</span>,  <span class="cit-name-given-names">K. H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1983</span><strong>).</strong> <span class="cit-article-title">Studies on the spectrophotometric determination of DNA hybridization from renaturation rates</span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">184</span>–<span class="cit-lpage">192</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/S0723-2020(83)80048-4</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23194591</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/S0723-2020(83)80048-4&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23194591&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Studies%20on%20the%20spectrophotometric%20determination%20of%20DNA%20hybridization%20from%20renaturation%20rates&amp;author=V.%20A.%20Hu%C3%9F&amp;author=H.%20Festl&amp;author=K.%20H.%20Schleifer&amp;publication_year=1983&amp;journal=Syst%20Appl%20Microbiol&amp;volume=4&amp;pages=184-192&amp;doi=10.1016%2FS0723-2020%2883%2980048-4&amp;pmid=23194591">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.22"
+                             data-doi="10.1093/nar/gki198">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Katoh</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuma</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Toh</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miyata</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title"><span class="sc">mafft</span> version 5: improvement in accuracy of multiple sequence alignment</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">33</span>, <span class="cit-fpage">511</span>–<span class="cit-lpage">518</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gki198</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15661851</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=33/2/511"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4340.23">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Goodfellow</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lane</span>,  <span class="cit-name-given-names">D. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1991</span><strong>).</strong> <span class="cit-article-title">16S/23S rRNA sequencing</span>. In <span class="cit-source">Nucleic Acid Techniques in Bacterial Systematics</span>, pp. <span class="cit-fpage">115</span>–<span class="cit-lpage">175</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Goodfellow</span>,  <span class="cit-name-given-names">M.</span></span>
+                                 . <span class="cit-publ-loc">Chichester</span>: <span class="cit-publ-name">Wiley</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=16S%2F23S%20rRNA%20sequencing&amp;author=D.%20J.%20Lane&amp;publication_year=1991&amp;citation_inbook_title=Nucleic%20Acid%20Techniques%20in%20Bacterial%20Systematics">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-24-1" title="View reference  in text"
+                           id="ref-24">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.24"
+                             data-doi="10.1093/nar/gkr1044">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Markowitz</span>,  <span class="cit-name-given-names">V. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chen</span>,  <span class="cit-name-given-names">I.-M. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Palaniappan</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Chu</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Szeto</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grechkin</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ratner</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jacob</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Huang</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">IMG: the Integrated Microbial Genomes database and comparative analysis system</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">40</span> (<span class="cit-supplement">Database issue</span>), <span class="cit-fpage">D115</span>–<span class="cit-lpage">D122</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkr1044</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22194640</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=40/D1/D115"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-25-1" title="View reference  in text"
+                           id="ref-25">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.25"
+                             data-doi="10.1099/ijs.0.63724-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Heidorn</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pukall</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006</span><strong>).</strong> <span class="cit-article-title">Reclassification of <em>Roseobacter gallaeciensis</em> Ruiz-Ponte <em>et al.</em> 1998 as <em>Phaeobacter gallaeciensis</em> gen. nov., comb. nov., description of <em>Phaeobacter inhibens</em> sp. nov., reclassification of <em>Ruegeria algicola</em> (Lafay <em>et al.</em> 1995) Uchino <em>et al.</em> 1999 as <em>Marinovum algicola</em> gen. nov., comb. nov., and emended descriptions of the genera <em>Roseobacter</em>, <em>Ruegeria</em> and <em>Leisingera</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">56</span>, <span class="cit-fpage">1293</span>–<span class="cit-lpage">1304</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.63724-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16738106</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=56/6/1293"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-26-1" title="View reference  in text"
+                           id="ref-26">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.26"
+                             data-doi="10.1007/s00248-006-9165-2">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Martens</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gram</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grossart</span>,  <span class="cit-name-given-names">H.-P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kessler</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Müller</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wenzel</span>,  <span class="cit-name-given-names">S. C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title">Bacteria of the <em>Roseobacter</em> clade show potential for secondary metabolite production</span>. <abbr class="cit-jnl-abbrev">Microb Ecol</abbr> <span class="cit-vol">54</span>, <span class="cit-fpage">31</span>–<span class="cit-lpage">42</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s00248-006-9165-2</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17351813</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s00248-006-9165-2&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=17351813&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Bacteria%20of%20the%20Roseobacter%20clade%20show%20potential%20for%20secondary%20metabolite%20production&amp;author=T.%20Martens&amp;author=L.%20Gram&amp;author=H.-P.%20Grossart&amp;author=D.%20Kessler&amp;author=R.%20M%C3%BCller&amp;author=M.%20Simon&amp;author=S.%20C.%20Wenzel&amp;author=T.%20Brinkhoff&amp;publication_year=2007&amp;journal=Microb%20Ecol&amp;volume=54&amp;pages=31-42&amp;doi=10.1007%2Fs00248-006-9165-2&amp;pmid=17351813">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-27-1" title="View reference  in text"
+                           id="ref-27">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.27"
+                             data-doi="10.1089/cmb.2009.0179">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pattengale</span>,  <span class="cit-name-given-names">N. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Alipour</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bininda-Emonds</span>,  <span class="cit-name-given-names">O. R. P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moret</span>,  <span class="cit-name-given-names">B. M. E.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">How many bootstrap replicates are necessary?</span> <abbr class="cit-jnl-abbrev">J Comput Biol</abbr> <span class="cit-vol">17</span>, <span class="cit-fpage">337</span>–<span class="cit-lpage">354</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1089/cmb.2009.0179</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20377449</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1089/cmb.2009.0179&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20377449&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=How%20many%20bootstrap%20replicates%20are%20necessary%3F&amp;author=N.%20D.%20Pattengale&amp;author=M.%20Alipour&amp;author=O.%20R.%20P.%20Bininda-Emonds&amp;author=B.%20M.%20E.%20Moret&amp;author=A.%20Stamatakis&amp;publication_year=2010&amp;journal=J%20Comput%20Biol&amp;volume=17&amp;pages=337-354&amp;doi=10.1089%2Fcmb.2009.0179&amp;pmid=20377449">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-28-1" title="View reference  in text"
+                           id="ref-28">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.28">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Petersen</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Phylogeny and compatibility: plasmid classification in the genomics era</span>. <abbr class="cit-jnl-abbrev">Arch Microbiol</abbr> <span class="cit-vol">193</span>, <span class="cit-fpage">313</span>–<span class="cit-lpage">321</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21374058</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=21374058&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phylogeny%20and%20compatibility%3A%20plasmid%20classification%20in%20the%20genomics%20era&amp;author=J.%20Petersen&amp;publication_year=2011&amp;journal=Arch%20Microbiol&amp;volume=193&amp;pages=313-321&amp;pmid=21374058">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-29-1" title="View reference  in text"
+                           id="ref-29">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.29"
+                             data-doi="10.1007/s00253-013-4746-8">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Petersen</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Frank</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Göker</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pradella</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title">Extrachromosomal, extraordinary and essential — the plasmids of the Roseobacter clade</span>. <abbr class="cit-jnl-abbrev">Appl Microbiol Biotechnol</abbr> <span class="cit-vol">97</span>, <span class="cit-fpage">2805</span>–<span class="cit-lpage">2815</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s00253-013-4746-8</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20039020</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s00253-013-4746-8&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20039020&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Extrachromosomal%2C%20extraordinary%20and%20essential%20%E2%80%94%20the%20plasmids%20of%20the%20Roseobacter%20clade&amp;author=J.%20Petersen&amp;author=O.%20Frank&amp;author=M.%20G%C3%B6ker&amp;author=S.%20Pradella&amp;publication_year=2013&amp;journal=Appl%20Microbiol%20Biotechnol&amp;volume=97&amp;pages=2805-2815&amp;doi=10.1007%2Fs00253-013-4746-8&amp;pmid=20039020">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-30-1" title="View reference  in text"
+                           id="ref-30">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.30"
+                             data-doi="10.1007/s00203-009-0535-2">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pradella</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Päuker</span>,  <span class="cit-name-given-names">O.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Petersen</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Genome organisation of the marine <em>Roseobacter</em> clade member <em>Marinovum algicola</em></span>. <abbr class="cit-jnl-abbrev">Arch Microbiol</abbr> <span class="cit-vol">192</span>, <span class="cit-fpage">115</span>–<span class="cit-lpage">126</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s00203-009-0535-2</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20039020</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s00203-009-0535-2&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20039020&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genome%20organisation%20of%20the%20marine%20Roseobacter%20clade%20member%20Marinovum%20algicola&amp;author=S.%20Pradella&amp;author=O.%20P%C3%A4uker&amp;author=J.%20Petersen&amp;publication_year=2010&amp;journal=Arch%20Microbiol&amp;volume=192&amp;pages=115-126&amp;doi=10.1007%2Fs00203-009-0535-2&amp;pmid=20039020">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-31-1" title="View reference  in text"
+                           id="ref-31">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.31"
+                             data-doi="10.1099/00207713-46-4-1088">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rainey</span>,  <span class="cit-name-given-names">F. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ward-Rainey</span>,  <span class="cit-name-given-names">N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kroppenstedt</span>,  <span class="cit-name-given-names">R. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stackebrandt</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1996</span><strong>).</strong> <span class="cit-article-title">The genus <em>Nocardiopsis</em> represents a phylogenetically coherent taxon and a distinct actinomycete lineage: proposal of <em>Nocardiopsaceae</em> fam. nov.</span> <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">46</span>, <span class="cit-fpage">1088</span>–<span class="cit-lpage">1092</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-46-4-1088</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>8863440</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=46/4/1088"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-32-1" title="View reference  in text"
+                           id="ref-32">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.32"
+                             data-doi="10.1128/AEM.71.4.1729-1736.2005">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rao</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Webb</span>,  <span class="cit-name-given-names">J. S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kjelleberg</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005</span><strong>).</strong> <span class="cit-article-title">Competitive interactions in mixed-species biofilms containing the marine bacterium <em>Pseudoalteromonas tunicata</em></span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">71</span>, <span class="cit-fpage">1729</span>–<span class="cit-lpage">1736</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/AEM.71.4.1729-1736.2005</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>15811995</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=71/4/1729"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-33-1" title="View reference  in text"
+                           id="ref-33">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4340.33"
+                             data-doi="10.1016/B978-012101285-4/50007-2">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Birren</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Lai</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Römling</span>,  <span class="cit-name-given-names">U.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fislage</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tümmler</span>,  <span class="cit-name-given-names">B.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1996</span><strong>).</strong> <span class="cit-article-title">Macrorestriction mapping and analysis of bacterial genomes</span>. In <span class="cit-source">Nonmammalian Genomic Analysis: A Practical Guide</span>, pp. <span class="cit-fpage">165</span>–<span class="cit-lpage">195</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Birren</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Lai</span>,  <span class="cit-name-given-names">E.</span></span>
+                                 . <span class="cit-publ-loc">San Diego, CA</span>: <span class="cit-publ-name">Academic Press</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/B978-012101285-4/50007-2</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/B978-012101285-4/50007-2&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Macrorestriction%20mapping%20an%20analysis%20of%20bacterial%20genomes&amp;author=U.%20R%C3%B6mling&amp;author=R.%20Fislage&amp;author=B.%20T%C3%BCmmler&amp;publication_year=1996&amp;citation_inbook_title=Nonmammalian%20Genomic%20Analysis%3A%20A%20Practical%20Guide">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-34-1" title="View reference  in text"
+                           id="ref-34">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.34"
+                             data-doi="10.1099/00207713-48-2-537">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ruiz-Ponte</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cilia</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lambert</span>,  <span class="cit-name-given-names">C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nicolas</span>,  <span class="cit-name-given-names">J. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1998</span><strong>).</strong> <span class="cit-article-title"><em>Roseobacter gallaeciensis</em> sp. nov., a new marine bacterium isolated from rearings and collectors of the scallop <em>Pecten maximus</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">48</span>, <span class="cit-fpage">537</span>–<span class="cit-lpage">542</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-48-2-537</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>9731295</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=48/2/537"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-35-1" title="View reference  in text"
+                           id="ref-35">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.35"
+                             data-doi="10.1021/ja207172s">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Seyedsayamdost</span>,  <span class="cit-name-given-names">M. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Carr</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kolter</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Clardy</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011a</span><strong>).</strong> <span class="cit-article-title">Roseobacticides: small molecule modulators of an algal-bacterial symbiosis</span>. <abbr class="cit-jnl-abbrev">J Am Chem Soc</abbr> <span class="cit-vol">133</span>, <span class="cit-fpage">18343</span>–<span class="cit-lpage">18349</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1021/ja207172s</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21928816</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1021/ja207172s&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=21928816&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Roseobacticides%3A%20small%20molecule%20modulators%20of%20an%20algal-bacterial%20symbiosis&amp;author=M.%20R.%20Seyedsayamdost&amp;author=G.%20Carr&amp;author=R.%20Kolter&amp;author=J.%20Clardy&amp;publication_year=2011a&amp;journal=J%20Am%20Chem%20Soc&amp;volume=133&amp;pages=18343-18349&amp;doi=10.1021%2Fja207172s&amp;pmid=21928816">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-36-1" title="View reference  in text"
+                           id="ref-36">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.36"
+                             data-doi="10.1038/nchem.1002">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Seyedsayamdost</span>,  <span class="cit-name-given-names">M. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Case</span>,  <span class="cit-name-given-names">R. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kolter</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Clardy</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011b</span><strong>).</strong> <span class="cit-article-title">The Jekyll-and-Hyde chemistry of <em>Phaeobacter gallaeciensis</em></span>. <abbr class="cit-jnl-abbrev">Nat Chem</abbr> <span class="cit-vol">3</span>, <span class="cit-fpage">331</span>–<span class="cit-lpage">335</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/nchem.1002</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21430694</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/nchem.1002&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=21430694&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=The%20Jekyll-and-Hyde%20chemistry%20of%20Phaeobacter%20gallaeciensis&amp;author=M.%20R.%20Seyedsayamdost&amp;author=R.%20J.%20Case&amp;author=R.%20Kolter&amp;author=J.%20Clardy&amp;publication_year=2011b&amp;journal=Nat%20Chem&amp;volume=3&amp;pages=331-335&amp;doi=10.1038%2Fnchem.1002&amp;pmid=21430694">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-37-1" title="View reference  in text"
+                           id="ref-37">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4340.37">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Gerhardt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">W. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smibert</span>,  <span class="cit-name-given-names">R. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1981</span><strong>).</strong> <span class="cit-article-title">Phenotypic characterization</span>. In <span class="cit-source">Manual of Methods for General Bacteriology</span>, pp. <span class="cit-fpage">607</span>–<span class="cit-lpage">654</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Gerhardt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">W. A.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span>
+                                 . <span class="cit-publ-loc">Washington, DC</span>: <span class="cit-publ-name">American Society for Microbiology</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phenotypic%20characterization&amp;author=R.%20M.%20Smibert&amp;author=N.%20R.%20Krieg&amp;publication_year=1981&amp;citation_inbook_title=Manual%20of%20Methods%20for%20General%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-38-1" title="View reference  in text"
+                           id="ref-38">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.38"
+                             data-doi="10.1080/10635150802429642">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hoover</span>,  <span class="cit-name-given-names">P.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rougemont</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">A rapid bootstrap algorithm for the RAxML Web servers</span>. <abbr class="cit-jnl-abbrev">Syst Biol</abbr> <span class="cit-vol">57</span>, <span class="cit-fpage">758</span>–<span class="cit-lpage">771</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1080/10635150802429642</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18853362</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=sysbio&amp;resid=57/5/758"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-39-1" title="View reference  in text"
+                           id="ref-39">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4340.39">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Swofford</span>,  <span class="cit-name-given-names">D. L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title"><span class="sc">paup</span>*: Phylogenetic analysis using parsimony (and other methods), version 4.0b10</span>. <span class="cit-publ-loc">Sunderland</span>: <span class="cit-publ-name">Sinauer Associates</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=paup%2A%3A%20Phylogenetic%20analysis%20using%20parsimony%20%28and%20other%20methods%29%2C%20version%204.0b10&amp;author=D.%20L.%20Swofford&amp;publication_year=2002">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-40-1" title="View reference  in text"
+                           id="ref-40">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.40"
+                             data-doi="10.1038/ismej.2012.62">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thole</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kalhoefer</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Voget</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berger</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Engelhardt</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Liesegang</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wollherr</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kjelleberg</span>,  <span class="cit-name-given-names">S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Daniel</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title"><em>Phaeobacter gallaeciensis</em> genomes from globally opposite locations reveal high similarity of adaptation to surface life</span>. <abbr class="cit-jnl-abbrev">ISME J</abbr> <span class="cit-vol">6</span>, <span class="cit-fpage">2229</span>–<span class="cit-lpage">2244</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1038/ismej.2012.62</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21716312</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1038/ismej.2012.62&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=22717884&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phaeobacter%20gallaeciensis%20genomes%20from%20globally%20opposite%20locations%20reveal%20high%20similarity%20of%20adaptation%20to%20surface%20life&amp;author=S.%20Thole&amp;author=D.%20Kalhoefer&amp;author=S.%20Voget&amp;author=M.%20Berger&amp;author=T.%20Engelhardt&amp;author=H.%20Liesegang&amp;author=A.%20Wollherr&amp;author=S.%20Kjelleberg&amp;author=R.%20Daniel&amp;publication_year=2012&amp;journal=ISME%20J&amp;volume=6&amp;pages=2229-2244&amp;doi=10.1038%2Fismej.2012.62&amp;pmid=21716312">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-41-1" title="View reference  in text"
+                           id="ref-41">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.41"
+                             data-doi="10.1099/ijs.0.65324-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tóth</span>,  <span class="cit-name-given-names">E. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schumann</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Borsodi</span>,  <span class="cit-name-given-names">A. K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kéki</span>,  <span class="cit-name-given-names">Z.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kovács</span>,  <span class="cit-name-given-names">A. L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Márialigeti</span>,  <span class="cit-name-given-names">K.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title"><em>Wohlfahrtiimonas chitiniclastica</em> gen. nov., sp. nov., a new gammaproteobacterium isolated from <em>Wohlfahrtia magnifica</em> (Diptera: Sarcophagidae)</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">58</span>, <span class="cit-fpage">976</span>–<span class="cit-lpage">981</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.65324-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18398205</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=58/4/976"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-42-1" title="View reference  in text"
+                           id="ref-42">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.42"
+                             data-doi="10.1371/journal.pone.0034846">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Vaas</span>,  <span class="cit-name-given-names">L. A. I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sikorski</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Michael</span>,  <span class="cit-name-given-names">V.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Göker</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Klenk</span>,  <span class="cit-name-given-names">H.-P.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Visualization and curve-parameter estimation strategies for efficient exploration of phenotype microarray kinetics</span>. <abbr class="cit-jnl-abbrev">PLoS ONE</abbr> <span class="cit-vol">7</span>, <span class="cit-fpage">e34846</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1371/journal.pone.0034846</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22536335</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1371/journal.pone.0034846&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=22536335&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Visualization%20and%20curve-parameter%20estimation%20strategies%20for%20efficient%20exploration%20of%20phenotype%20microarray%20kinetics&amp;author=L.%20A.%20I.%20Vaas&amp;author=J.%20Sikorski&amp;author=V.%20Michael&amp;author=M.%20G%C3%B6ker&amp;author=H.-P.%20Klenk&amp;publication_year=2012&amp;journal=PLoS%20ONE&amp;volume=7&amp;pages=e34846&amp;doi=10.1371%2Fjournal.pone.0034846&amp;pmid=22536335">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-43-1" title="View reference  in text"
+                           id="ref-43">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.43"
+                             data-doi="10.1099/00207713-37-4-463">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wayne</span>,  <span class="cit-name-given-names">L. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Colwell</span>,  <span class="cit-name-given-names">R. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Grimont</span>,  <span class="cit-name-given-names">P. A. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kandler</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krichevsky</span>,  <span class="cit-name-given-names">M. I.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">L. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">W. E. C.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">1987</span><strong>).</strong> <span class="cit-article-title">Report of the ad hoc committee on reconciliation of approaches to bacterial systematics</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">37</span>, <span class="cit-fpage">463</span>–<span class="cit-lpage">464</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-37-4-463</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=37/4/463"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-44-1" title="View reference  in text"
+                           id="ref-44">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.44"
+                             data-doi="10.1002/pmic.200900120">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zech</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thole</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schreiber</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kalhöfer</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Voget</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brinkhoff</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Simon</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Schomburg</span>,  <span class="cit-name-given-names">D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rabus</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title">Growth phase-dependent global protein and metabolite profiles of <em>Phaeobacter gallaeciensis</em> strain DSM 17395, a member of the marine <em>Roseobacter</em>-clade</span>. <abbr class="cit-jnl-abbrev">Proteomics</abbr> <span class="cit-vol">9</span>, <span class="cit-fpage">3677</span>–<span class="cit-lpage">3697</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1002/pmic.200900120</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19639587</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1002/pmic.200900120&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=19639587&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Growth%20phase-dependent%20global%20protein%20and%20metabolite%20profiles%20of%20Phaeobacter%20gallaeciensis%20strain%20DSM%2017395%2C%20a%20member%20of%20the%20marine%20Roseobacter-clade&amp;author=H.%20Zech&amp;author=S.%20Thole&amp;author=K.%20Schreiber&amp;author=D.%20Kalh%C3%B6fer&amp;author=S.%20Voget&amp;author=T.%20Brinkhoff&amp;author=M.%20Simon&amp;author=D.%20Schomburg&amp;author=R.%20Rabus&amp;publication_year=2009&amp;journal=Proteomics&amp;volume=9&amp;pages=3677-3697&amp;doi=10.1002%2Fpmic.200900120&amp;pmid=19639587">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-45-1" title="View reference  in text"
+                           id="ref-45">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4340.45"
+                             data-doi="10.1093/nar/gkg595">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Zuker</span>,  <span class="cit-name-given-names">M.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2003</span><strong>).</strong> <span class="cit-article-title">Mfold web server for nucleic acid folding and hybridization prediction</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">31</span>, <span class="cit-fpage">3406</span>–<span class="cit-lpage">3415</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkg595</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>12824337</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=31/13/3406"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4330.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4350.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="free-article">
+               <span class="free-article-note">
+                  FREE ARTICLE
+                  </span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.053900-0" class="slug-doi">10.1099/ijs.0.053900-0
+                                 </span>
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4340-4349
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/63/Pt_11/4340.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4340.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_11/4340/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_11/4340">PPT Slides of All Figures</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings last-child">
+                              <li><a class="tocsection-search"
+                                    href="/search?tocsectionid=Taxonomic+Note&amp;sortspec=date&amp;submit=Submit">Taxonomic Note</a></li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4340&amp;current-view-path=/content/63/Pt_11/4340.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4340&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4340.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4340&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4340.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.053900-0&amp;citation=Buddruhs%20et%20al.%2063%20%28Pt%2011%29:%204340&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4340&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=24187021&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4340">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4340.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4340#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4340" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4340&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4340.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ABuddruhs%20author%3AN.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Buddruhs, N.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ABrinkhoff%20author%3AT.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Brinkhoff, T.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4340.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=24187021&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Buddruhs%20N&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Buddruhs, N.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Brinkhoff%20T&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Brinkhoff, T.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/24187021"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4340.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4340#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4340&amp;title=Molecular%20and%20phenotypic%20analyses%20reveal%20the%20non-identity%20of%20the%20Phaeobacter%20gallaeciensis%20type%20strain%20deposits%20CIP%20105210T%20and%20DSM%2017395+--+Buddruhs%20et%20al.%2063%20%28Pt%2011%29%3A%204340+--+IJSEM&amp;doi=10.1099/ijs.0.053900-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#sec-1">Introduction</a></li>
+                        <li><a href="#sec-2">Methods</a></li>
+                        <li><a href="#sec-11">Results</a></li>
+                        <li><a href="#sec-19">Discussion</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.pdf
new file mode 100644
index 00000000..38beffcf
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/ijs053900.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/ijs053900.pdf
new file mode 100644
index 00000000..168137f4
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4340.full/ijs053900.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F10.large.jpg b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F10.large.jpg
new file mode 100644
index 00000000..c469df1b
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/F10.large.jpg differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.html b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.html
new file mode 100644
index 00000000..9579dec3
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.html
@@ -0,0 +1,1307 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Designation of type strains for seven species of the order Myxococcales and proposal for neotype strains of Cystobacter ferrugineus,
+         Cystobacter minus and Polyangium fumosum 
+      </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_11/4354" />
+      <meta content="/ijs/63/Pt_11/4354.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Designation of type strains for seven species of the order Myxococcales and proposal for neotype strains of Cystobacter ferrugineus, Cystobacter minus and Polyangium fumosum"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.056440-0" name="DC.Identifier" />
+      <meta content="2013-11-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Elke Lang" name="DC.Contributor" />
+      <meta content="Hans Reichenbach" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Elke Lang" />
+      <meta name="citation_author_institution"
+            content="1Leibniz-Institut DSMZ – Deutsche Sammlung von Mikroorganismen und Zellkulturen GmbH, Inhoffenstrasse 7B, 38124 Braunschweig, Germany" />
+      <meta name="citation_author" content="Hans Reichenbach" />
+      <meta name="citation_author_institution"
+            content="2Helmholtz-Zentrum für Infektionsforschung, Inhoffenstrasse 7, 38124 Braunschweig, Germany" />
+      <meta content="Designation of type strains for seven species of the order Myxococcales and proposal for neotype strains of Cystobacter ferrugineus, Cystobacter minus and Polyangium fumosum"
+            name="citation_title" />
+      <meta content="11/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 11" name="citation_issue" />
+      <meta content="4354" name="citation_firstpage" />
+      <meta content="4360" name="citation_lastpage" />
+      <meta content="63/Pt_11/4354" name="citation_id" />
+      <meta content="63/Pt 11/4354" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_11/4354" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.056440-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4354.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4354.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4354.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_11.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_11/4354"
+            name="citation_public_url" />
+      <meta content="24187023" name="citation_pmid" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Taxonomic Note" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_11/4350.short" rel="prev" />
+      <link href="/content/63/Pt_11/4361.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d7221065e1">var callbackToken='563599B2663934A';</script><script type="text/javascript" id="session-d7221065e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search-go" id="header-qs-search-go-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_11%2F4354.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline">Designation of type strains for seven species of the order <em>Myxococcales</em> and proposal for neotype strains of <em>Cystobacter ferrugineus</em>, <em>Cystobacter minus</em> and <em>Polyangium fumosum</em></h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Elke+Lang&amp;sortspec=date&amp;submit=Submit">Elke Lang</a></span><a id="xref-aff-1-1" class="xref-aff" href="#aff-1"><sup>1</sup></a> and 
+                     </li>
+                     <li class="last" id="contrib-2"><span class="name"><a class="name-search"
+                              href="/search?author1=Hans+Reichenbach&amp;sortspec=date&amp;submit=Submit">Hans Reichenbach</a></span><a id="xref-aff-2-1" class="xref-aff" href="#aff-2"><sup>2</sup></a><span class="xref-sep">,</span><a id="xref-fn-1-1" class="xref-fn" href="#fn-1">†</a></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address><sup>1</sup>Leibniz-Institut DSMZ – Deutsche Sammlung von Mikroorganismen und Zellkulturen GmbH, Inhoffenstrasse 7B, 38124 Braunschweig,
+                           Germany
+                        </address>
+                     </li>
+                     <li class="aff"><a id="aff-2" name="aff-2"></a><address><sup>2</sup>Helmholtz-Zentrum für Infektionsforschung, Inhoffenstrasse 7, 38124 Braunschweig, Germany
+                        </address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Corresponding</strong><br />Elke Lang <span class="em-link"><span class="em-addr">ela{at}dsmz.de</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-3">Ten species of the order <span class="named-content order" id="named-content-1"><a class="namesforlife" rel="namesforlife-name" title="Myxococcales"
+                           href="doi:10.1601/nm.3690"><em>Myxococcales</em></a></span> with validly published names are devoid of living type strains. Four species of the genus <span class="named-content genus" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces"
+                           href="doi:10.1601/nm.3749"><em>Chondromyces</em></a></span> are represented by dead herbarium samples as the type material. For a species of the genus <span class="named-content genus" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Melittangium"
+                           href="doi:10.1601/nm.3710"><em>Melittangium</em></a></span> and two species of the genus <span class="named-content genus" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="Polyangium"
+                           href="doi:10.1601/nm.3736"><em>Polyangium</em></a></span>, no physical type material was assigned at the time of validation of the names or later on. In accordance with rule 18f of
+                     the International Code of Nomenclature of Bacteria the following type strains are designated for these species: strain Cm
+                     a14<sup>T</sup> ( = DSM 14605<sup>T</sup> = JCM 12615<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces apiculatus"
+                           href="doi:10.1601/nm.3751"><em>Chondromyces apiculatus</em></a></span>, strain Cm c5<sup>T</sup> ( = DSM 14714<sup>T</sup> = JCM 12616<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces crocatus"
+                           href="doi:10.1601/nm.3750"><em>Chondromyces crocatus</em></a></span>, strain Sy t2<sup>T</sup> ( = DSM 14631<sup>T</sup> = JCM 12617<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                           href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span>, strain Cm p51<sup>T</sup> ( = DSM 14607<sup>T</sup> = JCM 12618<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                           href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span>, strain Me b8<sup>T</sup> ( = DSM 14713<sup>T</sup> = JCM 12633<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Melittangium boletus"
+                           href="doi:10.1601/nm.3711"><em>Melittangium boletus</em></a></span>, strain Pl s12<sup>T</sup> ( = DSM 14670<sup>T</sup> = JCM 12637<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Polyangium sorediatum"
+                           href="doi:10.1601/nm.3745"><em>Polyangium sorediatum</em></a></span> and strain Pl sm5<sup>T</sup> ( = DSM 14734<sup>T</sup> = JCM 12638<sup>T</sup>) as the type strain of <span class="named-content species" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Polyangium spumosum"
+                           href="doi:10.1601/nm.3746"><em>Polyangium spumosum</em></a></span>. Furthermore, the type strains given for three species of the genera <span class="named-content genus" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter"
+                           href="doi:10.1601/nm.3693"><em>Cystobacter</em></a></span> and <span class="named-content genus" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Polyangium"
+                           href="doi:10.1601/nm.3736"><em>Polyangium</em></a></span> had been kept at one university institute and have been lost according to our investigations. In accordance with Rule 18c
+                     of the Bacteriological Code, we propose the following neotype strains: strain Cb fe18 ( = DSM 14716  = JCM 12624) as the neotype
+                     strain of <span class="named-content species" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                           href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span>, strain Cb m2 ( = DSM 14751 = JCM 12627) as the neotype strain of <span class="named-content species" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                           href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span> and strain Pl fu5 ( = DSM 14668 = JCM 12636) as the neotype strain of <span class="named-content species" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Polyangium fumosum"
+                           href="doi:10.1601/nm.3740"><em>Polyangium fumosum</em></a></span>. The proposals of the strains are based on the descriptions and strain proposals given in the respective chapters of <em>Bergey’s Manual of Systematic Bacteriology</em> (2005).
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn" id="fn-1">
+                        <p id="p-1"><a class="rev-xref" href="#xref-fn-1-1">↵</a><span class="fn-label">†</span> Retired.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-2">
+                        <p id="p-2">Two supplementary tables are available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <p id="p-4">An exceptionally high number of myxobacterial species descriptions is not supported by the availability of formally acknowledged
+                  living type strain material. Because of this lack of material, the species could not be included, for example, in species-representing
+                  16S rRNA gene sequence databases. These are the most frequently used guides in taxonomy currently, and for that reason, great
+                  efforts are taken to fill the sequencing gaps (<a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Yarza <em>et al.</em>, 2013</a>). The International Code of Nomenclature of Bacteria (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Lapage <em>et al.</em>, 1992</a>) allows for the designation of type strains in cases where descriptions or dead specimens represent the type given for species
+                  with validly published species names. The code also allows for the proposal of neotype strains if a specimen of the strain
+                  on which the original description was based cannot be found. These measures have been installed in order to clear the way
+                  for inclusion of such species in future examinations, in particular in studies including ‘new’ methods which had not been
+                  applied at the time of the species description. In this communication, we formally designate type strains for seven and formally
+                  propose neotype strains for three species of the order <span class="named-content order" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Myxococcales"
+                        href="doi:10.1601/nm.3690"><em>Myxococcales</em></a></span>.
+               </p>
+               <p id="p-5">The present wording of Rule 18f of the International Code is: ‘If a description or illustration constitutes, or a dead preserved
+                  specimen has been designated as the type of a species [Rule 18a(1)] and a later strain of this species is cultivated, then
+                  the type strain may be designated by the person who isolated the strain or by a subsequent author. This type strain shall
+                  then replace the description, illustration or preserved specimen as the nomenclatural type. The designation of a type strain
+                  in this manner must be published in the IJSB/IJSEM, the authorship and date of priority of publication being determined by
+                  the effective and valid publication of the name by the original authors (Rule 24b)’.
+               </p>
+               <p id="p-6">The presently designated type strains of the species <span class="named-content species" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces apiculatus"
+                        href="doi:10.1601/nm.3751"><em>Chondromyces apiculatus</em></a></span> (<a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Thaxter, 1897</a>), <span class="named-content species" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces crocatus"
+                        href="doi:10.1601/nm.3750"><em>Chondromyces crocatus</em></a></span> (Berkeley &amp; Curtis, 1874), <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                        href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span> (<a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Kofler, 1913</a>) and <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                        href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span> (<a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Thaxter, 1904</a>) are dead herbarium specimens in the Thaxter collection (TC), housed in the Farlow Herbarium, Harvard University, Cambridge,
+                  USA (<a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a>). Howard McCurdy studied myxobacteria at the University of Windsor, Ontario, Canada during the period around 1960–1970. He
+                  assigned specific samples of the Thaxter collection as the types of these species (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">McCurdy, 1971</a>). The species names were included in the Approved Lists (Skerman <em>et al.</em>, 1980). According to a curator of the herbarium, the specimen for <span class="named-content species" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                        href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span> seems to be lost whereas the other three specimens are still there, dried on the original substrates, accompanied by some
+                  slides.
+               </p>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4354/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Myxobacterial species for which a cultivable type strain or neotype strain is formally proposed and the 16S rRNA sequences
+                        of the proposed neotype strains. AL, type strain as given in Approved Lists (Skerman <em>et al.</em>, 1980). VL, types as given in Validation List No 31 (<a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Brockman, 1989b</a>, <a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">c</a>)</span>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-7">For the species <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="Melittangium boletus"
+                        href="doi:10.1601/nm.3711"><em>Melittangium boletus</em></a></span> (<a id="xref-ref-7-2" class="xref-bibr" href="#ref-7">Jahn, 1924</a>), <span class="named-content species" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="Polyangium sorediatum"
+                        href="doi:10.1601/nm.3745"><em>Polyangium sorediatum</em></a></span> (<a id="xref-ref-3-3" class="xref-bibr" href="#ref-3">Brockman, 1989a</a>) and <span class="named-content species" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="Polyangium spumosum"
+                        href="doi:10.1601/nm.3746"><em>Polyangium spumosum</em></a></span> (<a id="xref-ref-3-4" class="xref-bibr" href="#ref-3">Brockman, 1989a</a>) no physical type strains were assigned in the Approved Lists (<a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Skerman <em>et al.</em>, 1980</a>) or in Validation List No. 31 (<a id="xref-ref-4-2" class="xref-bibr" href="#ref-4">Brockman, 1989b</a>,<a id="xref-ref-5-2" class="xref-bibr" href="#ref-5">c</a>), respectively. Instead, the descriptions of <a id="xref-ref-3-5" class="xref-bibr" href="#ref-3">Brockman (1989a)</a> or simply the statement ‘not cultivated’ are given.
+               </p>
+               <p id="p-8">Bergey’s Manual of Systematic Bacteriology, second edition, includes comprehensive chapters about the members of the order
+                  <span class="named-content order" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="Myxococcales"
+                        href="doi:10.1601/nm.3690"><em>Myxococcales</em></a></span>. <a id="xref-ref-15-5" class="xref-bibr" href="#ref-15">Reichenbach (2005a</a>, <a id="xref-ref-16-5" class="xref-bibr" href="#ref-16">b</a>, <a id="xref-ref-17-2" class="xref-bibr" href="#ref-17">c</a>, d, e) are the chapters relevant to the taxa mentioned in this paper. These chapters are based on the experience and knowledge
+                  accumulated during 40 years of intense investigations on myxobacteria and were written after more than 3000 myxobacterial
+                  strains had been isolated. Based on the original species descriptions, appropriate strains were selected and described as
+                  the type strains of the respective species (<a id="xref-table-wrap-1-2" class="xref-table" href="#T1">Table 1</a>). However, it has not been formally proposed in the IJSEM until now to accept these strains as the type strains.
+               </p>
+               <p id="p-9">Because dead preserved material presently constitutes, or a description has been designated as, the type strain
+                  of the mentioned species, or no type strain has been assigned, it is formally proposed that the strains selected by Reichenbach
+                  shall be designated the type strains of the respective species according to Rule 18f. The proposed type strains listed in
+                  <a id="xref-table-wrap-1-3" class="xref-table" href="#T1">Table 1</a> shall replace the dead specimen or descriptions. These are <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces apiculatus"
+                        href="doi:10.1601/nm.3751"><em>Chondromyces apiculatus</em></a></span> Cm a14<sup>T</sup>, <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces crocatus"
+                        href="doi:10.1601/nm.3750"><em>Chondromyces crocatus</em></a></span> Cm c5<sup>T</sup>, <span class="named-content species" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                        href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span> Sy t2<sup>T</sup>, <span class="named-content species" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                        href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span> Cm p51<sup>T</sup>, <span class="named-content species" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="M. boletus"
+                        href="doi:10.1601/nm.3711"><em>M. boletus</em></a></span> Me b8<sup>T</sup>, <span class="named-content species" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="P. sorediatum"
+                        href="doi:10.1601/nm.3745"><em>P. sorediatum</em></a></span> Pl s12<sup>T</sup> and <span class="named-content species" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="P. spumosum"
+                        href="doi:10.1601/nm.3746"><em>P. spumosum</em></a></span> Pl sm5<sup>T</sup>. The prerequisite for the acceptance of type strains, their deposit and availability in two culture collections is achieved.
+                  The designation of the type strains is based on the descriptions given in the respective chapters of Bergey’s Manual (<a id="xref-ref-15-6" class="xref-bibr" href="#ref-15">Reichenbach 2005a</a>, <a id="xref-ref-17-3" class="xref-bibr" href="#ref-17">c</a>, <a id="xref-ref-18-5" class="xref-bibr" href="#ref-18">d</a>). In order to facilitate the comparison of these recent descriptions with those of the authors who originally proposed, revived
+                  or emended the species, these original descriptions are assembled in Table S1 available in IJSEM Online. The fatty acid compositions
+                  of the proposed type strains are given in Table S2 (<a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Garcia <em>et al.</em>, 2011</a>). The figures from the original descriptions and of the proposed type strains are shown face to face with figures showing
+                  the proposed type strains in <a id="xref-fig-1-1" class="xref-fig" href="#F1">Figs 1</a>–<a id="xref-fig-2-1" class="xref-fig" href="#F2">10</a>.
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F1.expansion.html"><img alt="Fig. 1. " src="4354/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-10" class="first-child"><span class="named-content species" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces apiculatus"
+                              href="doi:10.1601/nm.3751"><em>Chondromyces apiculatus</em></a></span>. (a) Drawing from <a id="xref-ref-21-3" class="xref-bibr" href="#ref-21">Thaxter (1897)</a>, plate XXX on pages 405–406. (b) Fruiting body (bar, 100 µm) and vegetative cells (insert; bar, 10 µm) of Cm a14<sup>T</sup>.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F2" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F2.expansion.html"><img alt="Fig. 10. " src="4354/F2.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F2.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F2.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F2">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 10. </span> 
+                     
+                     <p id="p-11" class="first-child"><span class="named-content species" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="Polyangium fumosum"
+                              href="doi:10.1601/nm.3740"><em>Polyangium fumosum</em></a></span>. (a) Drawing from <a id="xref-ref-11-3" class="xref-bibr" href="#ref-11">Krzemieniewska &amp; Krzemieniewski (1930)</a>, plate XVI, nos 6–9 depict <span class="named-content species" id="named-content-49"><a class="namesforlife" rel="namesforlife-name" title="P. fumosum"
+                              href="doi:10.1601/nm.3740"><em>P. fumosum</em></a></span>. Courtesy of the Polish Botanical Society. (b) Swarm of Pl fu5 (bar, 2000 µm) and single sporangium of Pl fu5 (insert; bar,
+                        100 µm). (c) Fruiting bodies of Pl fu5. Bar, 300 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-12">The Bacteriological Code also allows for the proposal of neotype strains according to Rule 18c: ‘If a strain on which the
+                  original description was based cannot be found, a neotype strain may be proposed. A neotype strain must be proposed (proposed
+                  neotype) in the IJSB, together with citation of the author(s) of the name, a description or reference to an effectively published
+                  description and a record of the permanently established culture collection(s) where the strain is deposited (see also Note
+                  1 to Rule 24a)’.
+               </p>
+               <p id="p-13">The species <span class="named-content species" id="named-content-50"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                        href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span>, <span class="named-content species" id="named-content-51"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                        href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span> and <span class="named-content species" id="named-content-52"><a class="namesforlife" rel="namesforlife-name" title="Polyangium fumosum"
+                        href="doi:10.1601/nm.3740"><em>Polyangium fumosum</em></a></span> were first described by <a id="xref-ref-9-3" class="xref-bibr" href="#ref-9">Krzemieniewska &amp; Krzemieniewski (1926</a>, <a id="xref-ref-10-4" class="xref-bibr" href="#ref-10">1927</a>, <a id="xref-ref-11-4" class="xref-bibr" href="#ref-11">1930)</a>. McCurdy assigned three of his isolates as the type strains for the above-mentioned three species (<a id="xref-ref-13-5" class="xref-bibr" href="#ref-13">McCurdy, 1970</a>; <a id="xref-table-wrap-1-4" class="xref-table" href="#T1">Table 1</a>). The species names and type strains were included in the Approved Lists (<a id="xref-ref-20-2" class="xref-bibr" href="#ref-20">Skerman <em>et al.</em>, 1980</a>) but they have never been deposited in a culture collection to the best of our knowledge. In 2007, we wrote a letter to the
+                  head of the microbiology laboratory of the University of Windsor with the request for subcultures of the strains <span class="named-content species" id="named-content-53"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                        href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span> M-203<sup>T</sup>, <span class="named-content species" id="named-content-54"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                        href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span> M-307<sup>T</sup> and <span class="named-content species" id="named-content-55"><a class="namesforlife" rel="namesforlife-name" title="P. fumosum"
+                        href="doi:10.1601/nm.3740"><em>P. fumosum</em></a></span> M257<sup>T</sup>. Even though the importance for microbial taxonomy was stressed there was no response. In 2012, another attempt to contact
+                  the department at Windsor University was more successful in the respect that we received answers from two colleagues at Windsor
+                  and from H. D. McCurdy who retired several years ago. However, they informed us that they cannot find the samples. Since 1981,
+                  there have been no scientific papers originating from the University of Windsor dealing with myxobacteria (PubMed), a fact
+                  additionally suggesting that nobody at the university had a research interest to keep the cultures alive or, at least, under
+                  surveillance. For these reasons we conclude that these cultures must have been lost.
+               </p>
+               <p id="p-14">Since the presently assigned type strains of the mentioned species are no longer available as living cultures it is formally
+                  proposed that the strains selected by Reichenbach shall be proposed as the neotype strains of the respective species in accordance
+                  with Rule 18c, as given in <a id="xref-table-wrap-1-5" class="xref-table" href="#T1">Table 1</a>. The deposit and availability of the neotype strains from two culture collections is achieved. The proposals of the neotype
+                  strains are based on the suggestions in <a id="xref-ref-16-6" class="xref-bibr" href="#ref-16">Reichenbach (2005b</a>, <a id="xref-ref-18-6" class="xref-bibr" href="#ref-18">d</a>). In these chapters, the strains <span class="named-content species" id="named-content-56"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                        href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span> Cb fe18, <span class="named-content species" id="named-content-57"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                        href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span> Cb m2 and <span class="named-content species" id="named-content-58"><a class="namesforlife" rel="namesforlife-name" title="P. fumosum"
+                        href="doi:10.1601/nm.3740"><em>P. fumosum</em></a></span> Pl fu5 were proposed as the type strains according to the species descriptions given in the respective chapters which rely
+                  on the original species descriptions by Krzemieniewska and Krzemieniewski and McCurdy (<a id="xref-ref-16-7" class="xref-bibr" href="#ref-16">Reichenbach 2005b</a>, <a id="xref-ref-18-7" class="xref-bibr" href="#ref-18">d</a>). However, since type strains have already been assigned these strains have to be proposed as the neotype strains of the
+                  respective species according to Rule 18c.
+               </p>
+               <div id="F3" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F3.expansion.html"><img alt="Fig. 2. " src="4354/F3.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F3.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F3.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F3">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 2. </span> 
+                     
+                     <p id="p-15" class="first-child"><span class="named-content species" id="named-content-59"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces crocatus"
+                              href="doi:10.1601/nm.3750"><em>Chondromyces crocatus</em></a></span>. (a) Drawing from <a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Berkeley (1857)</a>, page 313. (b) Fruiting bodies of Cm c5<sup>T</sup>. Bar, 500 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F4" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F4.expansion.html"><img alt="Fig. 3. " src="4354/F4.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F4.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F4.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F4">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 3. </span> 
+                     
+                     <p id="p-16" class="first-child"><span class="named-content species" id="named-content-60"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                              href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span>. (a) Figures from <a id="xref-ref-8-3" class="xref-bibr" href="#ref-8">Kofler (1913)</a>, <a id="xref-fig-1-2" class="xref-fig" href="#F1">Figs 1</a>–<a id="xref-fig-4-1" class="xref-fig" href="#F4">3</a> on page 877 depict <span class="named-content species" id="named-content-61"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces lanuginosus"
+                              href="doi:10.1601/nm.3753"><em>Chondromyces lanuginosus</em></a></span>. Courtesy Österreichische Akademie der Wissenschaften. (b) Fruiting body of Sy t2<sup>T</sup>. Bar, 100 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F5" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F5.expansion.html"><img alt="Fig. 4. " src="4354/F5.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F5.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F5.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F5">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 4. </span> 
+                     
+                     <p id="p-17" class="first-child"><span class="named-content species" id="named-content-62"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                              href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span>. (a) Drawing from <a id="xref-ref-22-4" class="xref-bibr" href="#ref-22">Thaxter (1904)</a>, plate XXVI on page 411; nos 7–13 depict <span class="named-content species" id="named-content-63"><a class="namesforlife" rel="namesforlife-name" title="Chondromyces pediculatus"
+                              href="doi:10.1601/nm.3754"><em>Chondromyces pediculatus</em></a></span>. (b) Fruiting body of Cm p51<sup>T</sup>. Bar, 100 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F6" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F6.expansion.html"><img alt="Fig. 5. " src="4354/F6.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F6.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F6.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F6">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 5. </span> 
+                     
+                     <p id="p-18" class="first-child"><span class="named-content species" id="named-content-64"><a class="namesforlife" rel="namesforlife-name" title="Melittangium boletus"
+                              href="doi:10.1601/nm.3711"><em>Melittangium boletus</em></a></span>. (a) Drawing from <a id="xref-ref-7-3" class="xref-bibr" href="#ref-7">Jahn (1924)</a>, plate II, Fig. 17 on page 78. Courtesy Bornträger-Cramer, www.borntraeger-cramer.de. (b) and (c) Fruiting bodies of Me b8<sup>T</sup>. Bars, 120 and 80 µm, respectively.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F7" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F7.expansion.html"><img alt="Fig. 6. " src="4354/F7.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F7.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F7.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F7">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 6. </span> 
+                     
+                     <p id="p-19" class="first-child"><span class="named-content species" id="named-content-65"><a class="namesforlife" rel="namesforlife-name" title="Polyangium sorediatum"
+                              href="doi:10.1601/nm.3745"><em>Polyangium sorediatum</em></a></span>. (a) Drawing from <a id="xref-ref-22-5" class="xref-bibr" href="#ref-22">Thaxter (1904)</a>, plate XXVII. Nos 22–30 depict <span class="named-content species" id="named-content-66"><a class="namesforlife" rel="namesforlife-name" title="P. sorediatum"
+                              href="doi:10.1601/nm.3745"><em>P. sorediatum</em></a></span>. (b and c) Fruiting bodies of Pl s12<sup>T</sup>. Inset: crushed sporangium releasing the single sporangioles. Bars, 200 µm.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F8" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F8.expansion.html"><img alt="Fig. 7. " src="4354/F8.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F8.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F8.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F8">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 7. </span> 
+                     
+                     <p id="p-20" class="first-child"><span class="named-content species" id="named-content-67"><a class="namesforlife" rel="namesforlife-name" title="Polyangium spumosum"
+                              href="doi:10.1601/nm.3746"><em>Polyangium spumosum</em></a></span>. (a) Figures from <a id="xref-ref-10-5" class="xref-bibr" href="#ref-10">Krzemieniewska &amp; Krzemieniewski (1926)</a>, plate V; no. 19 depicts <span class="named-content species" id="named-content-68"><a class="namesforlife" rel="namesforlife-name" title="P. spumosum"
+                              href="doi:10.1601/nm.3746"><em>P. spumosum</em></a></span> and from <a id="xref-ref-11-5" class="xref-bibr" href="#ref-11">Krzemieniewska &amp; Krzemieniewski (1930)</a>, plate XVI; nos 10–12 depict <span class="named-content species" id="named-content-69"><a class="namesforlife" rel="namesforlife-name" title="P. spumosum"
+                              href="doi:10.1601/nm.3746"><em>P. spumosum</em></a></span>. Courtesy of the Polish Botanical Society. (b–d) Degenerated fruiting bodies of Pl sm5<sup>T</sup>. Bars, 500, 100 and 250 µm, respectively.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F9" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F9.expansion.html"><img alt="Fig. 8. " src="4354/F9.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F9.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F9.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F9">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 8. </span> 
+                     
+                     <p id="p-21" class="first-child"><span class="named-content species" id="named-content-70"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter ferrugineus"
+                              href="doi:10.1601/nm.3698"><em>Cystobacter ferrugineus</em></a></span>. (a) Figures from <a id="xref-ref-13-6" class="xref-bibr" href="#ref-13">McCurdy (1970)</a>. (b–d) Strain Cb fe18, (b) myxospores and (c) fruiting bodies on <em>Escherichia coli</em> as food bacteria and (d) on a cellulose plate. Bars, 10 µm, 1 mm and 10 mm, respectively.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div id="F10" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4354/F10.expansion.html"><img alt="Fig. 9. " src="4354/F10.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4354/F10.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4354/F10.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_11/4354/F10">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 9. </span> 
+                     
+                     <p id="p-22" class="first-child"><span class="named-content species" id="named-content-71"><a class="namesforlife" rel="namesforlife-name" title="Cystobacter minus"
+                              href="doi:10.1601/nm.10682"><em>Cystobacter minus</em></a></span>. (a) Figures from <a id="xref-ref-13-7" class="xref-bibr" href="#ref-13">McCurdy (1970)</a>. (b and c) Fruiting bodies of Cb m2. Bars, 500 µm and 200 µm, respectively.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-23">We are thankful to K. Poling and I. Churchill at Windsor University, G. Lewis-Gentry at the Harvard University Herbaria and
+                     H. D. McCurdy for taking the effort to investigate the disposition of the type materials.
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.1">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berkeley</span>,  <span class="cit-name-given-names">M. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1857</span><strong>).</strong> <span class="cit-source">Introduction to Cryptogamic Botany</span>. <span class="cit-publ-loc">London</span>: <span class="cit-publ-name">H. Bailliere</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Introduction%20to%20Cryptogamic%20Botany&amp;author=M.%20J.%20Berkeley&amp;publication_year=1857">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-journal no-rev-xref" id="cit-63.Pt_11.4354.2"
+                             data-doi="10.1099/00207713-39-4-495">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Berkeley</span>,  <span class="cit-name-given-names">M. J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Curtis</span>,  <span class="cit-name-given-names">M. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1874</span><strong>).</strong> <span class="cit-article-title">Notices of the North American Fungi</span>. <abbr class="cit-jnl-abbrev">Grevillea</abbr> <span class="cit-vol">3</span>, <span class="cit-fpage">49</span>–<span class="cit-lpage">64</span>.<span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-39-4-495</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1099/00207713-39-4-495&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Notices%20of%20the%20North%20American%20Fungi&amp;author=M.%20J.%20Berkeley&amp;author=M.%20A.%20Curtis&amp;publication_year=1874&amp;journal=Grevillea&amp;volume=3&amp;pages=49-64&amp;doi=10.1099%2F00207713-39-4-495">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-3" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.3">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Staley</span>,  <span class="cit-name-given-names">J. T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Bryant</span>,  <span class="cit-name-given-names">M. P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Pfennig</span>,  <span class="cit-name-given-names">N.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brockman</span>,  <span class="cit-name-given-names">E. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989a</span><strong>).</strong> <span class="cit-article-title">Genus I. <em>Polyangium</em> Link 1809, 42<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-vol">vol. 3</span>, pp. <span class="cit-fpage">2159</span>–<span class="cit-lpage">2162</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Staley</span>,  <span class="cit-name-given-names">J. T.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Bryant</span>,  <span class="cit-name-given-names">M. P.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Pfennig</span>,  <span class="cit-name-given-names">N.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span>
+                                 . <span class="cit-publ-loc">Baltimore</span>: <span class="cit-publ-name">Williams &amp; Wilkins</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20I.%20Polyangium%20Link%201809%2C%2042AL&amp;author=E.%20R.%20Brockman&amp;publication_year=1989a&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.4"
+                             data-doi="10.1099/00207713-39-4-495">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brockman</span>,  <span class="cit-name-given-names">E. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989b</span><strong>).</strong> <span class="cit-article-title"><em>Polyangium sorediatum</em> nom. rev. In <em>Validation of the Publication of New Names and New Combinations Previously Effectively Published Outside the IJSB</em>, List No. 31</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">495</span>–<span class="cit-lpage">497</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-39-4-495</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=39/4/495"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.5"
+                             data-doi="10.1099/00207713-39-4-495">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Brockman</span>,  <span class="cit-name-given-names">E. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989c</span><strong>).</strong> <span class="cit-article-title"><em>Polyangium spumosum</em> nom. rev. In <em>Validation of the Publication of New Names and New Combinations Previously Effectively Published Outside the IJSB</em>, List No. 31</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">495</span>–<span class="cit-lpage">497</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-39-4-495</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=39/4/495"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.6"
+                             data-doi="10.1128/JB.01091-10">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Garcia</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pistorius</span>,  <span class="cit-name-given-names">D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stadler</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Müller</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2011</span><strong>).</strong> <span class="cit-article-title">Fatty acid-related phylogeny of myxobacteria as an approach to discover polyunsaturated omega-3/6 fatty acids</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">193</span>, <span class="cit-fpage">1930</span>–<span class="cit-lpage">1942</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1128/JB.01091-10</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>21317327</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=193/8/1930"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-2" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.7">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jahn</span>,  <span class="cit-name-given-names">E.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1924</span><strong>).</strong> <span class="cit-source">Beitraege zur Botanischen Protistologie I. Die Polyangiden</span>. <span class="cit-publ-loc">Leipzig</span>: <span class="cit-publ-name">Verlag Gebrueder Borntraeger</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Beitraege%20zur%20Botanischen%20Protistologie%20I.%20Die%20Polyangiden&amp;author=E.%20Jahn&amp;publication_year=1924">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.8">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kofler</span>,  <span class="cit-name-given-names">L.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1913</span><strong>).</strong> <span class="cit-article-title">Die Myxobakterien der Umgebung von Wien</span>. <abbr class="cit-jnl-abbrev">Sitzungsberichte der Akademie der Wissenschaften in Wien Mathematisch-naturwissenschaftliche Klasse Abteilung I</abbr> <span class="cit-vol">122</span>, <span class="cit-fpage">845</span>–<span class="cit-lpage">876</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Die%20Myxobakterien%20der%20Umgebung%20von%20Wien&amp;author=L.%20Kofler&amp;publication_year=1913&amp;journal=Sitzungsberichte%20der%20Akademie%20der%20Wissenschaften%20in%20Wien%20Mathematisch-naturwissenschaftliche%20Klasse%20Abteilung%20I&amp;volume=122&amp;pages=845-876">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-3" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.9">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewska</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewski</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1926</span><strong>).</strong> <span class="cit-article-title">Miksobacterje Polski (Die Myxobakterien von Polen)</span>. <abbr class="cit-jnl-abbrev">Acta Societatis Botanicorum Poloniae</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">1</span>–<span class="cit-lpage">54</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Miksobacterje%20Polski%20%28Die%20Myxobakterien%20von%20Polen%29&amp;author=H.%20Krzemieniewska&amp;author=S.%20Krzemieniewski&amp;publication_year=1926&amp;journal=Acta%20Societatis%20Botanicorum%20Poloniae&amp;volume=4&amp;pages=1-54">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-4" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.10">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewska</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewski</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1927</span><strong>).</strong> <span class="cit-article-title">Miksobacterje Polski. Uzupelnienie. (Die Myxobakterien von Polen. Anhang)</span>. <abbr class="cit-jnl-abbrev">Acta Societatis Botanicorum Poloniae</abbr> <span class="cit-vol">5</span>, <span class="cit-fpage">79</span>–<span class="cit-lpage">98</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Miksobacterje%20Polski.%20Uzupelnienie.%20%28Die%20Myxobakterien%20von%20Polen.%20Anhang%29&amp;author=H.%20Krzemieniewska&amp;author=S.%20Krzemieniewski&amp;publication_year=1927&amp;journal=Acta%20Societatis%20Botanicorum%20Poloniae&amp;volume=5&amp;pages=79-98">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-3" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewska</span>,  <span class="cit-name-given-names">H.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krzemieniewski</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1930</span><strong>).</strong> <span class="cit-article-title">Miksobakterje Polski. Czesc Trzecia. (Die Myxobakterien von Polen. III. Teil)</span>. <abbr class="cit-jnl-abbrev">Acta Societatis Botanicorum Poloniae</abbr> <span class="cit-vol">7</span>, <span class="cit-fpage">250</span>–<span class="cit-lpage">273</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Miksobakterje%20Polski.%20Czesc%20Trzecia.%20%28Die%20Myxobakterien%20von%20Polen.%20III.%20Teil%29&amp;author=H.%20Krzemieniewska&amp;author=S.%20Krzemieniewski&amp;publication_year=1930&amp;journal=Acta%20Societatis%20Botanicorum%20Poloniae&amp;volume=7&amp;pages=250-273">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.12">
+                           <div class="cit-metadata">
+                              <ol class="cit-ed-list">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Lapage</span>,  <span class="cit-name-given-names">S. P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Sneath</span>,  <span class="cit-name-given-names">P. H. A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Lessel</span>,  <span class="cit-name-given-names">E. F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Skerman</span>,  <span class="cit-name-given-names">V. B. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Seeliger</span>,  <span class="cit-name-given-names">H. P. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Clark</span>,  <span class="cit-name-given-names">W. A.</span></span></li>
+                              </ol><cite> <strong>(editors) (</strong><span class="cit-pub-date">1992</span><strong>).</strong> <span class="cit-source">International Code of Nomenclature of Bacteria (1990 Revision). Bacteriological Code</span>. <span class="cit-publ-loc">Washington, DC</span>: <span class="cit-publ-name">American Society for Microbiology</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=International%20Code%20of%20Nomenclature%20of%20Bacteria%20%281990%20Revision%29.%20Bacteriological%20Code&amp;author=S.%20P.%20Lapage&amp;author=P.%20H.%20A.%20Sneath&amp;author=E.%20F.%20Lessel&amp;author=V.%20B.%20D.%20Skerman&amp;author=H.%20P.%20R.%20Seeliger&amp;author=W.%20A.%20Clark&amp;publication_year=1992">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-5" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.13"
+                             data-doi="10.1099/00207713-20-3-283">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McCurdy</span>,  <span class="cit-name-given-names">H. D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1970</span><strong>).</strong> <span class="cit-article-title">Studies on the taxonomy of the <em>Myxobacterales</em>. II. <em>Polyangium</em> and the demise of the <em>Sporangiaceae</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">20</span>, <span class="cit-fpage">283</span>–<span class="cit-lpage">296</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-20-3-283</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=20/3/283"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.14"
+                             data-doi="10.1099/00207713-21-1-40">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McCurdy</span>,  <span class="cit-name-given-names">H. D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1971</span><strong>).</strong> <span class="cit-article-title">Studies on the taxonomy of the <em>Myxobacterales</em>. III. <em>Chondromyces</em> and <em>Stigmatella</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">21</span>, <span class="cit-fpage">40</span>–<span class="cit-lpage">49</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-21-1-40</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=21/1/40"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-5" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.15"
+                             data-doi="10.1007/0-387-29298-5_276">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005a</span><strong>).</strong> <span class="cit-article-title">Genus III. <em>Chondromyces</em> Berkeley and Curtis in Berkeley 1874, 64<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1121</span>–<span class="cit-lpage">1129</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/0-387-29298-5_276</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/0-387-29298-5_276&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20III.%20Chondromyces%20Berkeley%20and%20Curtis%20in%20Berkeley%201874%2C%2064AL&amp;author=H.%20Reichenbach&amp;publication_year=2005a&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-5" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.16"
+                             data-doi="10.1007/0-387-29298-5_269">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005b</span><strong>).</strong> <span class="cit-article-title">Genus I. <em>Cystobacter</em> Schroeter 1886, 170<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1086</span>–<span class="cit-lpage">1096</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/0-387-29298-5_269</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/0-387-29298-5_269&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20I.%20Cystobacter%20Schroeter%201886%2C%20170AL&amp;author=H.%20Reichenbach&amp;publication_year=2005b&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-2" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.17"
+                             data-doi="10.1007/0-387-29298-5_272">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005c</span><strong>).</strong> <span class="cit-article-title">Genus IV. <em>Melittangium</em> Jahn 1924, 7<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1101</span>–<span class="cit-lpage">1104</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/0-387-29298-5_272</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/0-387-29298-5_272&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20IV.%20Melittangium%20Jahn%201924%2C%207AL&amp;author=H.%20Reichenbach&amp;publication_year=2005c&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-5" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_11.4354.18"
+                             data-doi="10.1007/0-387-29298-5_274">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005d</span><strong>).</strong> <span class="cit-article-title">Genus I. Polyangium Link 1809, 42<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1110</span>–<span class="cit-lpage">1118</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/0-387-29298-5_274</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/0-387-29298-5_274&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Genus%20I.%20Polyangium%20Link%201809%2C%2042AL&amp;author=H.%20Reichenbach&amp;publication_year=2005d&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><div class="cit ref-cit ref-book no-rev-xref" id="cit-63.Pt_11.4354.19">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Reichenbach</span>,  <span class="cit-name-given-names">H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2005e</span><strong>).</strong> <span class="cit-article-title">Order VIII. Myxococcales Tchan, Pochon and Prévot 1948, 398<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span><em>,</em> <span class="cit-edition">2nd edn</span>, <span class="cit-vol">vol. 2</span>, pp. <span class="cit-fpage">1059</span>–<span class="cit-lpage">1072</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Brenner</span>,  <span class="cit-name-given-names">D. J.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Garrity</span>,  <span class="cit-name-given-names">G. M.</span></span>
+                                 . <span class="cit-publ-loc">New York</span>: <span class="cit-publ-name">Springer</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Order%20VIII.%20Myxococcales%20Tchan%2C%20Pochon%20and%20Pr%C3%A9vot%201948%2C%20398AL&amp;author=H.%20Reichenbach&amp;publication_year=2005e&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.20"
+                             data-doi="10.1099/00207713-30-1-225">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Skerman</span>,  <span class="cit-name-given-names">V. B. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">McGowan</span>,  <span class="cit-name-given-names">V.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sneath</span>,  <span class="cit-name-given-names">P. H. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1980</span><strong>).</strong> <span class="cit-article-title">Approved lists of bacterial names</span>. <abbr class="cit-jnl-abbrev">Int J Syst Bacteriol</abbr> <span class="cit-vol">30</span>, <span class="cit-fpage">225</span>–<span class="cit-lpage">420</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-30-1-225</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=PDF&amp;journalCode=ijs&amp;resid=30/1/225"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.21"
+                             data-doi="10.1086/327531">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thaxter</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1897</span><strong>).</strong> <span class="cit-article-title">Further observations on the <em>Myxobacteriaceae</em></span>. <abbr class="cit-jnl-abbrev">Bot Gaz</abbr> <span class="cit-vol">23</span>, <span class="cit-fpage">395</span>–<span class="cit-lpage">411</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1086/327531</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1086/327531&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Further%20observations%20on%20the%20Myxobacteriaceae&amp;author=R.%20Thaxter&amp;publication_year=1897&amp;journal=Bot%20Gaz&amp;volume=23&amp;pages=395-411&amp;doi=10.1086%2F327531">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.22"
+                             data-doi="10.1086/328505">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Thaxter</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1904</span><strong>).</strong> <span class="cit-article-title">Notes on the <em>Myxobacteriaceae</em></span>. <abbr class="cit-jnl-abbrev">Bot Gaz</abbr> <span class="cit-vol">37</span>, <span class="cit-fpage">405</span>–<span class="cit-lpage">416</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1086/328505</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1086/328505&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Notes%20on%20the%20Myxobacteriaceae&amp;author=R.%20Thaxter&amp;publication_year=1904&amp;journal=Bot%20Gaz&amp;volume=37&amp;pages=405-416&amp;doi=10.1086%2F328505">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_11.4354.23"
+                             data-doi="10.1016/j.syapm.2012.12.006">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yarza</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Spröer</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Swiderski</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Mrotzek</span>,  <span class="cit-name-given-names">N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Spring</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Tindall</span>,  <span class="cit-name-given-names">B. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gronow</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pukall</span>,  <span class="cit-name-given-names">R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Klenk</span>,  <span class="cit-name-given-names">H. P.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2013</span><strong>).</strong> <span class="cit-article-title">Sequencing orphan species initiative (SOS): Filling the gaps in the 16S rRNA gene sequence database for all species with validly
+                                    published names</span>. <abbr class="cit-jnl-abbrev">Syst Appl Microbiol</abbr> <span class="cit-vol">36</span>, <span class="cit-fpage">69</span>–<span class="cit-lpage">73</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1016/j.syapm.2012.12.006</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>23410935</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1016/j.syapm.2012.12.006&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=23410935&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Sequencing%20orphan%20species%20initiative%20%28SOS%29%3A%20Filling%20the%20gaps%20in%20the%2016S%20rRNA%20gene%20sequence%20database%20for%20all%20species%20with%20validly%20published%20names&amp;author=P.%20Yarza&amp;author=C.%20Spr%C3%B6er&amp;author=J.%20Swiderski&amp;author=N.%20Mrotzek&amp;author=S.%20Spring&amp;author=B.%20J.%20Tindall&amp;author=S.%20Gronow&amp;author=R.%20Pukall&amp;author=H.%20P.%20Klenk&amp;publication_year=2013&amp;journal=Syst%20Appl%20Microbiol&amp;volume=36&amp;pages=69-73&amp;doi=10.1016%2Fj.syapm.2012.12.006&amp;pmid=23410935">Google Scholar</a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_11/4350.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_11/4361.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_11.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="free-article">
+               <span class="free-article-note">
+                  FREE ARTICLE
+                  </span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    
+                              
+                              doi:
+                              <span title="10.1099/ijs.0.056440-0" class="slug-doi">10.1099/ijs.0.056440-0
+                                 </span>
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    November 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 11 
+                                    </span><span class="slug-pages">
+                                    4354-4360
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li class="abstract-view-link primary"><a href="/content/63/Pt_11/4354.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_11/4354.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_11/4354/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_11/4354">PPT Slides of All Figures</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings last-child">
+                              <li><a class="tocsection-search"
+                                    href="/search?tocsectionid=Taxonomic+Note&amp;sortspec=date&amp;submit=Submit">Taxonomic Note</a></li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_11%2F4354&amp;current-view-path=/content/63/Pt_11/4354.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_11%2F4354&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4354.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_11/4354&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_11/4354.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.056440-0&amp;citation=Lang%20and%20Reichenbach%2063%20%28Pt%2011%29:%204354&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_11%2F4354&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=24187023&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_11%2F4354">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_11/4354.full?cited-by=yes&amp;legid=ijs;63/Pt_11/4354#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_11/4354" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_11%2F4354&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4354.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ALang%20author%3AE.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Lang, E.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AReichenbach%20author%3AH.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Reichenbach, H.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_11/4354.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=24187023&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Lang%20E&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Lang, E.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Reichenbach%20H&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Reichenbach, H.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/24187023"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_11/4354.full?related-urls=yes&amp;legid=ijs;63/Pt_11/4354#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_11/4354&amp;title=Designation%20of%20type%20strains%20for%20seven%20species%20of%20the%20order%20Myxococcales%20and%20proposal%20for%20neotype%20strains%20of%20Cystobacter%20ferrugineus%2C%20Cystobacter%20minus%20and%20Polyangium%20fumosum+--+Lang%20and%20Reichenbach%2063%20%28Pt%2011%29%3A%204354+--+IJSEM&amp;doi=10.1099/ijs.0.056440-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.pdf
new file mode 100644
index 00000000..2c9c5ebd
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/ijs056440.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/ijs056440.pdf
new file mode 100644
index 00000000..15334481
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_11_4354.full/ijs056440.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/52654.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/52654.pdf
new file mode 100644
index 00000000..ba6b2ced
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/52654.pdf differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/F1.large.jpg b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/F1.large.jpg
new file mode 100644
index 00000000..f2192509
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/F1.large.jpg differ
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.html b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.html
new file mode 100644
index 00000000..80253747
--- /dev/null
+++ b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.html
@@ -0,0 +1,1263 @@
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html
+      xmlns="http://www.w3.org/1999/xhtml"
+      xml:lang="en"
+      lang="en">
+   <head>
+      <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
+      <title>Spirosoma endophyticum sp. nov., isolated from Zn- and Cd-accumulating Salix caprea </title>
+      <meta name="googlebot" content="NOODP" />
+      <meta name="HW.ad-path" content="/cgi/content/full/63/Pt_12/4586" />
+      <meta content="/ijs/63/Pt_12/4586.atom" name="HW.identifier" />
+      <meta name="DC.Format" content="text/html" />
+      <meta name="DC.Language" content="en" />
+      <meta content="Spirosoma endophyticum sp. nov., isolated from Zn- and Cd-accumulating Salix caprea"
+            name="DC.Title" />
+      <meta content="10.1099/ijs.0.052654-0" name="DC.Identifier" />
+      <meta content="2013-12-01" name="DC.Date" />
+      <meta content="Society for General Microbiology" name="DC.Publisher" />
+      <meta content="Julia Fries" name="DC.Contributor" />
+      <meta content="Stefan Pfeiffer" name="DC.Contributor" />
+      <meta content="Melanie Kuffner" name="DC.Contributor" />
+      <meta content="Angela Sessitsch" name="DC.Contributor" />
+      <meta content="International Journal of Systematic and Evolutionary&#xA;                Microbiology"
+            name="citation_journal_title" />
+      <meta content="Int J Syst Evol&#xA;                Microbiol"
+            name="citation_journal_abbrev" />
+      <meta content="1466-5026" name="citation_issn" />
+      <meta content="1466-5034" name="citation_issn" />
+      <meta name="citation_author" content="Julia Fries" />
+      <meta name="citation_author_institution"
+            content="AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria" />
+      <meta name="citation_author" content="Stefan Pfeiffer" />
+      <meta name="citation_author_institution"
+            content="AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria" />
+      <meta name="citation_author" content="Melanie Kuffner" />
+      <meta name="citation_author_institution"
+            content="AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria" />
+      <meta name="citation_author" content="Angela Sessitsch" />
+      <meta name="citation_author_institution"
+            content="AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria" />
+      <meta content="Spirosoma endophyticum sp. nov., isolated from Zn- and Cd-accumulating Salix caprea"
+            name="citation_title" />
+      <meta content="12/01/2013" name="citation_date" />
+      <meta content="63" name="citation_volume" />
+      <meta content="Pt 12" name="citation_issue" />
+      <meta content="4586" name="citation_firstpage" />
+      <meta content="4590" name="citation_lastpage" />
+      <meta content="63/Pt_12/4586" name="citation_id" />
+      <meta content="63/Pt 12/4586" name="citation_id_from_sass_path" />
+      <meta content="ijs;63/Pt_12/4586" name="citation_mjid" />
+      <meta content="10.1099/ijs.0.052654-0" name="citation_doi" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_12/4586.abstract"
+            name="citation_abstract_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_12/4586.full"
+            name="citation_fulltext_html_url" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_12/4586.full.pdf"
+            name="citation_pdf_url" />
+      <meta content="/content/63/Pt_12.cover.gif" name="issue_cover_image" />
+      <meta content="http://ijs.sgmjournals.org/content/63/Pt_12/4586"
+            name="citation_public_url" />
+      <meta content="23907231" name="citation_pmid" />
+      <meta name="citation_access" content="all" />
+      <meta name="citation_fulltext_world_readable" content="" />
+      <meta name="citation_section" content="Bacteroidetes" />
+      <meta name="robots" content="noarchive,nofollow" />
+      <meta name="googlebot" content="noarchive" />
+      <link href="/content/63/Pt_12/4580.short" rel="prev" />
+      <link href="/content/63/Pt_12/4591.short" rel="next" />
+      <link rel="stylesheet" type="text/css" media="all" href="/shared/css/hw-global.css" />
+      <link rel="stylesheet" type="text/css" media="print" href="/shared/css/hw-print.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/standard-designs/design25/main.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/local/css/hw-local-global.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/jquery.fancybox-1.3.4.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/publisher/css/hw-publisher-page-content.css" />
+      <link rel="stylesheet" type="text/css" media="all"
+            href="/shared/css/hw-global-colexpand.css" /><script type="text/javascript" id="session-d120882126e1">var callbackToken='5638CE2AFC47188';</script><script type="text/javascript" id="session-d120882126e3">
+                      var subCode='sgmjournal_sub';
+                    </script><script type="text/javascript" src="/shared/js/jquery-min.js"></script><script type="text/javascript" src="/shared/js/fingerprint.js"></script><script type="text/javascript" src="/shared/js/hw-shared.js"></script><script type="text/javascript" src="/shared/js/design/hw-design1.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-shared.js"></script><script type="text/javascript" src="/shared/js/pages/hw-content.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.fancybox-1.3.4.js"></script><script type="text/javascript" src="/shared/js/fancybox/jquery.easing-1.3.pack.js"></script><script type="text/javascript"
+              src="/shared/js/fancybox/jquery.mousewheel-3.0.4.pack.js"></script><script type="text/javascript" src="/shared/js/util/content.jquery.addVariantLink.js"></script><script type="text/javascript" src="/publisher/js/hw-publisher-custom-free.js"></script><script type="text/javascript" src="/shared/js/util/hw-col-expand.js"></script><script type="text/javascript"
+              src="https://data.namesforlife.com/script/NamesforLife.js"></script></head>
+   <body>
+      <div class="hw-gen-page pagetype-content" id="pageid-content" itemscope="itemscope"
+           itemtype="http://schema.org/ScholarlyArticle">
+         <div id="header">
+            
+            <h1><a id="logo" href="/"><span>International Journal of Systematic and Evolutionary Microbiology</span></a></h1>
+            
+            <p id="skip-link">
+               <a href="#content-block">Skip to main page content</a>
+               
+            </p>
+            
+            <ul class="button-list header-buttons">
+               <li class="first"><a href="/" title="HOME"><span>HOME</span></a></li>
+               <li><a href="/content/current" title="CURRENT ISSUE"><span>CURRENT ISSUE</span></a></li>
+               <li><a href="/content" title="ARCHIVE"><span>ARCHIVE</span></a></li>
+               <li><a href="/search" title="SEARCH"><span>SEARCH</span></a></li>
+               <li><a href="/help" title="HELP"><span>HELP</span></a></li>
+               <li class="last"><a href="/feedback" title="CONTACT US"><span>CONTACT US</span></a></li>
+            </ul>
+            
+            
+            <div class="header-qs">
+               
+               <form class="searchbox" action="/search" method="get">
+                  <div>
+                     	<label for="header-qs-input" id="header-qs-search-label">Search for Keyword:</label>
+                     <input value="" title="Search" type="text" name="fulltext" id="header-qs-input" /><input type="hidden" name="submit" value="yes" /><label for="header-qs-search-go" id="header-qs-search-label">GO</label><input value="GO" alt="Link: Go" type="image" id="header-qs-search-go"
+                            src="/shared/img/standard-design/design2/go.gif" /> 
+                     
+                  </div>
+                  <div class="adv-search-link"><a href="/search">Advanced Search</a></div>
+               </form>
+               
+               
+            </div>
+            
+            <div class="header-ac-elements">
+               
+               <div id="authstring" class="suppress-header-login">
+                  
+                  <ul>
+                     <li class="subscr-ref">Institution: THE NATURAL HISTORY MUSEUM</li>
+                     <li>
+                        <a href="/login?uri=http%3A%2F%2Fijs.sgmjournals.org%2Fcontent%2F63%2FPt_12%2F4586.full">
+                           Sign In as Member / Individual
+                           </a>
+                        
+                     </li>
+                  </ul>           
+                  
+               </div> 
+               
+               <div id="hdr-login" class="suppress-header-login"></div>
+               
+            </div>
+            
+            <div class="banner-ads">
+               		
+               <ul>
+                  <li class="position-1 no-ad hdr_left"><span>  </span></li>
+               </ul>
+               	
+            </div>
+            
+            <div class="bar">
+               
+               <div class="bar-inner"></div>
+               
+            </div>
+            
+         </div>
+         <div id="content-block">
+            <div class="article fulltext-view " itemprop="articleBody"><span class="highwire-journal-article-marker-start"></span><h1 id="article-title-1" itemprop="headline"><em>Spirosoma</em> <em>endophyticum</em> sp. nov., isolated from Zn- and Cd-accumulating <em>Salix caprea</em></h1>
+               <div class="contributors">
+                  <ol class="contributor-list" id="contrib-group-1">
+                     <li class="contributor" id="contrib-1" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Julia+Fries&amp;sortspec=date&amp;submit=Submit">Julia Fries</a></span>, 
+                     </li>
+                     <li class="contributor" id="contrib-2" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Stefan+Pfeiffer&amp;sortspec=date&amp;submit=Submit">Stefan Pfeiffer</a></span>, 
+                     </li>
+                     <li class="contributor" id="contrib-3" itemprop="author" itemscope="itemscope"
+                         itemtype="http://schema.org/Person"><span class="name" itemprop="name"><a class="name-search"
+                              href="/search?author1=Melanie+Kuffner&amp;sortspec=date&amp;submit=Submit">Melanie Kuffner</a></span> and 
+                     </li>
+                     <li class="last" id="contrib-4"><span class="name"><a class="name-search"
+                              href="/search?author1=Angela+Sessitsch&amp;sortspec=date&amp;submit=Submit">Angela Sessitsch</a></span></li>
+                  </ol>
+                  <ol class="affiliation-list">
+                     <li class="aff"><a id="aff-1" name="aff-1"></a><address>AIT Austrian Institute of Technology GmbH, Bioresources Unit, Tulln, Austria</address>
+                     </li>
+                  </ol>
+                  <ol class="corresp-list">
+                     <li class="corresp" id="corresp-1"><strong>Correspondence</strong><br /> Angela Sessitsch <span class="em-link"><span class="em-addr">angela.sessitsch{at}ait.ac.at</span></span></li>
+                  </ol>
+               </div>
+               <div class="section abstract" id="abstract-1" itemprop="description">
+                  <div class="section-nav">
+                     <div class="nav-placeholder"> </div><a href="#fn-group-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Abstract</h2>
+                  
+                  <p id="p-4">A Gram-reaction-negative, yellow-pigmented strain, designated EX36<sup>T</sup>, was characterized using a polyphasic approach comprising phylogenetic, morphological and genotypic analyses. The endophytic
+                     strain was isolated from Zn/Cd-accumulating <em>Salix caprea</em> in Arnoldstein, Austria. Analysis of the 16S rRNA gene demonstrated that the novel strain is most closely related to members
+                     of the genus <span class="named-content genus" id="named-content-2"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                           href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> (95 % sequence similarity with <span class="named-content species" id="named-content-3"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma linguale"
+                           href="doi:10.1601/nm.8318"><em>Spirosoma linguale</em></a></span>). The genomic DNA G+C content was 47.2 mol%. The predominant quinone was MK-7 and the major cellular fatty acids were summed feature
+                     3 (iso-C<sub>15 : 0</sub> 2-OH and/or C<sub>16 : 1</sub>ω7<em>c</em>), C<sub>16 : 1</sub>ω5<em>c</em>, iso-C<sub>17 : 0</sub> 3-OH and iso-C<sub>15 : 0</sub>. On the basis of its phenotypic and genotypic properties, strain EX36<sup>T</sup> should be classified as a novel species of the genus <span class="named-content genus" id="named-content-4"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                           href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span>, for which the name <span class="named-content genus" id="named-content-5"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                           href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> <em>endophyticum</em> sp. nov. is proposed. The type strain is EX36<sup>T</sup> ( = DSM 26130<sup>T</sup> = LMG 27272<sup>T</sup>).
+                  </p>
+                  
+               </div>
+               <div class="section fn-group" id="fn-group-1">
+                  <div class="section-nav"><a href="#abstract-1" title="Abstract" class="prev-section-link"><span>Previous Section</span></a><a href="#sec-1" title="Next Section" class="next-section-link"><span>Next Section</span></a></div>
+                  <ul>
+                     <li class="fn-other" id="fn-1">
+                        <p id="p-1">The GenBank/EMBL/DDBJ accession number for the 16S rRNA gene sequence of strain EX36<sup>T</sup> is GQ342559.
+                        </p>
+                     </li>
+                     <li class="fn-supplementary-material" id="fn-2">
+                        <p id="p-2">A supplementary figure is available with the online version of this paper.</p>
+                     </li>
+                  </ul>
+               </div>
+               <div class="license" id="license-1">
+                  <p id="p-3">This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted
+                     use, distribution, and reproduction in any medium, provided the original work is properly cited.
+                  </p>
+               </div>
+               <p id="p-5">The genus <span class="named-content genus" id="named-content-6"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> was first proposed by <a id="xref-ref-11-1" class="xref-bibr" href="#ref-11">Larkin &amp; Borrall (1984)</a> and belongs to the family <span class="named-content family" id="named-content-7"><a class="namesforlife" rel="namesforlife-name" title="Flexibacteraceae"
+                        href="doi:10.1601/nm.8247"><em>Flexibacteraceae</em></a></span> in the phylum <span class="named-content phylum" id="named-content-8"><a class="namesforlife" rel="namesforlife-name" title="Bacteroidetes"
+                        href="doi:10.1601/nm.7927"><em>Bacteroidetes</em></a></span>. At the time of writing the genus <span class="named-content genus" id="named-content-9"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> includes five species, the type species <span class="named-content species" id="named-content-10"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma linguale"
+                        href="doi:10.1601/nm.8318"><em>Spirosoma linguale</em></a></span> (<a id="xref-ref-11-2" class="xref-bibr" href="#ref-11">Larkin &amp; Borrall, 1984</a>), <span class="named-content species" id="named-content-11"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma rigui"
+                        href="doi:10.1601/nm.11571"><em>Spirosoma rigui</em></a></span> (<a id="xref-ref-1-1" class="xref-bibr" href="#ref-1">Baik <em>et al.</em>, 2007</a>), <span class="named-content species" id="named-content-12"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma panaciterrae"
+                        href="doi:10.1601/nm.13622"><em>Spirosoma panaciterrae</em></a></span> (<a id="xref-ref-21-1" class="xref-bibr" href="#ref-21">Ten <em>et al.</em>, 2009</a>), <span class="named-content species" id="named-content-13"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma spitsbergense"
+                        href="doi:10.1601/nm.14214"><em>Spirosoma spitsbergense</em></a></span> and <span class="named-content species" id="named-content-14"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma luteum"
+                        href="doi:10.1601/nm.14215"><em>Spirosoma luteum</em></a></span> (<a id="xref-ref-6-1" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>). So far, <span class="named-content genus" id="named-content-15"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> strains have been isolated from various habitats, such as fresh water, permafrost soil or soil from a ginseng field. Strain
+                  EX36<sup>T</sup>, which is proposed in this study to represent a novel species, was isolated in the course of the analysis of bacteria associated
+                  with the heavy metal accumulating plant <em>Salix caprea</em> (<a id="xref-ref-10-1" class="xref-bibr" href="#ref-10">Kuffner <em>et al.</em>, 2010</a>).
+               </p>
+               <p id="p-6">For the isolation of strain EX36<sup>T</sup>, <em>Salix caprea</em> trees growing on a former Zn/Pb mining and processing site in Arnoldstein (Austria) were sampled (<a id="xref-ref-10-2" class="xref-bibr" href="#ref-10">Kuffner <em>et al.</em>, 2010</a>). Xylem sap extract was directly plated on 10 % tryptic soy agar (TSA, Merck Darmstadt, Germany) and after 1 week of incubation
+                  single colonies were picked and streaked on phosphate-poor MOPS medium (<a id="xref-ref-14-1" class="xref-bibr" href="#ref-14">Neidhardt <em>et al.</em>, 1974</a>) containing 0.1 % glucose and 1 mM ZnSO<sub>4</sub>. The strain was routinely cultured on 10 % TSA. For maintenance, the cell material was suspended in 10 % tryptic soy broth
+                  (TSB, Merck, Darmstadt, Germany) containing 15 % glycerol and stored at −80 °C. Endophytic colonization was confirmed by inoculating
+                  two maize and two potato cultivars, growing the plants under <em>in vitro</em> conditions and reisolating the strain from root and stem tissues.
+               </p>
+               <p id="p-7">For the extraction of bacterial DNA the Gen Elute Bacterial Genomic DNA kit (Sigma–Aldrich) was used. The 16S rRNA gene was
+                  amplified by PCR using the primers 8f (5′-AGAGTTTGATCCTGGCTCAG-3′) (<a id="xref-ref-22-1" class="xref-bibr" href="#ref-22">Weisburg <em>et al.</em>, 1991</a>) and 1520r (5′-AAGGAGGTGATCCAGCCGCA-3′) (<a id="xref-ref-5-1" class="xref-bibr" href="#ref-5">Edwards <em>et al.</em>, 1989</a>). Sequencing of the amplified PCR product was performed by LGC Genomics (Berlin, Germany). The obtained partial sequences
+                  were assembled using the programs BioEdit (<a id="xref-ref-7-1" class="xref-bibr" href="#ref-7">Hall, 1999</a>) and <span class="sc">seqman</span> <span class="sc">pro</span> (DNAstar). The consensus sequence was subjected to nucleotide <span class="sc">blast</span> analysis (<a href="http://blast.ncbi.nlm.nih.gov/Blast.cgi">http://blast.ncbi.nlm.nih.gov/Blast.cgi</a>) to search the database of the National Center for Biotechnology Information (NCBI) for the closest relatives of the bacterial
+                  strains with validly published names. Sequence comparisons indicated that the isolate belonged to the family <span class="named-content family" id="named-content-16"><a class="namesforlife" rel="namesforlife-name" title="Flexibacteraceae"
+                        href="doi:10.1601/nm.8247"><em>Flexibacteraceae</em></a></span>.
+               </p>
+               <p id="p-8">Nearly complete 16S rRNA gene sequences of strain EX36<sup>T</sup> and of all species of the genus <span class="named-content genus" id="named-content-17"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> with validly published names and of selected species of the family <span class="named-content family" id="named-content-18"><a class="namesforlife" rel="namesforlife-name" title="Cytophagaceae"
+                        href="doi:10.1601/nm.14010"><em>Cytophagaceae</em></a></span>, which were downloaded from the NCBI GenBank sequence database, were imported into the <span class="sc">arb</span> program package (<a id="xref-ref-12-1" class="xref-bibr" href="#ref-12">Ludwig <em>et al.</em>, 2004</a>). Sequences were aligned into the <span class="sc">silva</span> SSURef 102 (<a id="xref-ref-15-1" class="xref-bibr" href="#ref-15">Pruesse <em>et al.</em>, 2007</a>) database by using the option ‘autosearch by PT_server’ of the <span class="sc">arb</span> editor. Alignments were manually corrected using the <span class="sc">arb</span> editor. A maximum-likelihood phylogenetic tree was reconstructed using RAxML v. 7.4.2 (<a id="xref-ref-18-1" class="xref-bibr" href="#ref-18">Stamatakis, 2006a</a>) by execution of the following command line in raxmlGUI v. 1.3 (<a id="xref-ref-16-1" class="xref-bibr" href="#ref-16">Silvestro &amp; Michalak, 2012</a>): raxmlHPC.exe -T 2 &lt;number of processors &gt;-f a -m GTRGAMMA -x 336 &lt;seed1 &gt;-p 115 &lt;seed2 &gt;-N 100 &lt;bootstraps &gt;-o CarHomin
+                  &lt;outgroup &gt;-s &lt;input file &gt;-O &lt;output order &gt;. We used a combination of the Gamma model of rate heterogeneity (<a id="xref-ref-23-1" class="xref-bibr" href="#ref-23">Yang, 1994</a>) and the CAT model (<a id="xref-ref-19-1" class="xref-bibr" href="#ref-19">Stamatakis, 2006b</a>), which was implemented in the rapid bootstrapping algorithm (<a id="xref-ref-20-1" class="xref-bibr" href="#ref-20">Stamatakis <em>et al.</em>, 2008</a>). Bootstrapping was performed with 100 replicates, using general time reversible (GTR) as the substitution matrix. In <a id="xref-fig-1-1" class="xref-fig" href="#F1">Fig. 1</a> the position of EX36<sup>T</sup> in the distinct cluster of the genus <span class="named-content genus" id="named-content-19"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> can be clearly recognized. The calculation of pairwise sequence similarity using a global alignment algorithm (<a id="xref-ref-13-1" class="xref-bibr" href="#ref-13">Myers &amp; Miller, 1988</a>), which was implemented at the EzTaxon-e server (<a href="http://eztaxon-e.ezbiocloud.net/">http://eztaxon-e.ezbiocloud.net/</a>; <a id="xref-ref-8-1" class="xref-bibr" href="#ref-8">Kim <em>et al.</em>, 2012</a>) showed highest sequence similarity values for strain EX36<sup>T</sup> to <span class="named-content species" id="named-content-20"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma linguale"
+                        href="doi:10.1601/nm.8318"><em>Spirosoma linguale</em></a></span> DSM 74<sup>T</sup> (95.7 %), followed by <span class="named-content species" id="named-content-21"><a class="namesforlife" rel="namesforlife-name" title="S. luteum"
+                        href="doi:10.1601/nm.14215"><em>S. luteum</em></a></span> SPM-10<sup>T</sup> (93.9 %), <span class="named-content species" id="named-content-22"><a class="namesforlife" rel="namesforlife-name" title="S. spitsbergense"
+                        href="doi:10.1601/nm.14214"><em>S. spitsbergense</em></a></span> SPM-9<sup>T</sup> (93.9 %), <span class="named-content species" id="named-content-23"><a class="namesforlife" rel="namesforlife-name" title="S. rigui"
+                        href="doi:10.1601/nm.11571"><em>S. rigui</em></a></span> KCTC 12531<sup>T</sup> (93.8 %) and <span class="named-content species" id="named-content-24"><a class="namesforlife" rel="namesforlife-name" title="S. panaciterrae"
+                        href="doi:10.1601/nm.13622"><em>S. panaciterrae</em></a></span> Gsoil 1519<sup>T</sup> (92.5 %).
+               </p>
+               <div id="F1" class="fig pos-float type-figure  odd">
+                  <div class="fig-inline"><a href="4586/F1.expansion.html"><img alt="Fig. 1. " src="4586/F1.small.gif" /></a><div class="callout"><span>View larger version:</span><ul class="callout-links">
+                           <li><a href="4586/F1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4586/F1.expansion.html">In a new window</a></li>
+                        </ul>
+                        <ul class="fig-services">
+                           <li class="ppt-link"><a href="/powerpoint/63/Pt_12/4586/F1">Download as PowerPoint Slide</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="fig-caption"><span class="fig-label">Fig. 1. </span> 
+                     
+                     <p id="p-9" class="first-child">Maximum-likelihood tree (bootstrap: 100 replicates) based on 16S rRNA gene sequence data (sequence length 1296 bp) showing
+                        the phylogenetic position of strain EX36<sup>T</sup> among related species selected from the phylum <span class="named-content phylum" id="named-content-25"><a class="namesforlife" rel="namesforlife-name" title="Bacteroidetes"
+                              href="doi:10.1601/nm.7927"><em>Bacteroidetes</em></a></span>. <span class="named-content species" id="named-content-26"><a class="namesforlife" rel="namesforlife-name" title="Cardiobacterium hominis"
+                              href="doi:10.1601/nm.2271"><em>Cardiobacterium hominis</em></a></span> ATCC 15826<sup>T</sup> (M35014) was used as an outgroup.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-10">Growth of strain EX36<sup>T</sup> was tested at various temperatures (4, 20, 23, 28, 37 and 41 °C) on 10 % TSA plates for up to 1 week. The pH range for growth
+                  (pH 4, 5, 6, 7, 8 and 9) was determined by measuring OD<sub>600</sub> changes in cultures incubated at 28 °C with shaking at 190 r.p.m. compared with an uninoculated control. Salt tolerance was
+                  determined by amending 10 % TSB with NaCl to final concentrations of 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.8, 1.0, 2.0, 3.0, 4.0,
+                  5.0 and 10.0 % NaCl (w/v). The Gram reaction of strain EX36<sup>T</sup> was determined by using the non-staining method described by <a id="xref-ref-3-1" class="xref-bibr" href="#ref-3">Buck (1982)</a>. Pigment analysis of cells grown on 10 % TSA was performed in triplicates by extraction with acetone according to the method
+                  described by <a id="xref-ref-4-1" class="xref-bibr" href="#ref-4">Denner <em>et al.</em> (2001)</a> using a U-2900 spectrophotometer (Hitachi). Minimal inhibition concentrations (MIC) for Zn and Cd were determined according
+                  to the method of <a id="xref-ref-9-1" class="xref-bibr" href="#ref-9">Kuffner <em>et al.</em> (2008)</a>. Additionally cells were tested for flexirubin pigments using the method described by <a id="xref-ref-2-1" class="xref-bibr" href="#ref-2">Bernardet <em>et al.</em> (2002)</a>. Oxidase and catalase activity were tested as outlined by <a id="xref-ref-17-1" class="xref-bibr" href="#ref-17">Smibert &amp; Krieg (1994)</a>. Additional biochemical tests were performed by the Identification Service of the DSMZ (Leibniz-Institut DSMZ-Deutsche Sammlung
+                  von Mikroorganismen und Zellkulturen GmbH, Braunschweig, Germany) using API 20NE (bioMérieux) and GENIII plates (Biolog).
+                  Cell morphology after 4 days of growth at 28 °C was investigated using fluorescence and bright-field microscopy (IX81, Olympus;
+                  Axiovert 200 M, Zeiss). Antibiotic susceptibility was determined by the disc diffusion method on 10 % TSA plates.
+               </p>
+               <p id="p-11">Cells of strain EX36<sup>T</sup> were rod-shaped, Gram-reaction-negative and 1.2×2–17.5 µm in size (Fig. S1, available in IJSEM Online). Most cells were arranged
+                  in pairs, but filaments up to 55 µm were observed. EX36<sup>T</sup> showed yellowish, opaque, semi-translucent colonies with a smooth and shiny surface and a circular and convex shape. The
+                  diameter of colonies grown on 10 % TSA at 28 °C for 1 week varied between 1.5 and 3.0 mm. The strain was positive for catalase
+                  and oxidase activity; detailed results of biochemical and physiological analyses are listed in <a id="xref-table-wrap-1-1" class="xref-table" href="#T1">Table 1</a> and in the species description. In contrast to other species of the genus <span class="named-content genus" id="named-content-27"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span>, cells of EX36<sup>T</sup> showed a length up to 17.5 µm, did not grow at 5 and 42 °C, did not tolerate NaCl concentrations higher than 0.6 % (w/v),
+                  had the lowest genomic G+C content and showed differences in antibiotic susceptibility. Low tolerance of Cd and Zn was observed
+                  (slow growth at 4 mM Zn and 1 mM Cd). The analysis of yellow pigments showed three absorption maxima at 428, 453 and 483 nm.
+                  EX36<sup>T</sup> was negative for flexirubin-type pigments.
+               </p>
+               <div id="T1" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4586/T1.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4586/T1.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 1. </span> 
+                     <span class="caption-title">Differential characteristics of strain EX36<sup>T</sup> and recognized species of the genus <span class="named-content genus" id="named-content-28"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                              href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span></span>
+                     
+                     <p id="p-12" class="first-child">Strains: 1, EX36<sup>T</sup> (data from this study); 2, <span class="named-content species" id="named-content-29"><a class="namesforlife" rel="namesforlife-name" title="S. linguale"
+                              href="doi:10.1601/nm.8318"><em>S. linguale</em></a></span> DSM 74<sup>T</sup> (<a id="xref-ref-11-3" class="xref-bibr" href="#ref-11">Larkin &amp; Borrall, 1984</a>; and this study); 3, <span class="named-content species" id="named-content-30"><a class="namesforlife" rel="namesforlife-name" title="S. luteum"
+                              href="doi:10.1601/nm.14215"><em>S. luteum</em></a></span> DSM 19990<sup>T</sup> (<a id="xref-ref-6-2" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>); 4, <span class="named-content species" id="named-content-31"><a class="namesforlife" rel="namesforlife-name" title="S. spitsbergense"
+                              href="doi:10.1601/nm.14214"><em>S. spitsbergense</em></a></span> DSM 19989<sup>T</sup> (<a id="xref-ref-6-3" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>); 5, <span class="named-content species" id="named-content-32"><a class="namesforlife" rel="namesforlife-name" title="S. rigui"
+                              href="doi:10.1601/nm.11571"><em>S. rigui</em></a></span> KCTC 12531<sup>T</sup> (<a id="xref-ref-1-2" class="xref-bibr" href="#ref-1">Baik <em>et al.</em>, 2007</a>); 6, <span class="named-content species" id="named-content-33"><a class="namesforlife" rel="namesforlife-name" title="S. panaciterrae"
+                              href="doi:10.1601/nm.13622"><em>S. panaciterrae</em></a></span> DSM 21099<sup>T</sup> (<a id="xref-ref-21-2" class="xref-bibr" href="#ref-21">Ten <em>et al.</em>, 2009</a>). All strains are catalase-positive, Gram-reaction-negative and negative for nitrate reduction, utilization of gluconate,
+                        caprate, adipate and glycerol. +, Positive; −, negative; <span class="sc">w</span>, weakly positive; <span class="sc">nd</span>, not determined; <span class="sc">r</span>, resistant; <span class="sc">s</span>, susceptible.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-13">Analyses of cellular fatty acid composition, respiratory quinones, polar lipids and chromosomal G+C content were performed
+                  by the Identification Service of the DSMZ. The fatty acid profile was determined according to the protocol of the Microbial
+                  Identification System (MIDI). The major fatty acids of strain EX36<sup>T</sup> were summed feature 3 (iso-C<sub>15 : 0</sub> 2-OH and/or C<sub>16 : 1</sub>ω7<em>c</em>; 49.3 %), C<sub>16 : 1</sub>ω5<em>c</em> (23.8 %), iso-C<sub>17 : 0</sub> 3-OH (6.2 %) and iso-C<sub>15 : 0</sub> (5.4 %). A detailed overview of the cellular fatty acid profiles of all species of the genus <span class="named-content genus" id="named-content-34"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> can be found in <a id="xref-table-wrap-2-1" class="xref-table" href="#T2">Table 2</a>. Differences between the fatty acid profile of EX36<sup>T</sup> and other species of the genus <span class="named-content genus" id="named-content-35"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> were found in the amounts of iso-C<sub>15 : 0</sub>, C<sub>16 : 1</sub>ω5<em>c</em> and summed feature 3. In contrast to <span class="named-content species" id="named-content-36"><a class="namesforlife" rel="namesforlife-name" title="S. linguale"
+                        href="doi:10.1601/nm.8318"><em>S. linguale</em></a></span> DSM 74<sup>T</sup>, the fatty acids C<sub>15 : 0</sub> and anteiso-C<sub>15 : 0</sub> were not detected.
+               </p>
+               <div id="T2" class="table pos-float">
+                  <div class="table-inline">
+                     <div class="callout"><span>View this table:</span><ul class="callout-links">
+                           <li><a href="4586/T2.expansion.html">In this window</a></li>
+                           <li><a class="in-nw" href="4586/T2.expansion.html">In a new window</a></li>
+                        </ul>
+                     </div>
+                  </div>
+                  <div class="table-caption"><span class="table-label">Table 2. </span> 
+                     <span class="caption-title">Fatty acid profiles (%) of strain EX36<sup>T</sup> and its closest phylogenetic neighbours from the genus <span class="named-content genus" id="named-content-37"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                              href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span></span>
+                     
+                     <p id="p-14" class="first-child">Strains: 1, EX36<sup>T</sup> (data from this study); 2, <span class="named-content species" id="named-content-38"><a class="namesforlife" rel="namesforlife-name" title="S. linguale"
+                              href="doi:10.1601/nm.8318"><em>S. linguale</em></a></span> DSM 74<sup>T</sup> (data from this study); 3, <span class="named-content species" id="named-content-39"><a class="namesforlife" rel="namesforlife-name" title="S. luteum"
+                              href="doi:10.1601/nm.14215"><em>S. luteum</em></a></span> DSM 19990<sup>T</sup> (<a id="xref-ref-6-4" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>); 4, <span class="named-content species" id="named-content-40"><a class="namesforlife" rel="namesforlife-name" title="S. spitsbergense"
+                              href="doi:10.1601/nm.14214"><em>S. spitsbergense</em></a></span> DSM 19989<sup>T</sup> (<a id="xref-ref-6-5" class="xref-bibr" href="#ref-6">Finster <em>et al.</em>, 2009</a>); 5, <span class="named-content species" id="named-content-41"><a class="namesforlife" rel="namesforlife-name" title="S. rigui"
+                              href="doi:10.1601/nm.11571"><em>S. rigui</em></a></span> KCTC 12531<sup>T</sup> (<a id="xref-ref-1-3" class="xref-bibr" href="#ref-1">Baik <em>et al.</em>, 2007</a>); 6, <span class="named-content species" id="named-content-42"><a class="namesforlife" rel="namesforlife-name" title="S. panaciterrae"
+                              href="doi:10.1601/nm.13622"><em>S. panaciterrae</em></a></span> DSM 21099<sup>T</sup> (<a id="xref-ref-21-3" class="xref-bibr" href="#ref-21">Ten <em>et al.</em>, 2009</a>). <span class="sc">tr</span>, Trace amount (&lt;1 %); −, not detected.
+                     </p>
+                     
+                     <div class="sb-div caption-clear"></div>
+                  </div>
+               </div>
+               <p id="p-16">The predominant menaquinone, in accordance with all other species of the genus <span class="named-content genus" id="named-content-43"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span>, was MK-7. As polar lipids, phosphatidylethanolamine, two aminophospholipids, two aminolipids, a glycolipid and three unknown
+                  lipids were detected on the TLC plate. The DNA G+C content of strain EX36<sup>T</sup> was 47.2 mol%, which is lower than reported values for all other species of the genus <span class="named-content genus" id="named-content-44"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> with validly published names.
+               </p>
+               <p id="p-17">The analysis of DNA−DNA similarity of strain EX36<sup>T</sup> with its nearest phylogenetic neighbour <span class="named-content species" id="named-content-45"><a class="namesforlife" rel="namesforlife-name" title="S. linguale"
+                        href="doi:10.1601/nm.8318"><em>S. linguale</em></a></span> DSM 74<sup>T</sup> was also carried out by the Identification Service of the DSMZ. The experiment was performed in duplicate. DNA−DNA hybridization
+                  showed a DNA−DNA similarity of 12.2 % (second measurement: 17.2 %), demonstrating that these two strains do not represent
+                  the same species.
+               </p>
+               <p id="p-18">The present data regarding 16S rRNA gene sequence analysis, physiological, chemotaxonomic and morphological properties indicate
+                  that strain EX36<sup>T</sup> represents a distinct species in the genus <span class="named-content genus" id="named-content-46"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span>, for which the name <span class="named-content genus" id="named-content-47"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                        href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> <em>endophyticum</em> sp. nov. is proposed.
+               </p>
+               <div class="section" id="sec-1">
+                  <div class="section-nav"><a href="#fn-group-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ack-1" title="Acknowledgements" class="next-section-link"><span>Next Section</span></a></div>
+                  
+                  
+                  <div id="sec-2" class="subsection">
+                     
+                     <h3>Description of <span class="named-content genus" id="named-content-48"><a class="namesforlife" rel="namesforlife-name" title="Spirosoma"
+                              href="doi:10.1601/nm.8317"><em>Spirosoma</em></a></span> <em>endophyticum</em> sp. nov.
+                     </h3>
+                     
+                     <p id="p-19"><em>Spirosoma endophyticum</em> (en.do.phy′ti.cum. Gr. Pref. <em>endo</em> within; Gr. n. <em>phyton</em> plant; L. neut. suff. ‐<em>icum</em> adjectival suffix used with the sense of belonging to; N.L. neut. adj. <em>endophyticum</em> within plant, referring to the endophytic nature of the strain and its isolation from plant tissue).
+                     </p>
+                     
+                     <p id="p-20">Cells are rod-shaped, Gram-reaction-negative, non-spore-forming, with a size of 1.2×2–17.5 µm. A yellow pigment which is not
+                        of the flexirubin type is produced. Filaments up to 55 µm may be formed. Colonies on 10 % TSA are opaque, semi-translucent
+                        with a smooth and shiny surface and a circular, convex shape. Aerobic growth occurs at 20–28 °C (optimum at 28 °C), pH 5–8
+                        (optimum at pH 7); tolerates concentrations up to 0.6 % NaCl (w/v) in the medium, whereas best growth was achieved in absence
+                        of NaCl. Positive for catalase and oxidase activity. Nitrate is not reduced and indole is not produced. Negative for glucose
+                        fermentation, hydrolysis of arginine and gelatin, and urease activities and positive for aesculin hydrolysis. Does not utilize
+                        the following substrates: arabinose, mannitol, <em>N</em>-acetylglucosamine, gluconate, caprate, adipate, malate, citrate, phenylacetate, β-methyl <span class="sc">d</span>-glucoside, <span class="sc">d</span>-salicin, <span class="sc">n</span>-acetyl-β-<span class="sc">d</span>-mannosamine, <span class="sc">n</span>-acetyl neuraminic acid, <span class="sc">d</span>-galactose, <span class="sc">d</span>-fucose, <span class="sc">l</span>-fucose, <span class="sc">l</span>-rhamnose, inosine, <span class="sc">d</span>-arabitol, <em>myo</em>-inositol, <span class="sc">d</span>-aspartic acid, <span class="sc">d</span>-serine, glycyl-<span class="sc">l</span>-proline, <span class="sc">l</span>-alanine, <span class="sc">l</span>-arginine, <span class="sc">l</span>-aspartic acid, <span class="sc">l</span>-glutamic acid, <span class="sc">l</span>-serine and pectin. The following substrates are weakly utilized: dextrin, maltose, trehalose, cellobiose, gentiobiose, sucrose,
+                        turanose, stachyose, α-lactose, melibiose, α-<span class="sc">d</span>-glucose, <span class="sc">d</span>-mannose, <span class="sc">d</span>-fructose, <span class="sc">d</span>-mannitol and <span class="sc">l</span>-histidine. <span class="sc">d</span>-Raffinose and <em>N</em>-acetyl-<span class="sc">d</span>-glucosamine are utilized. Susceptible to the following antibiotics (µg per disc): streptomycin (10), kanamycin (30), chloramphenicol
+                        (60) and rifampicin (15) and resistant to ampicillin (10), polymyxin B (20), tetracycline (15) and erythromycin (15). The
+                        major fatty acids are summed feature 3 (iso-C<sub>15 : 0</sub> 2-OH and/or C<sub>16 : 1</sub>ω7<em>c</em>), C<sub>16 : 1</sub>ω5<em>c</em>, iso-C<sub>17 : 0</sub> 3-OH and iso-C<sub>15 : 0</sub>; the complete fatty acid profile can be found in <a id="xref-table-wrap-2-2" class="xref-table" href="#T2">Table 2</a>. The predominant menaquinone is MK-7. The major polar lipid is phosphatidylethanolamine.
+                     </p>
+                     
+                     <p id="p-21">The type strain, EX36<sup>T</sup> ( = DSM 26130<sup>T</sup> = LMG 27272<sup>T</sup>), was isolated from Zn/Cd-accumulating <em>Salix caprea</em> in Arnoldstein, Austria. The DNA G+C content of the type strain is 47.2 mol%.
+                     </p>
+                     
+                  </div>
+               </div>
+               <div class="section ack" id="ack-1">
+                  <div class="section-nav"><a href="#sec-1" title="Previous Section" class="prev-section-link"><span>Previous Section</span></a><a href="#ref-list-1" title="References" class="next-section-link"><span>Next Section</span></a></div>
+                  <h2>Acknowledgements</h2>
+                  
+                  <p id="p-22">We thank Marlies Polt for technical support and Katharina Fallmann, Friederike Trognitz and Muhammad Naveed for helpful discussions.
+                     This study was supported by the Austrian Science Foundation [Förderung der wissenschaftlichen Forschung (FWF) grant no. L561-B17].
+                  </p>
+                  
+               </div>
+               <div class="section ref-list" id="ref-list-1">
+                  <div class="section-nav"><a href="#ack-1" title="Acknowledgements" class="prev-section-link"><span>Previous Section</span></a><div class="nav-placeholder"> </div>
+                  </div>
+                  <h2>References</h2>
+                  <ol class="cit-list ref-use-labels">
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-1-1" title="View reference  in text"
+                           id="ref-1">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.1"
+                             data-doi="10.1099/ijs.0.65302-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Baik</span>,  <span class="cit-name-given-names">K. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">M. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Park</span>,  <span class="cit-name-given-names">S. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">D. W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">S. D.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ka</span>,  <span class="cit-name-given-names">J.-O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Choi</span>,  <span class="cit-name-given-names">S. K.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Seong</span>,  <span class="cit-name-given-names">C. N.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title"><em>Spirosoma rigui</em> sp. nov., isolated from fresh water</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">57</span>, <span class="cit-fpage">2870</span>–<span class="cit-lpage">2873</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.65302-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18048741</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=57/12/2870"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-2-1" title="View reference  in text"
+                           id="ref-2">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.2"
+                             data-doi="10.1099/ijs.0.02136-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bernardet</span>,  <span class="cit-name-given-names">J.-F.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Nakagawa</span>,  <span class="cit-name-given-names">Y.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Holmes</span>,  <span class="cit-name-given-names">B.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth cit-collab">Subcommittee on the taxonomy of Flavobacterium and Cytophaga-like bacteria of the International Committee on Systematics of
+                                       Prokaryotes</span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2002</span><strong>).</strong> <span class="cit-article-title">Proposed minimal standards for describing new taxa of the family <em>Flavobacteriaceae</em> and emended description of the family</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">52</span>, <span class="cit-fpage">1049</span>–<span class="cit-lpage">1070</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.02136-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>12054224</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=52/3/1049"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-3-1" title="View reference  in text"
+                           id="ref-3">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.3">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Buck</span>,  <span class="cit-name-given-names">J. D.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1982</span><strong>).</strong> <span class="cit-article-title">Nonstaining (KOH) method for determination of Gram reactions of marine bacteria</span>. <abbr class="cit-jnl-abbrev">Appl Environ Microbiol</abbr> <span class="cit-vol">44</span>, <span class="cit-fpage">992</span>–<span class="cit-lpage">993</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>6184019</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=aem&amp;resid=44/4/992"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-4-1" title="View reference  in text"
+                           id="ref-4">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.4"
+                             data-doi="10.1099/00207713-51-3-827">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Denner</span>,  <span class="cit-name-given-names">E. B. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Paukner</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kämpfer</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Moore</span>,  <span class="cit-name-given-names">E. R. B.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Abraham</span>,  <span class="cit-name-given-names">W. R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Busse</span>,  <span class="cit-name-given-names">H.-J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wanner</span>,  <span class="cit-name-given-names">G.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lübitz</span>,  <span class="cit-name-given-names">W.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2001</span><strong>).</strong> <span class="cit-article-title"><em>Sphingomonas pituitosa</em> sp. nov., an exopolysaccharide-producing bacterium that secretes an unusual type of sphingan</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">51</span>, <span class="cit-fpage">827</span>–<span class="cit-lpage">841</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/00207713-51-3-827</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>11411704</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=51/3/827"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-5-1" title="View reference  in text"
+                           id="ref-5">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.5"
+                             data-doi="10.1093/nar/17.19.7843">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Edwards</span>,  <span class="cit-name-given-names">U.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rogall</span>,  <span class="cit-name-given-names">T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Blöcker</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Emde</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Böttger</span>,  <span class="cit-name-given-names">E. C.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1989</span><strong>).</strong> <span class="cit-article-title">Isolation and direct complete nucleotide determination of entire genes. Characterization of a gene coding for 16S ribosomal
+                                    RNA</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">17</span>, <span class="cit-fpage">7843</span>–<span class="cit-lpage">7853</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/17.19.7843</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>2798131</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=17/19/7843"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-6-1" title="View reference  in text"
+                           id="ref-6">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.6"
+                             data-doi="10.1099/ijs.0.002725-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Finster</span>,  <span class="cit-name-given-names">K. W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Herbert</span>,  <span class="cit-name-given-names">R. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lomstein</span>,  <span class="cit-name-given-names">B. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title"><em>Spirosoma spitsbergense</em> sp. nov. and <em>Spirosoma luteum</em> sp. nov., isolated from a high Arctic permafrost soil, and emended description of the genus <em>Spirosoma</em></span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">59</span>, <span class="cit-fpage">839</span>–<span class="cit-lpage">844</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.002725-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19329617</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=59/4/839"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-7-1" title="View reference  in text"
+                           id="ref-7">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.7"
+                             data-doi="10.1046/j.1462-2920.2002.00362.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hall</span>,  <span class="cit-name-given-names">T. A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1999</span><strong>).</strong> <span class="cit-article-title">BioEdit: a user-friendly biological sequence alignment editor and analysis program for Windows 95/98/NT</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Symp Ser</abbr> <span class="cit-vol">41</span>, <span class="cit-fpage">95</span>–<span class="cit-lpage">98</span>.</cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1046/j.1462-2920.2002.00362.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=12460286&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=BioEdit%3A%20a%20user-friendly%20biological%20sequence%20alignment%20editor%20and%20analysis%20program%20for%20Windows%2095%2F98%2FNT&amp;author=T.%20A.%20Hall&amp;publication_year=1999&amp;journal=Nucleic%20Acids%20Symp%20Ser&amp;volume=41&amp;pages=95-98">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-8-1" title="View reference  in text"
+                           id="ref-8">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.8"
+                             data-doi="10.1099/ijs.0.038075-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">O. S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Cho</span>,  <span class="cit-name-given-names">Y. J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yoon</span>,  <span class="cit-name-given-names">S. H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kim</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Na</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Park</span>,  <span class="cit-name-given-names">S. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jeon</span>,  <span class="cit-name-given-names">Y. S.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">J. H.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">Introducing EzTaxon-e: a prokaryotic 16S rRNA gene sequence database with phylotypes that represent uncultured species</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">62</span>, <span class="cit-fpage">716</span>–<span class="cit-lpage">721</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.038075-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>22140171</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=62/Pt_3/716"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-9-1" title="View reference  in text"
+                           id="ref-9">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.9"
+                             data-doi="10.1007/s11104-007-9517-9">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuffner</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Puschenreiter</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wieshammer</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gorfer</span>,  <span class="cit-name-given-names">M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sessitsch</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">Rhizosphere bacteria affect growth and metal uptake of heavy metal accumulating willows</span>. <abbr class="cit-jnl-abbrev">Plant Soil</abbr> <span class="cit-vol">304</span>, <span class="cit-fpage">35</span>–<span class="cit-lpage">44</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s11104-007-9517-9</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s11104-007-9517-9&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Rhizosphere%20bacteria%20affect%20growth%20and%20metal%20uptake%20of%20heavy%20metal%20accumulating%20willows&amp;author=M.%20Kuffner&amp;author=M.%20Puschenreiter&amp;author=G.%20Wieshammer&amp;author=M.%20Gorfer&amp;author=A.%20Sessitsch&amp;publication_year=2008&amp;journal=Plant%20Soil&amp;volume=304&amp;pages=35-44&amp;doi=10.1007%2Fs11104-007-9517-9">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-10-1" title="View reference  in text"
+                           id="ref-10">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.10"
+                             data-doi="10.1111/j.1365-2672.2010.04670.x">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Kuffner</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">De Maria</span>,  <span class="cit-name-given-names">S.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Puschenreiter</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fallmann</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Wieshammer</span>,  <span class="cit-name-given-names">G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Gorfer</span>,  <span class="cit-name-given-names">M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Strauss</span>,  <span class="cit-name-given-names">J.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rivelli</span>,  <span class="cit-name-given-names">A. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Sessitsch</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2010</span><strong>).</strong> <span class="cit-article-title">Culturable bacteria from Zn- and Cd-accumulating <em>Salix caprea</em> with differential effects on plant growth and heavy metal availability</span>. <abbr class="cit-jnl-abbrev">J Appl Microbiol</abbr> <span class="cit-vol">108</span>, <span class="cit-fpage">1471</span>–<span class="cit-lpage">1484</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1111/j.1365-2672.2010.04670.x</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>20132372</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1111/j.1365-2672.2010.04670.x&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=20132372&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Culturable%20bacteria%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea%20with%20differential%20effects%20on%20plant%20growth%20and%20heavy%20metal%20availability&amp;author=M.%20Kuffner&amp;author=S.%20De%20Maria&amp;author=M.%20Puschenreiter&amp;author=K.%20Fallmann&amp;author=G.%20Wieshammer&amp;author=M.%20Gorfer&amp;author=J.%20Strauss&amp;author=A.%20R.%20Rivelli&amp;author=A.%20Sessitsch&amp;publication_year=2010&amp;journal=J%20Appl%20Microbiol&amp;volume=108&amp;pages=1471-1484&amp;doi=10.1111%2Fj.1365-2672.2010.04670.x&amp;pmid=20132372">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-11-1" title="View reference  in text"
+                           id="ref-11">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_12.4586.11">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Larkin</span>,  <span class="cit-name-given-names">J. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Borrall</span>,  <span class="cit-name-given-names">R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1984</span><strong>).</strong> <span class="cit-article-title">Family I. <em>Spirosomaceae</em> Larkin and Borrall 1978, 595<sup>AL</sup></span>. In <span class="cit-source">Bergey’s Manual of Systematic Bacteriology</span>, <span class="cit-vol">vol. 1</span>, pp. <span class="cit-fpage">125</span>–<span class="cit-lpage">126</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Holt</span>,  <span class="cit-name-given-names">J. G.</span></span>
+                                 . <span class="cit-publ-loc">Baltimore</span>: <span class="cit-publ-name">Williams &amp; Wilkins</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Family%20I.%20Spirosomaceae%20Larkin%20and%20Borrall%201978%2C%20595AL&amp;author=J.%20M.%20Larkin&amp;author=R.%20Borrall&amp;publication_year=1984&amp;citation_inbook_title=Bergey%E2%80%99s%20Manual%20of%20Systematic%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-12-1" title="View reference  in text"
+                           id="ref-12">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.12"
+                             data-doi="10.1093/nar/gkh293">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ludwig</span>,  <span class="cit-name-given-names">W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Strunk</span>,  <span class="cit-name-given-names">O.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Westram</span>,  <span class="cit-name-given-names">R.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Richter</span>,  <span class="cit-name-given-names">L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Meier</span>,  <span class="cit-name-given-names">H.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yadhukumar</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Buchner</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lai</span>,  <span class="cit-name-given-names">T.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Steppi</span>,  <span class="cit-name-given-names">S.</span></span></li>
+                              </ol><cite> <strong>&amp; other authors (</strong><span class="cit-pub-date">2004</span><strong>).</strong> <span class="cit-article-title"><span class="sc">arb</span>: a software environment for sequence data</span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">32</span>, <span class="cit-fpage">1363</span>–<span class="cit-lpage">1371</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkh293</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>14985472</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=32/4/1363"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-13-1" title="View reference  in text"
+                           id="ref-13">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.13"
+                             data-doi="10.1093/bioinformatics/4.1.11">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Myers</span>,  <span class="cit-name-given-names">E. W.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Miller</span>,  <span class="cit-name-given-names">W.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1988</span><strong>).</strong> <span class="cit-article-title">Optimal alignments in linear space</span>. <abbr class="cit-jnl-abbrev">Comput Appl Biosci</abbr> <span class="cit-vol">4</span>, <span class="cit-fpage">11</span>–<span class="cit-lpage">17</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>3382986</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=bioinfo&amp;resid=4/1/11"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-14-1" title="View reference  in text"
+                           id="ref-14">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.14">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Neidhardt</span>,  <span class="cit-name-given-names">F. C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Bloch</span>,  <span class="cit-name-given-names">P. L.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smith</span>,  <span class="cit-name-given-names">D. F.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1974</span><strong>).</strong> <span class="cit-article-title">Culture medium for enterobacteria</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">119</span>, <span class="cit-fpage">736</span>–<span class="cit-lpage">747</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>4604283</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=119/3/736"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-15-1" title="View reference  in text"
+                           id="ref-15">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.15"
+                             data-doi="10.1093/nar/gkm864">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pruesse</span>,  <span class="cit-name-given-names">E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Quast</span>,  <span class="cit-name-given-names">C.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Knittel</span>,  <span class="cit-name-given-names">K.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Fuchs</span>,  <span class="cit-name-given-names">B. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ludwig</span>,  <span class="cit-name-given-names">W.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Peplies</span>,  <span class="cit-name-given-names">J.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Glöckner</span>,  <span class="cit-name-given-names">F. O.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2007</span><strong>).</strong> <span class="cit-article-title"><span class="sc">silva</span>: a comprehensive online resource for quality checked and aligned ribosomal RNA sequence data compatible with <span class="sc">arb</span></span>. <abbr class="cit-jnl-abbrev">Nucleic Acids Res</abbr> <span class="cit-vol">35</span>, <span class="cit-fpage">7188</span>–<span class="cit-lpage">7196</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/nar/gkm864</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>17947321</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=nar&amp;resid=35/21/7188"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-16-1" title="View reference  in text"
+                           id="ref-16">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.16"
+                             data-doi="10.1007/s13127-011-0056-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Silvestro</span>,  <span class="cit-name-given-names">D.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Michalak</span>,  <span class="cit-name-given-names">I.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2012</span><strong>).</strong> <span class="cit-article-title">raxmlGUI: A graphical front-end for RAxML</span>. <abbr class="cit-jnl-abbrev">Org Divers Evol</abbr> <span class="cit-vol">12</span>, <span class="cit-fpage">335</span>–<span class="cit-lpage">337</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/s13127-011-0056-0</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/s13127-011-0056-0&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=raxmlGUI%3A%20A%20graphical%20front-end%20for%20RAxML&amp;author=D.%20Silvestro&amp;author=I.%20Michalak&amp;publication_year=2012&amp;journal=Org%20Divers%20Evol&amp;volume=12&amp;pages=335-337&amp;doi=10.1007%2Fs13127-011-0056-0">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-17-1" title="View reference  in text"
+                           id="ref-17">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_12.4586.17">
+                           <div class="cit-metadata">
+                              <ol class="duplicate">
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Gerhardt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">W. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span></li>
+                              </ol>
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Smibert</span>,  <span class="cit-name-given-names">R. M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Phenotypic characterization</span>. In <span class="cit-source">Methods for General and Molecular Bacteriology</span>, pp. <span class="cit-fpage">607</span>–<span class="cit-lpage">654</span>. Edited by 
+                                 <span class="cit-ed"><span class="cit-name-surname">Gerhardt</span>,  <span class="cit-name-given-names">P.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Murray</span>,  <span class="cit-name-given-names">R. G. E.</span></span>, 
+                                 <span class="cit-ed"><span class="cit-name-surname">Wood</span>,  <span class="cit-name-given-names">W. A.</span></span> &amp; 
+                                 <span class="cit-ed"><span class="cit-name-surname">Krieg</span>,  <span class="cit-name-given-names">N. R.</span></span>
+                                 . <span class="cit-publ-loc">Washington, DC</span>: <span class="cit-publ-name">American Society for Microbiology</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phenotypic%20characterization&amp;author=R.%20M.%20Smibert&amp;author=N.%20R.%20Krieg&amp;publication_year=1994&amp;citation_inbook_title=Methods%20for%20General%20and%20Molecular%20Bacteriology">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-18-1" title="View reference  in text"
+                           id="ref-18">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.18"
+                             data-doi="10.1093/bioinformatics/btl446">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006a</span><strong>).</strong> <span class="cit-article-title">RAxML-VI-HPC: maximum likelihood-based phylogenetic analyses with thousands of taxa and mixed models</span>. <abbr class="cit-jnl-abbrev">Bioinformatics</abbr> <span class="cit-vol">22</span>, <span class="cit-fpage">2688</span>–<span class="cit-lpage">2690</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1093/bioinformatics/btl446</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>16928733</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=bioinfo&amp;resid=22/21/2688"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-19-1" title="View reference  in text"
+                           id="ref-19">↵</a><div class="cit ref-cit ref-book" id="cit-63.Pt_12.4586.19">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2006b</span><strong>).</strong> <span class="cit-article-title">Phylogenetic models of rate heterogeneity: a high performance computing perspective</span>. In: <span class="cit-source">Proc. of IPDPS2006</span>, pp. <span class="cit-fpage">253</span>. <span class="cit-publ-name">IEEE Computer Society</span>. <span class="cit-publ-loc">Washington, DC</span>.</cite></div>
+                           <div class="cit-extra"><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Phylogenetic%20models%20of%20rate%20heterogeneity%3A%20a%20high%20performance%20computing%20perspective&amp;author=A.%20Stamatakis&amp;publication_year=2006b&amp;citation_inbook_title=Proc.%20of%20IPDPS2006">Google Scholar</a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-20-1" title="View reference  in text"
+                           id="ref-20">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.20"
+                             data-doi="10.1080/10635150802429642">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Stamatakis</span>,  <span class="cit-name-given-names">A.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Hoover</span>,  <span class="cit-name-given-names">P.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Rougemont</span>,  <span class="cit-name-given-names">J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2008</span><strong>).</strong> <span class="cit-article-title">A rapid bootstrap algorithm for the RAxML Web servers</span>. <abbr class="cit-jnl-abbrev">Syst Biol</abbr> <span class="cit-vol">57</span>, <span class="cit-fpage">758</span>–<span class="cit-lpage">771</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1080/10635150802429642</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>18853362</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=sysbio&amp;resid=57/5/758"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-21-1" title="View reference  in text"
+                           id="ref-21">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.21"
+                             data-doi="10.1099/ijs.0.002436-0">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Ten</span>,  <span class="cit-name-given-names">L. N.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Xu</span>,  <span class="cit-name-given-names">J.-L.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Jin</span>,  <span class="cit-name-given-names">F.-X.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Im</span>,  <span class="cit-name-given-names">W.-T.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Oh</span>,  <span class="cit-name-given-names">H.-M.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lee</span>,  <span class="cit-name-given-names">S.-T.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">2009</span><strong>).</strong> <span class="cit-article-title"><em>Spirosoma panaciterrae</em> sp. nov., isolated from soil</span>. <abbr class="cit-jnl-abbrev">Int J Syst Evol Microbiol</abbr> <span class="cit-vol">59</span>, <span class="cit-fpage">331</span>–<span class="cit-lpage">335</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1099/ijs.0.002436-0</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>19196773</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=ijs&amp;resid=59/2/331"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-22-1" title="View reference  in text"
+                           id="ref-22">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.22">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Weisburg</span>,  <span class="cit-name-given-names">W. G.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Barns</span>,  <span class="cit-name-given-names">S. M.</span></span>, 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Pelletier</span>,  <span class="cit-name-given-names">D. A.</span></span> &amp; 
+                                 </li>
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Lane</span>,  <span class="cit-name-given-names">D. J.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1991</span><strong>).</strong> <span class="cit-article-title">16S ribosomal DNA amplification for phylogenetic study</span>. <abbr class="cit-jnl-abbrev">J Bacteriol</abbr> <span class="cit-vol">173</span>, <span class="cit-fpage">697</span>–<span class="cit-lpage">703</span>.<span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>1987160</span></cite></div>
+                           <div class="cit-extra"><a href="/cgi/ijlink?linkType=ABST&amp;journalCode=jb&amp;resid=173/2/697"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-ijlinks"><span class="cit-reflinks-abstract">Abstract</span><span class="cit-sep cit-reflinks-variant-name-sep">/</span><span class="cit-reflinks-full-text"><span class="free-full-text">FREE </span>Full Text</span></a></div>
+                        </div>
+                     </li>
+                     <li><span class="ref-label ref-label-empty"></span><a class="rev-xref-ref" href="#xref-ref-23-1" title="View reference  in text"
+                           id="ref-23">↵</a><div class="cit ref-cit ref-journal" id="cit-63.Pt_12.4586.23"
+                             data-doi="10.1007/BF00160154">
+                           <div class="cit-metadata">
+                              <ol class="cit-auth-list">
+                                 <li><span class="cit-auth"><span class="cit-name-surname">Yang</span>,  <span class="cit-name-given-names">Z. H.</span></span></li>
+                              </ol><cite> <strong>(</strong><span class="cit-pub-date">1994</span><strong>).</strong> <span class="cit-article-title">Maximum likelihood phylogenetic estimation from DNA sequences with variable rates over sites: approximate methods</span>. <abbr class="cit-jnl-abbrev">J Mol Evol</abbr> <span class="cit-vol">39</span>, <span class="cit-fpage">306</span>–<span class="cit-lpage">314</span>.<span class="cit-pub-id-sep cit-pub-id-doi-sep"> </span><span class="cit-pub-id cit-pub-id-doi"><span class="cit-pub-id-scheme-doi">doi:</span>10.1007/BF00160154</span><span class="cit-pub-id cit-pub-id-pmid"><span class="cit-pub-id-scheme-pmid">pmid:</span>7932792</span></cite></div>
+                           <div class="cit-extra"><a href="/external-ref?access_num=10.1007/BF00160154&amp;link_type=DOI"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-webofscience">CrossRef</a><a href="/external-ref?access_num=7932792&amp;link_type=MED"
+                                 class="cit-ref-sprinkles cit-ref-sprinkles-medline">Medline</a><a target="_blank"
+                                 href="http://scholar.google.com/scholar_lookup?title=Maximum%20likelihood%20phylogenetic%20estimation%20from%20DNA%20sequences%20with%20variable%20rates%20over%20sites%3A%20approximate%20methods&amp;author=Z.%20H.%20Yang&amp;publication_year=1994&amp;journal=J%20Mol%20Evol&amp;volume=39&amp;pages=306-314&amp;doi=10.1007%2FBF00160154&amp;pmid=7932792">Google Scholar</a></div>
+                        </div>
+                     </li>
+                  </ol>
+               </div><span class="highwire-journal-article-marker-end"></span></div>
+            <div class="social-bookmarking">
+               
+               <ul class="social-bookmark-links">
+                  <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                             alt="Add to CiteULike"
+                             title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                             alt="Add to Delicious"
+                             title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                             title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=FACEBOOK"
+                        class="sb-facebook"
+                        rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                             title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                             title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                             title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                             title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                             title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                  <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                             title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+               </ul>
+               
+               <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+               
+            </div><span id="related-urls"></span></div>
+         <div id="col-2">
+            
+            <div class="article-nav sidebar-nav">
+               <a href="/content/63/Pt_12/4580.short" title="Previous article" class="previous">« Previous</a><span class="article-nav-sep"> | </span><a href="/content/63/Pt_12/4591.short" title="Next article" class="next">Next Article »</a>
+               
+               <span class="toc-link">
+                  				<a href="/content/63/Pt_12.toc" title="Table of Contents">Table of Contents</a>
+                  			</span>
+               
+               
+            </div>
+            <div class="open-access-note">
+               <span class="open-access-note">OPEN ACCESS ARTICLE</span>
+               
+            </div>
+            <div class="content-box" id="article-cb-main">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Article</span></h3>
+                  <div class="cb-section cb-slug">
+                     <ol>
+                        <li>
+                           <div id="slugline">
+                              
+                              
+                              	    <span class="slug-metadata-note ahead-of-print">
+                                 	
+                                 Published online ahead of print
+                                 
+                                 <span class="slug-ahead-of-print-date">August 1, 2013</span>,
+                                 doi:
+                                 <span title="10.1099/ijs.0.052654-0" class="slug-doi">10.1099/ijs.0.052654-0
+                                    </span>
+                                 </span>
+                              
+                              <cite>
+                                 	    <abbr title="International Journal of Systematic and Evolutionary Microbiology"
+                                       class="slug-jnl-abbrev">
+                                    IJSEM</abbr><span class="slug-pub-date" itemprop="datePublished">
+                                    	    December 2013 
+                                    </span>
+                                 	    <span class="slug-vol">
+                                    vol. 63 
+                                    </span><span class="slug-issue">
+                                    no. Pt 12 
+                                    </span><span class="slug-pages">
+                                    4586-4590
+                                    </span>
+                                 </cite>
+                              
+                              	           
+                              
+                              
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section cb-views">
+                     <ol>
+                        <li><span class="oa-article">Free via Open Access: <span>OA</span></span></li>
+                        <li><span class="creative-commons-article">Free via Creative Commons: <span>CC</span></span></li>
+                        <li><span class="ccv cc-version-by/2.5/"></span></li>
+                        <li class="abstract-view-link primary"><span class="oa-view">OA </span><a href="/content/63/Pt_12/4586.abstract" rel="view-abstract">Abstract</a><span class="free">Free</span></li>
+                        <li class="notice full-text-view-link primary"><span class="variant-indicator">» <span>Full Text</span></span><span class="free">Free</span></li>
+                        <li class="notice full-text-pdf-view-link primary"><a href="/content/63/Pt_12/4586.full.pdf+html" rel="view-full-text.pdf">Full Text (PDF)</a><span class="free">Free</span></li>
+                        <li><a href="/content/63/Pt_12/4586/suppl/DC1" rel="supplemental-data"
+                              class="dslink-supplementary-material">Supplementary material</a></li>
+                        <li><a href="/powerpoint/63/Pt_12/4586">PPT Slides of All Figures</a></li>
+                        <li class="cb-versions">
+                           <div><span id="pap-all-versions-label">All Versions of this Article:</span><ol class="version-list">
+                                 <li><a href="/content/early/2013/08/01/ijs.0.052654-0">ijs.0.052654-0v1</a></li>
+                                 <li class="current-li"><span>63/Pt_12/4586</span> <span class="current-version">most recent</span></li>
+                              </ol>
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-cat">
+                     <h4 class="cb-section-header"><span>Classifications</span></h4>
+                     <ol>
+                        <li>
+                           <ul class="subject-headings">
+                              <li>New Taxa
+                                 <ul class="subject-sub-headings last-child">
+                                    <li><a class="tocsection-search"
+                                          href="/search?tocsectionid=Bacteroidetes&amp;sortspec=date&amp;submit=Submit">Bacteroidetes</a></li>
+                                 </ul>
+                              </li>
+                           </ul>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible" id="cb-art-svcs">
+                     <h4 class="cb-section-header"><span>Services</span></h4>
+                     <ol>
+                        <li class="mail-a-friend-link icon-link"><a href="/email?gca=ijs%3B63%2FPt_12%2F4586&amp;current-view-path=/content/63/Pt_12/4586.full">
+                              Email this article to a colleague</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=citedby&amp;addAlert=cited_by&amp;cited_by_criteria_resid=ijs%3B63%2FPt_12%2F4586&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_12/4586.full">Alert me when this article is cited</a></li>
+                        <li class="alert-link icon-link"><a href="/cgi/alerts/ctalert?alertType=correction&amp;addAlert=correction&amp;correction_criteria_value=63/Pt_12/4586&amp;saveAlert=no&amp;return-type=article&amp;return_url=http://ijs.sgmjournals.org/content/63/Pt_12/4586.full">Alert me if a correction is posted</a></li>
+                        <li class="similar-link"><a href="/search?qbe=ijs%3Bijs.0.052654-0&amp;citation=Fries%20et%20al.%2063%20%28Pt%2012%29:%204586&amp;submit=yes">Similar articles in this journal</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=ijs%3B63%2FPt_12%2F4586&amp;link_type=ISI_RELATEDRECORDS"
+                              id="cb-isi-similar-articles"
+                              class="similar-link">Similar articles in Web of Science</a></li>
+                        <li class="similar-link"><a href="/external-ref?access_num=23907231&amp;link_type=MED_NBRS"
+                              class="similar-link">Similar articles in PubMed</a></li>
+                        <li class="cit-man-link icon-link cite-link"><a href="/citmgr?gca=ijs%3B63%2FPt_12%2F4586">Download to citation manager</a></li>
+                        <li class="copyright-link icon-link"><a href="/external-ref?link_type=PERMISSIONDIRECT"><img src="/shared/img/content/permissions.gif" /></a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-cit">
+                     <h4 class="cb-section-header"><span>Citing Articles</span></h4>
+                     <ol>
+                        <li class="hw-citing-link"><a href="/content/63/Pt_12/4586.full?cited-by=yes&amp;legid=ijs;63/Pt_12/4586#cited-by"
+                              id="cb-hw-citing-articles">Load citing article information</a></li>
+                        <li><a href="/cgi/crossref-forward-links/63/Pt_12/4586" rel="external-nw"
+                              id="cb-crossref-citing-articles">Citing articles via CrossRef</a></li>
+                        <li><a href="/external-ref?access_num=%2Fijs%2F63%2FPt_12%2F4586&amp;link_type=ISI_CITING&amp;accnum_type=native"
+                              rel="external-nw"
+                              id="cb-isi-citing-articles">Citing articles via Web of Science</a></li>
+                        <li><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_12/4586.abstract&amp;link_type=GOOGLESCHOLAR">Citing articles via Google Scholar</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-gs">
+                     <h4 class="cb-section-header"><span>Google Scholar</span></h4>
+                     <ol>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3AFries%20author%3AJ.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Fries, J.</a></li>
+                        <li class="cb-art-gs-auth author-link"><a href="http://scholar.google.com/scholar?q=%22author%3ASessitsch%20author%3AA.%22"
+                              class="cb-art-gs-auth author-link">Articles by  Sessitsch, A.</a></li>
+                        <li class="cb-art-gs-rel similar-link"><a href="/external-ref?access_num=http://ijs.sgmjournals.org/content/63/Pt_12/4586.abstract&amp;link_type=GOOGLESCHOLARRELATED">Search for related content</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-pm">
+                     <h4 class="cb-section-header"><span>PubMed</span></h4>
+                     <ol>
+                        <li class="cb-art-pm-cite cite-link icon-link"><a href="/external-ref?access_num=23907231&amp;link_type=PUBMED"
+                              class="cb-art-pm-cite cite-link icon-link">PubMed citation</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Fries%20J&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Fries, J.</a></li>
+                        <li class="cb-art-pm-auth author-link"><a href="/external-ref?access_num=Sessitsch%20A&amp;link_type=AUTHORSEARCH"
+                              class="cb-art-pm-auth author-link">Articles by  Sessitsch, A.</a></li>
+                        <li>
+                           <div id="cb-entrez-links-placeholder"><a href="/entrez-links/23907231"></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed" id="cb-art-rel">
+                     <h4 class="cb-section-header"><span>Related Content</span></h4>
+                     <ol>
+                        <li><a href="/content/63/Pt_12/4586.full?related-urls=yes&amp;legid=ijs;63/Pt_12/4586#related-urls"
+                              id="cb-related-urls">Load related web page information</a></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section collapsible default-closed soc-links icon-link"
+                       id="cb-art-soc">
+                     <h4 class="cb-section-header"><span>Social Bookmarking</span></h4>
+                     <ol>
+                        <li>
+                           <div class="social-bookmarking">
+                              
+                              <ul class="social-bookmark-links">
+                                 <li class="social-bookmarking-item social-bookmarking-item-citeulike"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=CITEULIKE"><img src="/shared/img/common/social-bookmarking/citeulike.gif"
+                                            alt="Add to CiteULike"
+                                            title="CiteULike" /></a><span class="soc-bm-link-text">CiteULike</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-delicious"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=DEL_ICIO_US"><img src="/shared/img/common/social-bookmarking/delicious.gif"
+                                            alt="Add to Delicious"
+                                            title="Delicious" /></a><span class="soc-bm-link-text">Delicious</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-digg"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=DIGG"><img src="/shared/img/common/social-bookmarking/digg.gif" alt="Add to Digg"
+                                            title="Digg" /></a><span class="soc-bm-link-text">Digg</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-facebook"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=FACEBOOK"
+                                       class="sb-facebook"
+                                       rel="external-nw"><img src="/shared/img/common/social-bookmarking/facebook.gif" alt="Add to Facebook"
+                                            title="Facebook" /></a><span class="soc-bm-link-text">Facebook</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-googleplus"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=GOOGLEPLUS&amp;log_only=yes"><img src="/shared/img/common/social-bookmarking/googleplus.jpg" alt="Add to Google+"
+                                            title="Google+" /></a><span class="soc-bm-link-text">Google+</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-linkedin"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=LINKEDIN"><img src="/shared/img/common/social-bookmarking/linkedin.gif" alt="Add to LinkedIn"
+                                            title="LinkedIn" /></a><span class="soc-bm-link-text">LinkedIn</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-mendeley"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=MENDELEY"><img src="/shared/img/common/social-bookmarking/mendeley.gif" alt="Add to Mendeley"
+                                            title="Mendeley" /></a><span class="soc-bm-link-text">Mendeley</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-reddit"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=REDDIT"><img src="/shared/img/common/social-bookmarking/reddit.gif" alt="Add to Reddit"
+                                            title="Reddit" /></a><span class="soc-bm-link-text">Reddit</span></li>
+                                 <li class="social-bookmarking-item social-bookmarking-item-twitter"><a href="/external-ref?tag_url=http://ijs.sgmjournals.org/cgi/content/long/63/Pt_12/4586&amp;title=Spirosoma%20endophyticum%20sp.%20nov.%2C%20isolated%20from%20Zn-%20and%20Cd-accumulating%20Salix%20caprea+--+Fries%20et%20al.%2063%20%28Pt%2012%29%3A%204586+--+IJSEM&amp;doi=10.1099/ijs.0.052654-0&amp;link_type=TWITTER"><img src="/shared/img/common/social-bookmarking/twitter.gif" alt="Add to Twitter"
+                                            title="Twitter" /></a><span class="soc-bm-link-text">Twitter</span></li>
+                              </ul>
+                              
+                              <p class="social-bookmarking-help"><a href="/help/social_bookmarks.dtl">What's this?</a></p>
+                              
+                           </div>
+                        </li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+            
+            <div class="content-box" id="article-dyn-nav">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>Navigate This Article</span></h3>
+                  <div class="cb-section" id="cb-art-nav">
+                     <ol>
+                        <li><a href="#content-block">Top</a></li>
+                        <li><a href="#abstract-1">Abstract</a></li>
+                        <li><a href="#ack-1">Acknowledgements</a></li>
+                        <li><a href="#ref-list-1">References</a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            
+         </div>
+         <div id="col-3">
+            
+            <div class="content-box" id="sidebar-current-issue">
+               <div class="cb-contents">
+                  <h3 class="cb-contents-header"><span>This Month's Issue</span></h3>
+                  <div class="cb-section">
+                     <ol>
+                        <li><span><a href="/content/current" rel="current-issue">April 2015, 65 (Pt 4)</a></span></li>
+                     </ol>
+                  </div>
+                  <div class="cb-section">
+                     <ol>
+                        <li>
+                           <div class="current-issue"><a href="/content/current" rel="current-issue"><img src="/content/65/Pt_4.cover.gif" width="67" height="89" alt="Current Issue" /></a></div>
+                        </li>
+                     </ol>
+                  </div>
+                  <div class="cb-section sidebar-etoc-link">
+                     <ol>
+                        <li><a href="/cgi/alerts/etoc">Alert me to new issues of IJSEM
+                              </a></li>
+                     </ol>
+                  </div>
+               </div>
+            </div>
+            <div id="sidebar-global-nav">
+               
+               		
+               <ul class="button-list pub-links">
+                  <li class="first"><a href="/site/misc/about.xhtml" title="ABOUT IJSEM"><span>ABOUT IJSEM</span></a></li>
+                  <li><a href="/site/misc/edboard.xhtml" title="EDITORIAL BOARD &amp; STAFF"><span>EDITORIAL BOARD &amp; STAFF</span></a></li>
+                  <li><a href="http://www.editorialmanager.com/ijs/" title="SUBMIT A MANUSCRIPT"><span>SUBMIT A MANUSCRIPT</span></a></li>
+                  <li><a href="/site/misc/ifora.xhtml" title="INFORMATION FOR AUTHORS"><span>INFORMATION FOR AUTHORS</span></a></li>
+                  <li><a href="/site/misc/iforr.xhtml" title="INFORMATION FOR REVIEWERS"><span>INFORMATION FOR REVIEWERS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/site/librarians/index.xhtml"
+                        title="INFORMATION FOR LIBRARIANS"><span>INFORMATION FOR LIBRARIANS</span></a></li>
+                  <li><a href="/site/misc/reprints.xhtml" title="PERMISSIONS AND REPRINTS"><span>PERMISSIONS AND REPRINTS</span></a></li>
+                  <li><a href="http://www.sgmjournals.org/subscriptions" title="SUBSCRIPTIONS"><span>SUBSCRIPTIONS</span></a></li>
+                  <li><a href="/site/misc/addir.xhtml" title="ADVERTISING"><span>ADVERTISING</span></a></li>
+                  <li class="rss-img-button"><a href="/site/misc/alerts_feeds.xhtml" title="ALERTS &amp; FEEDS"><span>ALERTS &amp; FEEDS</span></a></li>
+                  <li class="last"><a href="/feedback" title="FEEDBACK"><span>FEEDBACK</span></a></li>
+               </ul>
+               		
+               <ul class="button-list pub-links umbrella-links">
+                  <li class="first"><a href="http://mic.sgmjournals.org" title="MICROBIOLOGY"><span>MICROBIOLOGY</span></a></li>
+                  <li><a href="http://vir.sgmjournals.org" title="J GEN VIROL"><span>J GEN VIROL</span></a></li>
+                  <li><a href="http://jmm.sgmjournals.org" title="J MED MICROBIOL"><span>J MED MICROBIOL</span></a></li>
+                  <li><a href="http://jmmcr.sgmjournals.org" title="JMM CASE REPORTS"><span>JMM CASE REPORTS</span></a></li>
+                  <li class="last"><a href="http://www.sgmjournals.org" title="ALL SGM JOURNALS"><span>ALL SGM JOURNALS</span></a></li>
+               </ul>
+               		
+               <div class="sidebar-icon-group">
+                  			
+                  <div class="icons">
+                     			<a href="http://www.sgm.ac.uk/" rel="external-nw"><img src="/publisher/img/society_logo.gif" class="publisher-icon" alt="Society Logo" /></a>
+                     			<a href="http://www.the-icsp.org/" rel="external-nw"><img src="/publisher/img/icsp_logo.gif" class="publisher-icon" alt="ICSP Logo" /></a>
+                     			<a href="http://highwire.stanford.edu/" rel="external-nw"><img src="/publisher/img/hplogo.gif" class="hw-icon" alt="HighWire Press Logo" /></a>
+                     			
+                  </div>
+                  			
+                  <div class="sidebar-icon-text"><span>The <a href="http://www.sgmjournals.org"> Society for General Microbiology</a> publishes online with the assistance of <a href="http://highwire.stanford.edu">HighWire Press®</a>.</span></div>
+                  		
+               </div>
+               	
+            </div>
+            <div class="most-links-box js-marker">
+               
+               <div class="most-header">
+                  
+                  <h3>Most</h3>
+                  
+               </div>
+               
+               <ul>
+                  <li class="most-cur-sel">
+                     <h4>Viewed</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/1070?rss=1&amp;ssource=mfr">Proposal to consistently apply the International Code of Nomenclature of Prokaryotes (ICNP) to names of the oxygenic photosynthetic
+                                 bacteria (cyanobacteria), including those validly published under the International Code of Botanical Nomenclature (ICBN)/International
+                                 Code of Nomenclature for algae, fungi and plants (ICN), and proposal to change Principle 2 of the ICNP</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfr">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/316?rss=1&amp;ssource=mfr">Integrating genomics into the taxonomy and systematics of the Bacteria and Archaea</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/333?rss=1&amp;ssource=mfr">Applications of next-generation sequencing to unravelling the evolutionary history of algae</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/65/Pt_3/739?rss=1&amp;ssource=mfr">Notification that new names of prokaryotes, new combinations, and new taxonomic opinions have appeared in volume 64, part
+                                 12, of the IJSEM</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfr1.dtl" class="view-all">» View all Most Viewed articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+                  <li>
+                     <h4>Cited</h4>
+                     
+                     
+                     <div class="most-list">
+                        
+                        <ol>
+                           <li class="first-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4386?rss=1&amp;ssource=mfc">Chryseobacterium hispalense sp. nov., a plant-growth-promoting bacterium isolated from a rainwater pond in an olive plant
+                                 nursery, and emended descriptions of Chryseobacterium defluvii, Chryseobacterium indologenes, Chryseobacterium wanjuense and
+                                 Chryseobacterium gregarium</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_2/346?rss=1&amp;ssource=mfc">Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation
+                                 of prokaryotes</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/64/Pt_1/138?rss=1&amp;ssource=mfc">Aquibacter zeaxanthinifaciens gen. nov., sp. nov., a zeaxanthin-producing bacterium of the family Flavobacteriaceae isolated
+                                 from surface seawater, and emended descriptions of the genera Aestuariibaculum and Gaetbulibacter</a></li>
+                           <li><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4790?rss=1&amp;ssource=mfc">Kordia aquimaris sp. nov., a zeaxanthin-producing member of the family Flavobacteriaceae isolated from surface seawater, and
+                                 emended description of the genus Kordia</a></li>
+                           <li class="last-item"><a href="http://ijs.sgmjournals.org/cgi/content/short/63/Pt_12/4524?rss=1&amp;ssource=mfc">Erythrobacter odishensis sp. nov. and Pontibacter odishensis sp. nov. isolated from dry soil of a solar saltern</a></li>
+                        </ol>
+                        <a href="http://ijs.sgmjournals.org/reports/mfc1.dtl" class="view-all">» View all Most Cited articles</a>
+                        
+                     </div>
+                     
+                     
+                  </li>
+               </ul>
+               
+               
+            </div>
+            
+            
+            
+         </div>
+         <div id="footer">
+            
+            <div class="bar">
+               
+               <div class="footer-group footer-col-left">
+                  		
+                  <p class="copyright">Copyright ©
+                     		2015 International Union of Microbiological Societies
+                     	
+                  </p>
+                  	
+               </div>
+               
+               <div class="footer-group footer-col-right">
+                  	    
+                  <ul class="issns">
+                     <li>
+                        <span>Print ISSN: </span>
+                        <span class="issn">1466-5026</span>
+                        
+                     </li>
+                     <li>
+                        <span>Online ISSN: </span>
+                        <span class="issn">1466-5034</span>
+                        
+                     </li>
+                  </ul>
+                  	  
+               </div>
+               	  
+            </div>
+            
+            
+            <div class="block-2 sb-div"></div>
+            
+         </div><script type="text/javascript">
+        var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+        document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+        </script><script type="text/javascript">
+        try {
+        var pageTracker = _gat._getTracker("UA-189672-25");
+        pageTracker._setDomainName(".sgmjournals.org");
+        pageTracker._trackPageview();
+        } catch(err) {}
+        </script><script type="text/javascript">
+	(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+		(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+		m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+	})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+
+	ga('create', 'UA-48529861-1', '.sgmjournals.org');
+	ga('send', 'pageview');
+	</script></div>
+   </body>
+</html>
\ No newline at end of file
diff --git a/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.pdf b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.pdf
new file mode 100644
index 00000000..5c2ed86f
Binary files /dev/null and b/examples/ijsem-quickscrape/ijsemout-rsu-scraper/http_ijs.sgmjournals.org_content_63_Pt_12_4586.full/fulltext.pdf differ
diff --git a/examples/ijsem-quickscrape/mounce-old-ijsem.json b/examples/ijsem-quickscrape/mounce-old-ijsem.json
new file mode 100644
index 00000000..86dddcc7
--- /dev/null
+++ b/examples/ijsem-quickscrape/mounce-old-ijsem.json
@@ -0,0 +1,81 @@
+{
+  "url": "ijs\\.sgmjournals\\.org",
+  "elements": {
+    "publisher": {
+      "selector": "//meta[@name='DC.Publisher']",
+      "attribute": "content"
+    },
+    "journal": {
+      "selector": "//meta[@name='citation_journal_title']",
+      "attribute": "content"
+    },
+    "title": {
+      "selector": "//meta[@name='citation_title']",
+      "attribute": "content"
+    },
+    "authors": {
+      "selector": "//meta[@name='citation_author']",
+      "attribute": "content"
+    },
+    "date": {
+      "selector": "//meta[@name='citation_date']",
+      "attribute": "content"
+    },
+    "doi": {
+      "selector": "//meta[@name='citation_doi']",
+      "attribute": "content"
+    },
+    "volume": {
+      "selector": "//meta[@name='citation_volume']",
+      "attribute": "content"
+    },
+    "issue": {
+      "selector": "//meta[@name='citation_issue']",
+      "attribute": "content"
+    },
+    "firstpage": {
+      "selector": "//meta[@name='citation_firstpage']",
+      "attribute": "content"
+    },
+    "abstract": {
+      "selector": "//div[contains(@class, 'section abstract')]",
+      "attribute": "text"
+    },
+    "fulltext_html": {
+      "selector": "//meta[@name='citation_fulltext_html_url']",
+      "attribute": "content",
+      "download": {
+        "rename": "fulltext.html"
+      }
+    },
+    "fulltext_pdf": {
+      "selector": "//meta[@name='citation_pdf_url']",
+      "attribute": "content",
+      "download": {
+        "rename": "fulltext.pdf"
+      }
+    },
+    "supplementary_material": {
+      "selector": "//a[@rel='supplemental-data']",
+      "attribute": "href",
+      "download": true
+    },
+    "figure": {
+      "selector": "//div[contains(@class, 'fig-inline')]/a/img",
+      "attribute": "src",
+      "download": true
+    },
+    "figure_caption": {
+      "selector": "//div[contains(@class, 'fig-caption')]",
+      "attribute": "text"
+    },
+    "license": {
+      "selector": "//div[contains(@class, 'license')]",
+      "attribute": "text"
+    },
+    "copyright": {
+      "selector": "//div/p[contains(@class, 'copyright')]",
+      "attribute": "text"
+    }
+  }
+}	
diff --git a/examples/ijsem-quickscrape/rsu-new-ijsem.json b/examples/ijsem-quickscrape/rsu-new-ijsem.json
new file mode 100644
index 00000000..da95aa91
--- /dev/null
+++ b/examples/ijsem-quickscrape/rsu-new-ijsem.json
@@ -0,0 +1,93 @@
+{
+  "url": "ijs\\.sgmjournals\\.org",
+  "followables": {
+    "figure_expansion": {
+      "selector": "//div[contains(@class, 'fig-inline')]//a[text()='In this window']",
+      "attribute": "href"
+    },
+    "suppdata_expansion": {
+      "selector": "//a[@rel='supplemental-data']",
+      "attribute": "href"
+    }
+  },
+  "elements": {
+    "publisher": {
+      "selector": "//meta[@name='DC.Publisher']",
+      "attribute": "content"
+    },
+    "journal": {
+      "selector": "//meta[@name='citation_journal_title']",
+      "attribute": "content"
+    },
+    "title": {
+      "selector": "//meta[@name='citation_title']",
+      "attribute": "content"
+    },
+    "authors": {
+      "selector": "//meta[@name='citation_author']",
+      "attribute": "content"
+    },
+    "date": {
+      "selector": "//meta[@name='citation_date']",
+      "attribute": "content"
+    },
+    "doi": {
+      "selector": "//meta[@name='citation_doi']",
+      "attribute": "content"
+    },
+    "volume": {
+      "selector": "//meta[@name='citation_volume']",
+      "attribute": "content"
+    },
+    "issue": {
+      "selector": "//meta[@name='citation_issue']",
+      "attribute": "content"
+    },
+    "firstpage": {
+      "selector": "//meta[@name='citation_firstpage']",
+      "attribute": "content"
+    },
+    "abstract": {
+      "selector": "//div[contains(@class, 'section abstract')]",
+      "attribute": "text"
+    },
+    "fulltext_html": {
+      "selector": "//meta[@name='citation_fulltext_html_url']",
+      "attribute": "content",
+      "download": {
+        "rename": "fulltext.html"
+      }
+    },
+    "fulltext_pdf": {
+      "selector": "//meta[@name='citation_pdf_url']",
+      "attribute": "content",
+      "download": {
+        "rename": "fulltext.pdf"
+      }
+    },
+    "supplementary_material": {
+      "follow": "suppdata_expansion",
+      "selector": "//div[@id='content-block']//a",
+      "attribute": "href",
+      "download": true
+    },
+    "figure": {
+      "follow": "figure_expansion",
+      "selector": "//div[contains(@class, 'fig-expansion')]/a",
+      "attribute": "href",
+      "download": true
+    },
+    "figure_caption": {
+      "selector": "//div[contains(@class, 'fig-caption')]",
+      "attribute": "text"
+    },
+    "license": {
+      "selector": "//div[contains(@class, 'license')]",
+      "attribute": "text"
+    },
+    "copyright": {
+      "selector": "//div/p[contains(@class, 'copyright')]",
+      "attribute": "text"
+    }
+  }
+}
diff --git a/examples/ijsem/small/ijs.0.000026-0-000.pbm2/image/ijs.0.000026-0-000.pbm2.png b/examples/ijsem/small/ijs.0.000026-0-000.pbm2/image/ijs.0.000026-0-000.pbm2.png
new file mode 100644
index 00000000..35d9f3ef
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000026-0-000.pbm2/image/ijs.0.000026-0-000.pbm2.png differ
diff --git a/examples/ijsem/small/ijs.0.000109-0-000.pbm/image/ijs.0.000109-0-000.pbm.png b/examples/ijsem/small/ijs.0.000109-0-000.pbm/image/ijs.0.000109-0-000.pbm.png
new file mode 100644
index 00000000..784f114c
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000109-0-000.pbm/image/ijs.0.000109-0-000.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000117-0-000.pbm/image/ijs.0.000117-0-000.pbm.png b/examples/ijsem/small/ijs.0.000117-0-000.pbm/image/ijs.0.000117-0-000.pbm.png
new file mode 100644
index 00000000..8d0720c4
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000117-0-000.pbm/image/ijs.0.000117-0-000.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000158-0-000.pbm/image/ijs.0.000158-0-000.pbm.png b/examples/ijsem/small/ijs.0.000158-0-000.pbm/image/ijs.0.000158-0-000.pbm.png
new file mode 100644
index 00000000..1256630a
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000158-0-000.pbm/image/ijs.0.000158-0-000.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000174-0-000.pbm/image/ijs.0.000174-0-000.pbm.png b/examples/ijsem/small/ijs.0.000174-0-000.pbm/image/ijs.0.000174-0-000.pbm.png
new file mode 100644
index 00000000..b78652c8
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000174-0-000.pbm/image/ijs.0.000174-0-000.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000257-0-000.pbm/image/ijs.0.000257-0-000.pbm.png b/examples/ijsem/small/ijs.0.000257-0-000.pbm/image/ijs.0.000257-0-000.pbm.png
new file mode 100644
index 00000000..5e672768
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000257-0-000.pbm/image/ijs.0.000257-0-000.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000265-0-000.pbm/image/ijs.0.000265-0-000.pbm.png b/examples/ijsem/small/ijs.0.000265-0-000.pbm/image/ijs.0.000265-0-000.pbm.png
new file mode 100644
index 00000000..98860bcc
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000265-0-000.pbm/image/ijs.0.000265-0-000.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000349-0-001.pbm/image/ijs.0.000349-0-001.pbm.png b/examples/ijsem/small/ijs.0.000349-0-001.pbm/image/ijs.0.000349-0-001.pbm.png
new file mode 100644
index 00000000..0bdaa1c0
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000349-0-001.pbm/image/ijs.0.000349-0-001.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000364-0-002.pbm/image/ijs.0.000364-0-002.pbm.png b/examples/ijsem/small/ijs.0.000364-0-002.pbm/image/ijs.0.000364-0-002.pbm.png
new file mode 100644
index 00000000..ca931e8b
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000364-0-002.pbm/image/ijs.0.000364-0-002.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000364-0-004.pbm/image/ijs.0.000364-0-004.pbm.png b/examples/ijsem/small/ijs.0.000364-0-004.pbm/image/ijs.0.000364-0-004.pbm.png
new file mode 100644
index 00000000..db9336d3
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000364-0-004.pbm/image/ijs.0.000364-0-004.pbm.png differ
diff --git a/examples/ijsem/small/ijs.0.000406-0-000.pbm/image/ijs.0.000406-0-000.pbm.png b/examples/ijsem/small/ijs.0.000406-0-000.pbm/image/ijs.0.000406-0-000.pbm.png
new file mode 100644
index 00000000..57a52686
Binary files /dev/null and b/examples/ijsem/small/ijs.0.000406-0-000.pbm/image/ijs.0.000406-0-000.pbm.png differ
diff --git a/examples/theses/20130912_Fei_YAO.pdf b/examples/theses/20130912_Fei_YAO.pdf
new file mode 100644
index 00000000..3083fc2d
Binary files /dev/null and b/examples/theses/20130912_Fei_YAO.pdf differ
diff --git a/examples/theses/20130912_Fei_YAO/fulltext.pdf b/examples/theses/20130912_Fei_YAO/fulltext.pdf
new file mode 100644
index 00000000..3083fc2d
Binary files /dev/null and b/examples/theses/20130912_Fei_YAO/fulltext.pdf differ
diff --git a/examples/theses/20130912_Fei_YAO/fulltext.pdf.txt b/examples/theses/20130912_Fei_YAO/fulltext.pdf.txt
new file mode 100644
index 00000000..d27d2820
--- /dev/null
+++ b/examples/theses/20130912_Fei_YAO/fulltext.pdf.txt
@@ -0,0 +1,4116 @@
+Carbon-Based Nanomaterials as an Anode for Lithium
+Ion Battery
+Fei Yao, Costel Sorin Cojocaru
+To cite this version:
+Fei Yao, Costel Sorin Cojocaru. Carbon-Based Nanomaterials as an Anode for Lithium Ion
+Battery. Micro and nanotechnologies/Microelectronics. Ecole Polytechnique X, 2013. English.
+<pastel-00967913>
+HAL Id: pastel-00967913
+https://pastel.archives-ouvertes.fr/pastel-00967913
+Submitted on 31 Mar 2014
+HAL is a multi-disciplinary open access L’archive ouverte pluridisciplinaire HAL, est
+archive for the deposit and dissemination of sci- destine´e au de´poˆt et a` la diffusion de documents
+entific research documents, whether they are pub- scientifiques de niveau recherche, publie´s ou non,
+lished or not. The documents may come from e´manant des e´tablissements d’enseignement et de
+teaching and research institutions in France or recherche franc¸ais ou e´trangers, des laboratoires
+abroad, or from public or private research centers. publics ou prive´s.
+                      
+ 
+ 
+ 
+ 
+ 
+ 
+Carbon-Based Nanomaterials as an Anode 
+for Lithium Ion Battery 
+ 
+ 
+ 
+ 
+ 
+ 
+Fei YAO 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+LPICM-École Polytechnique, CNRS (UMR 7647)  
+Laboratoire de Physique des Interfaces et Couches Minces 
+Route de Saclay; 91128 PALAISEAU Cedex , France 
+ 
+ 
+ 
+ 
+The Graduate School 
+Sungkyunkwan University 
+Department of Energy Science (DOES) 
+IBS Center for Integrated Nanostructure Physics  
+300 Cheoncheon-dong, Jangan-gu, Suwon 440-746, R. O. Korea 
+ 
+ 
+                     
+ 
+THÈSE 
+ 
+Présentée pour obtenir le grade de 
+DOCTEUR DE L’ ÉCOLE POLYTECHNIQUE 
+Spécialité: Physique 
+Par 
+Fei YAO 
+ 
+ 
+ 
+Carbon-Based Nanomaterials as an Anode 
+for Lithium Ion Battery 
+ 
+ 
+ 
+ 
+ 
+ 
+Soutenue le 27 / 06 / 2013 devant le jury constitué de : 
+ 
+ 
+M. Jean-Pierre Pereira-Ramos Directeur de Recherche CNRS Rapporteur 
+M. Kee Seok Nahm Professor à Chonbuk National University Rapporteur 
+M. Won Sub Yoon Professor à Sungkyunkwan University Examinateur 
+M. Marc Chatelet Directeur de Recherche CNRS Examinateur 
+M. Costel-Sorin Cojocaru Chargé de recherche au CNRS Directeur de Thèse 
+Enseignant à l’École polytechnique  
+M. Young Hee Lee Professor à Sungkyunkwan University Directeur de Thèse 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+LABORATOIRE DE PHYSIQUE DES INTERFACES ET COUCHES MINCES (LPICM) 
+CNRS, UMR7647, ÉCOLE POLYTECHNIQUE 
+ 
+ 
+ 
+  
+ 
+The Graduate School 
+Sungkyunkwan University 
+June 2013
+ 
+ 
+ACKNOWLEDGMENTS 
+First and foremost, I would like to express my greatest gratitude to Prof. 
+Young Hee Lee and Dr. Costel Sorin Cojocaru, my advisors of graduate research, for 
+their patient guidance and continuous support throughout the last three years. They 
+taught me strict sense of research, humble attitude of study, and correct path in life. I 
+feel so lucky and honored for being their student in the most important days of my 
+growth. Their great fairness, concern and understanding will be appreciated through 
+all my life. 
+My sincere thanks are extended to all my coworkers, Dr. Fethullah Güneş, Mr. 
+Bing Li, Dr. Kangpyo So, Mr. Huy Quang Ta, Mr. Jian Chang, Mr. An Quoc Vu, Mr. 
+Seung Jin Chae, Dr. Hongyan Yue, Prof. Didier Pribat and Prof. Sishen Xie, in 
+Sungkyunkwan University. And also Dr. Seung Mi Lee from Center for 
+Nanocharacterization, Korea Research Institute of Standards, Dr. Kyeu Yoon Sheem 
+from Science and Samsung SDI Corporate R&D Center. 
+I would like to dedicate this thesis to my parents and sister for their continuous 
+understanding, support, and love. My deepest appreciation to my beloved husband, 
+Humin Li, for his love, encouragement and accompanying all the time!  
+ 
+ 
+TO MY PARENTS… 
+ 
+ 
+ ABSTRACT 
+ 
+ 
+ 
+In this thesis work, carbon-based nanomaterials used as an anode for 
+lithium ion battery have been generally investigated. Compared to typical 
+micron-sized carbon materials, nanosized carbon materials exhibited great 
+potentials not only in practical anode application but also in the fundamental 
+science exploration of Li ion diffusion. In the case of practical application, one 
+dimensional carbon nanofibers (CNFs) fabricated by electrospinning was 
+prepared for anode material. The structure involves neither a metal substrate nor 
+binders and therefore eventually benefited the capacity and long term stability. 
+Yet, the energy density is still limited to 370 mAh/g of conventional carbon. In 
+order to improve the capacity of raw carbon nanofibers, silicon, a high Li storage 
+material, was incorporated by electrochemical deposition. The resulted Si/CNF 
+mat improved clearly the capacity of carbon materials more than twice for most 
+of cases.  
+ 
+In the case of fundamental study, chemical vapor deposition (CVD)-
+synthesized two dimensional graphene was chosen to be a media to reveal the 
+diffusion pathways of Li ion. Compared to typical graphite which contains both 
+basal and edge planes, a well defined basal plane with large area can be realized 
+in graphene to provide a comprehensive picture of lithium diffusion mechanism. 
+We have discovered that electrochemical reaction of electrode 
+(substrate/graphene) not only is related to the number of graphene layers but also 
+relies on the defect sites on the basal plane of graphene. Combining the 
+experimental results and density functional theory calculations, we proved that 
+basal plane hindered lithium ion diffusion with a high diffusion barrier height, 
+whereas divacancies and higher order defects can be shortcuts for lithium ion 
+diffusion. 
+ 
+ 
+Keywords: nanocarbon materials, lithium ion battery, carbon nanofiber, silicon, 
+graphene, lithium ion diffusion 
+ 
+ 
+ 
+ 
+I 
+ 
+RESUME 
+ 
+ 
+ 
+Dans ce travail de thèse, nous avons exploré l’utilisation des nanomatériaux 
+à base de carbone comme anode pour les batteries lithium-ion. Par rapport aux 
+matériaux d’anode classiques qui sont de type carbone graphitique a des tailles de 
+grains de l’ordre du micromètre, les matériaux de carbone de taille nanométrique 
+présentent un grand potentiel non seulement pour l'application pratique en tant 
+que matériau d'anode, mais aussi du point de vue de la science fondamentale car 
+permettent l'exploration fine des phénomènes de diffusion des ions lithium. Dans 
+le cadre de l'application pratique, nous avons exploré les nanofibres 
+unidimensionnelles de carbone (CNF) en tant que matériau d'anode. Cette 
+structure d’anode comporte un substrat métallique comme collecteur de courant 
+mais n’avons pas utilisé des liants ce qui bénéficie a la stabilité à long terme. 
+Pourtant, la densité d'énergie que nous avons obtenu était encore limitée à 370 
+mAh /g similaire à celle du carbone conventionnel. Afin d'améliorer la capacité 
+des nanofibres de carbone bruts, nous les avons recouverts de silicium (par dépôt 
+électrochimique), un matériau d’insertion de lithium avec une bien plus 
+importante capacité de stockage. Le tapis hybrides Si / CNF ont permis 
+d'améliorer nettement la capacité des matériaux de carbone jusqu'à deux fois de 
+plus pour la plupart des cas. 
+ 
+    Du point de vue des études fondamentales, le graphène matériau 
+bidimensionnel, a été synthétisé par dépôt chimique en phase vapeur (CVD) et 
+utilisé comme un support pour mettre en évidence les chemins de diffusion des 
+ions lithium. Par rapport à du graphite classique qui contient à la fois les deux 
+plans de type basal et prismatique, seulement un plan basal bien défini et d’une 
+grande surface spécifique peut être réalisé dans le cas du graphène. Nous avons 
+découvert que la réaction électrochimique a l'électrode (substrat / graphène) est 
+non seulement liée au nombre de couches de graphène mais s'appuie également 
+sur la présence de défauts dans le plan de graphène. Combinant les résultats 
+expérimentaux et les calculs de théoriques, nous avons pu prouver que le plan 
+basal empêche la diffusion des ions de lithium avec une hauteur de barrière de 
+diffusion élevé, alors que les divacancies et les défauts d'ordre supérieur peuvent 
+constituer des raccourcis pour la diffusion des ions de lithium. 
+ 
+ 
+Keywords: Matériaux des nanocarbonés, batterie lithium-ion, nanofibre de 
+carbone, Silicium, graphène, diffusion des ions lithium 
+II 
+ 
+Table of Contents 
+1 
+Introduction 
+Bibliography of Introduction 4 
+Chapter 1. Overview of Rechargeable Lithium Ion Battery 
+1.1   Electrochemical Energy Storage Systems 6 
+1.2  Rechargeable Lithium Based Battery 8 
+1.3  Rechargeable Lithium Ion Battery 11 
+Bibliography of Chapter 1 13 
+Chapter 2. Carbonaceous Materials as An Anode of Li-Ion Battery  
+2.1   Operation Mechanism of Li-Ion Battery 16 
+2.2  Classification of Carbonaceous Materials 21 
+2.2.1  Graphitic Carbon 21 
+2.2.2 Non-graphitic Carbon 22 
+2.3   Lithium Intercalation into Carbonaceous Materials 24 
+2.3.1 Lithium Intercalation into Graphitic Carbon Materials 24 
+2.3.1-1  Description 24 
+2.3.1-2  Charge/Discharge Profile of Graphitic Carbon Materials 26 
+2.3.2  Lithium Intercalation into Non-graphitic Carbon Materials 29 
+III 
+ 
+2.3.2-1  Low Specific Charge Carbon 29 
+2.3.2-2  High Specific Charge Carbon 31 
+2.4  Summary of Chapter Two 36 
+Bibliography of Chapter 2 38 
+Chapter 3. Silicon-Coated Carbon Nanofiber Mat for Anode of Lithium 
+Ion Battery  
+One Dimensional Carbon Materials as an Anode Material for 
+3.1   51 
+LIB 
+3.1.1  General Introduction of CNFs and CNTs 51 
+3.1.2  CNFs and CNTs Using as an Anode Material for LIB 56 
+3.1.3  Fabrication Methods of CNFs and CNTs 58 
+3.1.3-1  Chemical Vapor Deposition for Both CNFs and CNTs 58 
+3.1.3-2  Electrospinning Method for CNFs Mat 63 
+Electrospinning Fabricated CNFs Mat as an Anode Material 
+3.2   66 
+for LIB 
+SEM and Raman Characterization of CNFs Synthesized 
+3.2.1  67 
+Through Electrospinning 
+Anode Performance of CNFs Synthesized Through 
+3.2.2  69 
+Electrospinning 
+3.3.3 Anode Performance of CNF-Si Mat 83 
+IV 
+ 
+3.4   Summary of Chapter Three 95 
+Bibliography of Chapter 3 97 
+Chapter 4. Diffusion Mechanism of Lithium Ions through Basal Plane of 
+Layered Graphene 
+4.1 Brief Introduction of Two Dimensional Graphene 105 
+4.1.1 General Physical Properties of Graphene 105 
+4.1.2 Synthesis Methods of Graphene 110 
+Diffusion Mechanism of Lithium Ions through Basal Plane of 
+4.2 113 
+Layered Graphene 
+4.2.1 Material Preparation 116 
+4.2.2 Transfer Process of Graphene 116 
+4.2.3 Characterization of Graphene 117 
+4.2.4 Anode Performance of Graphene 121 
+4.3 Summary of Chapter Four 140 
+Bibliography of Chapter 4 141 
+ 
+ 
+ 
+ 
+V 
+ 
+List of Tables 
+Table 3.1 Anode performance comparison of silicon/CNF composites 89 
+fabricated by different methods. CNF film is usually fabricated 
+by mixing CNF powder with a binder. CNF mat is binder-free 
+freestanding film fabricated by electrospinning method. 
+Table 4.1 Defects related Li adsorption energy, and Li atomic charges 137 
+calculated by Mulliken, Hirshfeld, and electrostatic potential 
+(ESP) at the minimum energy configurations (M) and the barrier 
+states (B). Positive charge indicates charge depletion from 
+lithium atom.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+VI 
+ 
+List of Figures 
+Fig. 1.1 Ragone plot showing energy density vs. power density for 7 
+various energy storage devices. 
+Fig. 1.2  Comparison of the different battery technologies in terms of 8 
+volumetric and gravimetric energy density. 
+Fig. 1.3 Schematic representation of lithium batteries. a, Rechargeable 10 
+lithium-metal battery, dendrite formation was shown in the 
+negative electrode. b, Rechargeable lithium-ion battery.   
+Fig. 1.4 Current issues remaining in different types of anode materials. 12 
+Fig. 2.1 Schematic illustration of detailed charge/discharge process in Li- 15 
+ion battery.   
+Fig. 2.2 Potential profile of anode and cathode during charge/discharge.    17 
+Fig. 2.3 Charge curves of different metals (M) with respect to highly 18 
+oriented turbostratic pitch carbon fibers.    
+Fig. 2.4 Left: Schematics of the crystal structure of hexagonal graphite 20 
+with an AB stacking order. Right: view perpendicular to the 
+basal plane of graphite. Edges can be subdivided into arm-chair 
+and zigzag faces.     
+Fig. 2.5 Schematic indications of (a) graphite and (b) non-graphitic 23 
+(disordered) carbonaceous material. 
+Fig. 2.6 Structure indications of LiC6. (a) Left: schematic drawing 25 
+showing the AA layer stacking sequence with Li intercalation. 
+Right: simplified representation. (b) Perpendicular view to the 
+basal plane of LiC6. (c) Enlarged schematic of AA stacking 
+order. 
+VII 
+ 
+Fig. 2.7 Schematic indication of stage formation during Li ion 26 
+intercalation into graphite layers. 
+Fig. 2.8 Constant current charge/discharge curves of the graphite 27 
+(Timrex KS 44, Cirr is the irreversible specific charge, and Crev is 
+the reversible specific charge). 
+Fig. 2.9 Constant current charge/discharge curves of a coke (Conoco). 31 
+(Cirr is the irreversible specific charge, Crev the reversible 
+specific charge).  
+Fig. 2.10 a) Storage mechanisms of Li ions in graphite. b) Li storage in a 33 
+form of Li2 covalent molecules. c) Schematic model of Li 
+storage in cavities and nanopores. d) Li adsorption on the two 
+sides of an isolated graphene sheet.  
+Fig. 2.11 Constant current charge/discharge curves (1st and 2nd cycle) of 34 
+a high specific charge carbon material after heat treatment at 700 
+°C. (Cirr is the irreversible specific charge, Crev the reversible 
+specific charge). 
+Fig. 3.1 Schematic comparison of the diameter dimensions on a log scale 52 
+for various types of fibrous carbons.        
+Fig. 3.2 Wrapping of graphene sheet to form SWNT. 53 
+Fig. 3.3 Schematic indications of (a) SWCNT, (b) MWCNT, and the 54 
+corresponding TEM images in (c) and (d). 
+Fig. 3.4 Chiral vector $\vec{C}_h$ and chiral angle θ definition for a (2, 4) 55 
+nanotube on graphene sheet. $\vec{a}_1$ and $\vec{a}_2$ are the unit cell vectors 
+of the two-dimensional hexagonal graphene sheet. The 
+circumference of nanotube is given by the length of chiral 
+vector. The chiral angle θ is defined as the angle between 
+VIII 
+ 
+chiral vector and the zigzag axis. 
+Fig. 3.5 CVD process-fabricated (a) CNT powder, (b) vertically aligned 59 
+CNTs, and (c) CNF planar network. 
+Fig. 3.6 Typical anode assembling based on CVD process fabricated 62 
+carbon powder. 
+Fig. 3.7 Schematic of CNF mat fabrication processes: (a) schematic of 65 
+electrospinning apparatus and (b) the fabricated nanofiber 
+network. 
+Fig. 3.8 SEM images of as-synthesized CNFs with (a) top view and (b) 68 
+cross-sectional images. 
+Fig. 3.9 Micro Raman spectra of CNFs mat fabricated by electrospinning 68 
+method. 
+Fig. 3.10 (a) Voltage profiles electrospinning fabricated CNF mat between 70 
+0.01 and 2 V at a charging rate of 0.1 C. The cycle numbers are 
+indicated in the figure. (b) Rate performance and columbic 
+efficiency of the above sample. 
+Fig. 3.11 (a) Structure deformation indication of Si based film/particles 73 
+before and after charge/discharge cycling. (b) SEI images of 
+CVD deposited Si thin film on Cu substrate after 
+1st and 30th 
+cycles of charge/discharge. 
+Fig. 3.12 Schematic of the apparatus for electrodeposition of Si. The cell 74 
+consists of three electrodes: working electrode (as-fabricated 
+CNF mat), counter electrode (Pt wire) and reference electrode 
+(Ag/Ag⁺). During the deposition, 
+a Si-containing electrolyte 
+(SiCl4 in PC) was added into the cell and a cyclic voltage scan 
+(20 mV s⁻¹) 
+was applied to the electrodes. 
+IX 
+ 
+Fig. 3.13 (a) Cyclic voltammograms of silicon electrodeposition in PC 76 
+solution with/without SiCl4 at a scan rate of 20 mV s⁻¹. 
+(b) Mass 
+and thickness of Si/CNF mat with respect to different silicon 
+deposition cycles. The error bar is added in the figure. 
+Fig. 3.14 (a) Micro-Raman spectra of bare CNF mat and Si/CNF mat with 78 
+200 cycles of Si deposition before/after annealing, indicated as 
+Si-200-p and as Si-200-a in the figure. (b) XPS spectra of the 
+electrode surface with active materials consisting of Si-200-p 
+and Si-200-a, respectively. 
+Fig. 3.15 SEM images of (a) Si-200-p and (b) Si-200-a samples. Dark 79 
+color portion indicates electrolyte residues on the surface of 
+CNF mat. After 1000 °C annealing, the uniform mat surface was 
+observed by the removal of electrolyte, as shown in (b).    
+Fig. 3.16 (a) SEM images of as-synthesized bare CNFs and (b) Si-200-a. 80 
+The cross-sectional images are shown in the insets. (c) AFM 
+image of Si-200-a. The high resolution image of dashed square 
+in (c) is shown in (d). 
+Fig. 3.17 (a) TEM image of Si-200-a. The EDS line profile along the 81 
+dashed line is shown in (b). 
+Fig. 3.18 High-resolution XPS spectra of Si/CNF with 200 cycles of Si 83 
+deposition before and after annealing. Figure (a) and (c) are C 1s 
+and Si 2p fitted peaks before annealing. (b) and (d ) are C 1s and 
+Si 2p fitted peaks after 1000 °C annealing. Peak positions and 
+relative ratios are shown in the figure. 
+Fig. 3.19 (a) CV profile comparison between bare CNF mat and CNF mat 84 
+after 1000 °C annealing. The curves were recorded after 1st CV 
+scan between 0.01 to 2 V at a scan rate of 0.1 mV s⁻¹. 
+(b) AC 
+X 
+ 
+impedance spectra of the above two electrodes. The spectra were 
+recorded right after the cell assembling before cycling. 
+Fig. 3.20 (a) The 2nd and 10th cyclic voltammograms of CNF-a (square), 86 
+Si-200-p (dashed line) and Si-200-a (solid line) mats 
+between 0.01 and 2 V 
+at a scan rate of 0.1 mV s⁻¹. 
+(b) and (c) are voltage 
+profiles of Si-200-p/Si-200-a and CNF-a/Si-200-a between 0.01 
+and 2 V at a charging rate of 0.1 C. The cycle numbers are 
+indicated in the figure. (d) Charge/discharge capacity and 
+Coulombic efficiency of Si-200-a for the first 80 cycles. 
+Fig. 3.21 (a) Charge (filled symbols)/discharge (open symbols) capacity in 90 
+terms of different numbers of silicon deposition cycles after high 
+temperature annealing. Capacity was calculated based on silicon 
+mass only. Sample indications are shown in the right dashed 
+square. (b) AC impedance spectra of the above five electrodes. 
+The spectra were recorded right after the cell assembling before 
+cycling. The equivalent circuit is shown in the inset. The related 
+resistance value in Figure (b) was plotted in Figure (c) with 
+respect to different silicon deposition cycles. 
+Fig. 3.22 SEM images of (a-b) Si-1500-p and (c-d) Si-1500-a samples. 92 
+Fig. 3.23 Characterizations of Si-200-a electrode after 80 cycles 94 
+charge/discharge. (a) Top-view SEM image, (b) Cross-sectional 
+SEM image, (c) High resolution TEM image, and (d) AFM 
+image. The SEI layer was selectively removed by washing the 
+sample with acetonitrile and diluted HCl. 
+Fig. 4.1 Graphene is a basic 2D building block for other carbon 106 
+allotropes with different dimensionalities. 
+Fig. 4.2 a) Honeycomb lattice of graphene with two carbon atoms per 107 
+XI 
+ 
+unit cell. b) Tight-binding band structure of graphene π-bands, 
+considering only nearest neighbor hopping. c) Band structure 
+near K point showing the linear dispersion relation. 
+Fig. 4.3 Electronic Structure of: a) Metal: Finite Density of States (DOS) 109 
+at Fermi energy. b) Semiconductor: Gap at Fermi energy. c) 
+Graphene: Zero gap Semiconductor. Zero DOS metal. 
+Fig. 4.4 Production techniques of graphene: a) Micro-cleavage method, 112 
+isolating graphitic layers from graphite into monolayer graphene 
+flakes with the help of a cohesive tape, b) epitaxial growth of 
+graphene by decomposition of SiC into graphene, c) chemical 
+vapor deposition method by decomposition of hydrocarbon 
+gases on metal substrates, and d) chemical exfoliation of 
+graphite oxide by weakening van der Waals cohesive force via 
+insertion of reactants into interlayer space. 
+Fig. 4.5 Schematic of fabrication process with Cu-grown SLG or Ni- 117 
+grown MLG (left panel). Bilayer and trilayer graphene can be 
+fabricated by transferring monolayer graphene repeatedly. 
+Photograph of as-prepared monolayer graphene (PMMA on top) 
+floating in water and CR 2032 coin cell case (right panel). 
+Fig. 4.6 Schematic of a coin cell structure with Cu-grown SLG or Ni- 118 
+grown MLG. Bilayer and trilayer graphene coin cells were 
+fabricated by transferring monolayer graphene repeatedly. 
+Fig. 4.7 Optical micrographs of (a) Cu-grown SLG and (b) Ni-grown 120 
+MLG on SiO2/Si substrate. White dashed lines indicate wrinkles. 
+Some portion of thicker graphene is indicated by arrows. (c) 
+Schematic of (i) SLG with a well defined basal plane and (ii) 
+edge plane enriched MLG. (d) Micro-Raman spectra of SLG and 
+MLG. Confocal Raman mapping of D/G intensity ratio of (e) 
+XII 
+ 
+SLG and (f) MLG from squared positions of (a) and (b). The 
+contrast is normalized to 0.4 to visualize the defect distribution 
+for both images. (g) Wavelength-dependent transmittance 
+(values are provided at a wavelength of 550 nm) and (h) optical 
+photographs of different number of graphene layers on PET 
+substrate. 
+Fig. 4.8 (a) Cyclic voltammograms of different number of graphene 123 
+layers samples at a scan rate of 0.1 mV/s. SUS-related redox 
+reaction peaks (SO, SR) and lithium intercalation/deintercalation 
+related peaks (LiIn/LiDe) are marked in the figure. 
+(b) 1st and (c) 2nd 
+galvanostatic charge/discharge profiles 
+of different number 
+of graphene layers at a current density of 5 µA/cm². 
+(d) The 
+related layer-dependent capacities. Two regimes of corrosion-
+dominant and lithiation-dominant are indicated. 
+Fig. 4.9 Cyclic voltammograms at a scan rate of 0.1 mV/s (a) and 2nd 125 
+galvanostatic charge/discharge profiles 
+at a current density of 5 
+µA/cm² (b) of bare CR2032 coin cell case 
+and foil SUS 316. 
+Fig. 4.10 AC impedance spectra obtained by applying a sine wave with an 128 
+amplitude of 10 mV over a frequency range from 100 kHz to 10 
+mHz. The inset shows impedance at higher frequency region to 
+demonstrate charge transfer resistance. 
+Fig. 4.11 Theoretically estimated capacity based on LiC6 intercalation. No 130 
+absorption of Li ions occurs at monolayer graphene. 
+Fig. 4.12 (a) Raman spectra, (b) cyclic voltammograms at a scan rate of 134 
+0.1 mV/s, and (c) 2nd galvanostatic charge/discharge profiles at 
+a current density of 5 µA/cm² for monolayer graphene 
+treated by 
+Ar plasma with different plasma powers (15 W and 100 W). 
+(d) Capacity of 2nd charge as a function of number of 
+graphene 
+XIII 
+ 
+layers under different Ar plasma powers. Absolute slopes 
+according to different plasma powers and critical layer thickness 
+(lc) are indicated in the figure. (e) Schematics of proposed Li 
+diffusion mechanism through defects on the basal plane with 
+different defect population. Broad down arrows indicate Li ion 
+diffusion through defect sites of basal plane. Red glows 
+represent steric hindrance for Li ion diffusion formed by the 
+accumulated Li ions or functional groups. The inset in the right 
+indicates the relative magnitude of diffusion coefficient. (f) 
+Relationship of D/G ratio with the extracted slope from (d). 
+Fig. 4.13 Side and top views of atomic configurations (top panel), 137 
+isosurface images of electrostatic potential (second panel), bond 
+ 
+ lengths and local charge distributions at the barrier states (third 
+ 
+panel), and the diffusion barrier profiles of Li (bottom panel) 
+ 
+ through (a) graphene hexagonal site (H site), (b) Stone-Wales 
+ 
+(SW) defect (c) monovacancy (V1), and (d) divacancy (V2). 
+ 
+ Isovalue for rendering isosurfaces is 0.25 e/Å³. The insets in the 
+ 
+third panel show isosurface image of electrostatic potential for 
+ 
+ each corresponding structure without Li ion. Bond lengths 
+ 
+(yellow color) and electrostatic potential charges (white color) 
+ 
+ are in units of Å and electrons, respectively. 
+ 
+  
+ 
+ 
+ 
+ 
+  
+XIV 
+ 
+INTRODUCTION 
+ 
+The issue of the sustainability of energy supply has attracted worldwide 
+concern due to the crisis in rapid depletion of fossil energy resources along with 
+serious environmental pollution issues. Over the past several decades, 
+tremendous efforts have been made in developing alternative technologies to 
+harvest and store sustainable clean energy. Thanks to the development of 
+nanoscience and nanotechnology, clean energy technologies are progressing 
+impressively which makes them more practical and price competitive with fossil 
+fuels. Clean energy technology covers production, storage, and conversion. 
+Researches on energy production from renewable natural resources include solar 
+energy conversion, wind, geothermal and hydraulic energy and involve often 
+heavy engineering works. Our main concern using nanoscience from basic 
+science point of view is energy storage. Among all different kinds of energy 
+storage systems, rechargeable lithium-ion battery (LIB) is one of the greatest 
+successes of modern material electrochemistry. It has drawn the most attention 
+not only because of its higher energy density and longer cycle life compared to 
+any existing battery systems but also its lightweight and compact which benefit 
+the application in hybrid vehicles and portable electronics [1]. 
+ 
+LIB consists of an anode (negative electrode) and a cathode (positive 
+electrode). These two electrodes are capable of reversibly hosting lithium in ionic 
+1 
+ 
+form. Common candidates for the cathode are lithiated metal oxides and 
+carbonaceous materials for the anode. Prior to the discovery of graphite anode 
+materials, lithium metal had been used. However, possibility of thermal runaway 
+caused by the internal shorts triggered by the formation of lithium dendrites has 
+been a long standing issue [2]. The use of graphite as an anode material for 
+intercalating lithium ions in rechargeable LIB was then proposed [3]. It is still the 
+main stream of anode material for commercial LIB up to now due to its well 
+defined layered structure for lithium intercalation, low operating potential, and 
+remarkable interfacial stability [4]. Unfortunately, the intercalation capacity of 
+lithium ions in graphite is limited to 372 mAh/g with LiC6 stoichiometry. 
+Numerous efforts have been made to increase this value by modifying the 
+crystallinity, the microstructure, and the micromorphology of the carbonaceous 
+material [5-8]. These structural parameters play a crucial part in determining and 
+optimizing the electrochemical performance of carbon anodes. 
+ 
+The exploration of nanomaterials and nanocomposites provides us new 
+opportunities to improve the anode performance of LIB. Compared to 
+micrometer-scaled carbon material, nanostructured carbon exhibits differences 
+not only in dimensionality and morphology, but also in the distribution of 
+chemical bonding which allows the mixtures of local electronic structures 
+between sp² and sp³ [9]. 
+Therefore, carrier transport properties are different from 
+classic carbon material when nanometer-scaled carbon is in contact with 
+2 
+ 
+reactants. Nanostructured carbon materials with high accessible surface areas and 
+short diffusion time for lithium ions open new perspectives for high energy 
+density and high power density LIB.  
+ 
+In order to fully develop the potential of nanoscaled carbon as an anode for 
+LIB, a systematical study is needed. In this thesis work, after a brief overview of 
+LIB (chapter one), fundamentals that provide the basic idea of operation 
+mechanism in LIB, types of conventional carbon anode materials, and their 
+anode performance will be reviewed in chapter two. Chapter three will mainly 
+focus on studying the one dimensional carbon nanofiber anode material. An easy 
+fabrication process, electrospinning, which is good for mass production is 
+introduced for raw carbon nanofiber synthesis. In order to improve the 
+performance of raw carbon nanofiber, Si, a high Li storage material, is 
+incorporated through electrochemical deposition method. Using nanoscaled 
+carbon material for fundamental research of lithium ion diffusion pathway is 
+given in chapter four. Here, two dimensional graphene synthesized by chemical 
+vapor deposition is chosen to study the nature of Li ion diffusion since it is the 
+basic building block of graphite which is the most common material for anode. 
+ 
+Finally, a general conclusion and perspectives are given. 
+ 
+ 
+3 
+ 
+Bibliography of Introduction 
+[1] J. M. Tarascon, M. Armand, Nature 2001, 414, 359.  
+[2] F. Orsini, et al., J. Power Source 1999, 81, 918. 
+[3] M. Armand, P. Touzain, Materials Science and Engineering 1977, 31, 
+319. 
+[4] M. Winter, O. J. Besenhard, E. M. Spahr, P. Novák, Adv. Mater. 1998, 
+10, 725. 
+[5] M. Winter, J. O. Besenhard, Lithium Ion Battery: Fundamentals and 
+Performance 1998 (Eds.: M. Wahihara, O. Yamamoto), Wiley-VCH, 
+Weinheim. 
+[6] A. Mabuchi, K. Tokumitsu, H. Fujimoto, T. Kasuh, J. Electrochem. Soc. 
+1995, 142, 1041. 
+[7] W. Ruland, J. Appl. Phys. 1967, 38, 3585. 
+[8] M. Endo, C. Kim, K. Nishimura, T. Fujino, K. Miyashita, Carbon 2000, 
+38, 183. 
+[9] D. S. Su, R. Schlögl, ChemSusChem, 2010, 3, 136. 
+  
+  
+  
+4 
+ 
+ Outline of Chapter One 
+ 
+Overview of Rechargeable Lithium Ion Battery 
+ 
+ 
+1.1   Electrochemical Energy Storage Systems 6 
+1.2  Rechargeable Lithium Based Battery 8 
+1.3  Rechargeable Lithium Ion Battery 11 
+Bibliography of Chapter 1 13 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+5 
+ 
+CHAPTER ONE 
+Overview of Rechargeable Lithium Ion Battery  
+1.1 Electrochemical Energy Storage Systems 
+Systems for electrochemical energy storage convert chemical energy into 
+electrical energy. Electrochemical energy storage devices basically include 
+batteries, fuel cells, and electrochemical capacitors (ECs). Although the 
+mechanisms for energy storage and conversion are different, similarities do exist 
+among these three systems. Common features are that batteries, fuel cells, and 
+ECs consist of two electrodes which are in contact with electrolyte. Requirements 
+upon electron and ion conduction in electrodes and electrolyte are valid for all 
+three systems. Furthermore, electron and ion transport are separated during the 
+charge/discharge processes which take place at the phase boundary of the 
+electrode/electrolyte interface [1]. The main difference between battery, fuel cell 
+and ECs is the way of electrical energy generation. In batteries and fuel cells, 
+electrical energy is produced by conversion of chemical energy via redox 
+reactions (Faradic process) at the anode and cathode. On the other hand, in ECs, 
+energy may not be delivered via redox reactions but rather via the formation of 
+electrical double layers (non-Faradic process) by orientation of electrolyte ions at 
+the electrode/electrolyte interface, and thus the use of the terms anode and 
+cathode may not be appropriate [2].  
+ 
+6 
+ 
+In order to value the energy contents of a system, terms of “energy density” 
+(or “specific energy”) and “power density” (or “specific power”) are used. 
+“Energy density” is expressed in watt-hours per liter (Wh/L) [or in watt-hours per 
+kilogram (Wh/kg)] and “power density” is expressed in watt per liter (W/L) [or 
+in watt per kilogram (W/kg)] [2]. To compare the performance of various energy 
+storage devices, a representative chart known as the Ragone plot was developed. 
+In such a plot, the values of specific energy (in Wh/kg) are plotted versus specific 
+power [3], as shown in Figure 1.1. It is clear to see that fuel cell can be 
+considered as high energy density system and supercapacitor as high power 
+density system. However, battery has intermediate energy and power 
+characteristics. Compared to fuel cells and supercapacitors, batteries have 
+realized the biggest application markets so far. Whereas supercapacitors have 
+found their own position as memory protection in several electronic devices and 
+instantaneous power backup systems, fuel cells are basically still in the 
+development stage [1]. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+7 
+ 
+Figure 1.1. Ragone plot showing energy density vs. power density 
+for various energy storage devices. Cited and modified from Ref. [3]. 
+ 
+1.2 Rechargeable Lithium Based Battery 
+There are two types of batteries: primary batteries that are designed to be 
+used once and discarded, and secondary batteries that are designed to be 
+recharged and used multiple times. Therefore, they are also named as disposable 
+batteries and rechargeable batteries. Common types of disposable batteries such 
+as zinc–carbon battery cannot be reliably recharged, since the chemical reactions 
+are not easily reversible and active materials cannot recover to the original forms 
+[4]. On the other hand, electrochemical reactions in rechargeable batteries such as 
+nickel-cobalt battery and lithium-based batteries are electrically reversible.  
+ 
+Figure 1.2. Comparison of the different battery technologies in terms 
+8 
+ 
+of volumetric and gravimetric energy density. Cited from Ref. [5]. 
+ 
+Considering the requirements of modern society with popular portable 
+electronics, rechargeable batteries are more favorable nowadays. The 
+development of rechargeable batteries is a long story. To this date, among various 
+existing technologies, such as lead-acid, Ni-Cd, nickel-metal hydride (Ni-MeH), 
+Li-based batteries draw the most attention because of their high energy density 
+and possibility of compact-flexible design, as indicated in Figure 1.2. Combining 
+the profound mechanism study and the involvement of advanced materials, they 
+have become the most dominant power source for cell phones, digital cameras, 
+laptops etc. According to the recent market investigation, the share of worldwide 
+sales for Ni–Cd and Ni–MeH batteries are 23 and 14%. However, Li-ion portable 
+batteries take up to 63% of the battery market [5]. 
+     
+The starting point of incorporating lithium metal in battery technology is the 
+fact that lithium is the most electropositive (–3.04 V vs. standard hydrogen 
+electrode) as well as the lightest (specific gravity ρ = 0.53 g cm$^{-3}$) metal which 
+benefits the design of high energy density system [5]. Lithium metal as an anode 
+was firstly reported in 1970 where TiS2 was used as a cathode [6-8]. However, 
+Li-metal cells encountered many problems. One of the shortcomings is the redeposition 
+of lithium in metallic form and uneven dendrite formation during subsequent 
+charge/discharge cycles, as shown in Figure 1.3a. This could lead to a short 
+9 
+ 
+circuit problem and thus explosion issues [9]. Therefore, even though Li-metal 
+based cells exhibit the highest energy density as shown in Figure 1.2, their 
+practical application is limited. Inspired by the development of positive 
+electrodes which used LixMO2 (where M is Co, Ni or Mn) as a host 
+material for Li ions [10-11], Li metal is no longer necessarily required. Therefore, the 
+so-called Li-ion or rocking-chair battery concept, which introduces a second 
+host material to replace Li metal, emerged to solve the safety issues of 
+rechargeable Li-metal batteries, as shown in Figure 1.3b [12-15].  
+ 
+Figure 1.3. Schematic representation of lithium batteries. a, 
+10 
+ 
+Rechargeable lithium-metal battery, dendrite formation was shown 
+in the negative electrode. b, Rechargeable lithium-ion battery. 
+Cited from Ref. [5]. 
+ 
+1.3 Rechargeable Lithium Ion Battery 
+The configuration of Li-ion battery electrodes is two types of lithium host 
+materials (Figure 1.3b). The storage capacity of the battery is given by the 
+amount of Li that can be stored reversibly in these two electrodes. To be clear, for 
+rechargeable Li-metal batteries, the positive host electrode does not need to be 
+lithiated before cell assembly since metallic Li is used as the negative 
+electrode. In contrast, for Li-ion batteries, the positive host electrode usually acts 
+as a source of Li since the common negative electrode such as carbon, Si, 
+transition metal oxide contains no Li. Thus, air-stable Li-based intercalation 
+compounds in positive electrode are required to complete the cell assembly.  
+ 
+The structural stability of the host material during insertion and de-insertion 
+of Li ions is a critical factor since it determines the long term stability of Li-ion 
+battery. Generally, anode materials can be classified into three categories 
+according to the Li storage mechanisms besides graphite: alloying, insertion, 
+conversion. Most of these materials show different disadvantages compared to 
+graphite, as indicated in Figure 1.4. In the case of Li alloy (Si, Sn, Ge, Al, Pb 
+etc) and conversion-based electrodes (CoO, Fe2O3 etc), the volume change 
+11 
+ 
+between the Li-containing states and the corresponding lithium-free states is very 
+large due to the mechanical stresses generated during charge/discharge cycles. 
+Therefore, the cracks are easily produced and thus the electrodes collapse. So the 
+cycle life is very much limited. In the case of insertion based materials (TiO2, 
+MoO2 etc), rather low capacity is the key factor needed to be improved. In 
+contrast, materials with a two-dimensional layered structure, such as carbonaceous 
+materials, show good cycling behavior since this kind of Li$^+$ insertion material 
+exhibits low mechanical strain with small volume changes [2, 5, 12-15]. At the 
+present time, research and development activities are mainly focused on such 
+highly reversible carbonaceous materials. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 1.4. Current issues remaining in different types of anode 
+materials.  
+ 
+ 
+12 
+ 
+Bibliography of Chapter 1 
+ 
+[1] M. Winter, R. J. Brodd, Chem. Rev 2004, 104, 4245. 
+[2] B. E. Conway, Electrochemical Supercapacitors: Scientific Fundamentals 
+and Technological Applications 1999. 
+[3] The plot shown here is based on the data provided by Maxwell 
+Technologies: http://www.maxwell.com. 
+[4] Alkaline Manganese Dioxide Handbook and Application Manual, 2008. 
+[5] J. M. Tarascon, M. Armand, Nature 2001, 414, 359. 
+[6] T. Ikeda, H. Tamura, Proc. Manganese Dioxide Symp. 1975, Vol. 1, (IC 
+sample Office, Cleveland, OH). 
+[7] M. S. Whittingham, Science 1976, 192, 1226. 
+[8] M. S. Whittingham, US Patent 4009052. 
+[9] F. Orsini, et al., J. Power Sources 1999, 81, 918. 
+[10] K. Mizushima, P. C. Jones, P. J. Wiseman, J. B. Goodenough, Mat. Res. 
+Bull. 1980, 15, 783. 
+[11] M. M. Thackeray, W. I. F. David, P. G. Bruce, J. B. Goodenough, Mat. 
+Res. Bull. 1983, 18, 461. 
+[12] D. W. Murphy, F. J. DiSalvo, J. N. Carides, J. V. Waszczak, Mat. Res. 
+Bull. 1978, 13, 1395. 
+[13] M. Lazzari, B. Scrosati, J. Electrochem. Soc. 1980, 127, 773. 
+[14] M. Mohri, et al., J. Power Sources 1989, 26, 545. 
+[15] J. R. Dahn, U. V. Sacken, M. W. Juzkow, H. Al-Janaby, J. Electrochem. 
+13 
+ 
+Soc. 1991, 138, 2207. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+14 
+ 
+ Outline of Chapter Two 
+ 
+Carbonaceous Materials as an Anode of Li-Ion Battery 
+ 
+2.1   Operation Mechanism of Li-Ion Battery 16 
+2.2  Classification of Carbonaceous Materials 21 
+2.2.1  Graphitic Carbon 21 
+2.2.2 Non-graphitic Carbon 22 
+2.3   Lithium Intercalation into Carbonaceous Materials 24 
+2.3.1 Lithium Intercalation into Graphitic Carbon Materials 24 
+2.3.1-1  Description 24 
+2.3.1-2  Charge/Discharge Profile of Graphitic Carbon Materials 26 
+2.3.2  Lithium Intercalation into Non-graphitic Carbon Materials 29 
+2.3.2-1  Low Specific Charge Carbon 29 
+2.3.2-2  High Specific Charge Carbon 31 
+2.4  Summary of Chapter Two 36 
+Bibliography of Chapter 2 38 
+ 
+15 
+ 
+CHAPTER TWO 
+Carbonaceous Materials as an Anode of Li-Ion Battery 
+2.1 Operation Mechanism of Li-Ion Battery 
+Carbon as one of the most abundant elements on earth plays a critical role in 
+the development of human society. For thousands of years, human history is 
+closely associated with the struggle to extract and utilize the power from carbon 
+materials. Carbonaceous materials have been adopted in various electrochemical 
+energy storage systems previously. This was motivated by the good electrical 
+conductance of sp$^2$-hybridized solid carbon, its high chemical stability, and its 
+enormous adaptability to different interface processes [1]. Li-ion battery is one 
+typical example to utilize the carbonaceous materials in energy storage devices. 
+Commercialized LIB usually consists of layered LiCoO2 as a cathode and 
+carbonaceous materials as an anode. These two electrodes are usually separated 
+by a porous polymer membrane and the ionic transport within the cell is ensured 
+by an aprotic organic electrolyte which is a good ionic conductor and electronic 
+insulator [2]. Nowadays, the most common electrolyte is a solution of LiPF6 in a 
+mixture of alkyl carbonates such as ethylene carbonate, diethyl carbonate, and 
+dimethyl carbonate which provides high-permittivity and low-viscosity.  
+ 
+In common Li-ion battery cells, during the charging process, Li ions are 
+extracted from the LiCoO2 electrode (cathode) and simultaneously 
+16 
+ 
+inserted/intercalated into the carbon electrode (anode) by forming a 
+lithium/carbon intercalation compound indicated as LixCn, coupled with 
+negatively charged electrons to keep overall charge neutrality, as shown on the 
+left side of Figure 2.1. During the discharging process, Li ions are reversibly 
+extracted/deintercalated from the negative electrode and simultaneously inserted 
+into the positive electrode, as shown on the right side of Figure 2.1. This 
+charge/discharge process can be summarized by the typical chemical equations as 
+shown below [3]: 
+ 
+Figure 2.1. Schematic illustration of detailed charge/discharge 
+process in Li-ion battery. 
+ 
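+Positive Electrode:   LiCoO$_2$ $\rightleftharpoons$ Li$_{1-x}$CoO$_2$ + $x$Li$^+$ + $x$e$^-$
+Negative Electrode:  C$_n$ + $x$Li$^+$ + $x$e$^-$ $\rightleftharpoons$ Li$_x$C$_n$
+           Overall:            LiCoO$_2$ + C$_n$ $\rightleftharpoons$ Li$_{1-x}$CoO$_2$ + Li$_x$C$_n$ 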
+17 
+ 
+Compared to ECs whose electrodes are composed of same materials which 
+therefore exhibit the same potential, an inherent potential difference exists 
+between LiCoO2 and carbonaceous material in LIB, as simply indicated in 
+Figure 2.2. The original potentials of LiCoO2 and carbon materials are usually ~ 
+4 V and ~ 0.2-0.5 V (depending on types of carbon) vs. Li/Li$^+$, respectively [2,4]. 
+During the charge process, the cathode will release Li$^+$ under the influence of 
+external power and the potential of the cathode will increase to 4.2 V, whereas the 
+anode potential will decrease to approximately 0.01 V vs. Li/Li$^+$ upon Li ion 
+insertion, thus delivering an output voltage of nearly 4 V to the external load. 
+Here, the cut off voltage of LiCoO2 and graphite is usually limited to 4.2 
+(corresponding to a removal of 0.5 mol Li) and 0.01 V in order to maintain the 
+structural stability [5]. On the other hand, during the spontaneous discharge 
+process, Li0.5CoO2 needs to go back to its original potential state which is more 
+energetically stable therefore Li ions go back to Li0.5CoO2 and the electrode 
+potential goes back to the original state, and the system is thus ready for the next 
+charge process.  
+ 
+ 
+ 
+ 
+ 
+ 
+18 
+ 
+Figure 2.2. Potential profile of anode and cathode during 
+charge/discharge. 
+ 
+The discovery of different carbon allotropes associated with nanoscience 
+and nanotechnology provided us a room to further improve the performance of 
+anode material. Therefore, carbonaceous material used as an anode in LIB is 
+chosen to be the main focus in this work. Before moving to the details, we 
+summarize one more time the advantages of carbon-based anode material. 
+Compared to transition-metal oxides and chalcogenides, carbonaceous materials 
+such as graphite and hard carbons are more preferable not only because of (1) the 
+unstable inherent nature of the transition-metal oxides and chalcogenides 
+materials as mentioned at the end of Chapter 1 and (2) the dimensional stability 
+and good conductivity of carbonaceous materials, but also (3) the lowest 
+potential versus Li/Li$^+$ which gives higher output cell voltage compared to other 
+composite alloys, three dimensional metal oxides and so on. For instance, the 
+potential of many Li alloys is ~0.3 to ~1.0 V vs. Li/Li$^+$ whereas it is only ~0.1 V 
+vs. Li/Li$^+$ for graphite, as indicated in Figure 2.3 [6]. 
+ 
+ 
+ 
+ 
+ 
+19 
+ 
+  
+ 
+ 
+ 
+ 
+ 
+Figure 2.3. Charge curves of different metals (M) with respect to 
+highly oriented turbostratic pitch carbon fibers. Cited from Ref. [6].  
+ 
+One good carbonaceous anode material needs to fulfill high capacity, long 
+cycle life, fast charge etc. in addition to high energy/power density, good 
+conductivity and stability, as mentioned above. A charge/discharge curve can be 
+used as one of the most straightforward tools to demonstrate the storage 
+capability, cyclic ability, rate of charge/discharge. The charge/discharge curve 
+(capacity-voltage curve) is converted from a voltage-time profile with one or 
+several constant current densities that are fixed in advance. The capacity (mAh) 
+therefore equals the current (mA) multiplied by the time (h). The charge/discharge 
+curve usually exhibits very different features according to the structure of carbon 
+materials. Thus, in order to further improve the performance of carbonaceous 
+anode and to assist in explaining the phenomenon of nanocarbon-based anode 
+later, the classification of carbon materials upon the structure and also their 
+20 
+ 
+associated charge/discharge profiles need to be elaborated first. The related topics 
+are explained in detail in the following section. 
+ 
+2.2 Classification of Carbonaceous Materials 
+Carbonaceous materials that are capable of reversible lithium reaction can 
+be roughly classified into two categories according to their structures: graphitic 
+and non-graphitic (disordered) carbon. The non-graphitic carbon can be further 
+categorized into soft carbon/hard carbon upon annealing and high specific charge 
+carbon/low specific charge carbon according to the capability of reversible 
+lithium storage. Charge/discharge behaviors of each type of carbon are presented 
+and analyzed in detail in the following context.  
+ 
+2.2.1 Graphitic Carbon 
+Graphitic carbon is a well-defined layered structure. Normally, a number of 
+structural defects could appear in graphitic carbon. The term of “graphite” was 
+derived from crystallographic point of view which should be only applied to 
+carbons whose layered lattice structure follows a perfect stacking order of 
+graphene layers. That is to say it contains the layer stacking order of either the 
+common AB (hexagonal graphite, Figure 2.4 and Figure 2.5a) or the rather rare 
+ABC (rhombohedral graphite). However, since the transformation energy from 
+AB stacking to ABC stacking (and vice versa) is rather small, perfectly stacked 
+graphite crystals are not readily available. Therefore the term of “graphite” is 
+21 
+ 
+often used regardless of well-defined stacking order [7]. The terms of natural 
+graphite, artificial graphite, and pyrolytic graphite are commonly used, although 
+the materials are polycrystalline [8]. The actual structure of carbonaceous 
+materials typically deviates more or less from the ideal graphite structure. 
+Materials consisting of aggregates of graphite crystallites are called graphites as 
+well. 
+Figure 2.4. Left: Schematics of the crystal structure of hexagonal 
+graphite with an AB stacking order. Right: view perpendicular to the 
+basal plane of graphite. Edges can be subdivided into arm-chair and 
+zigzag faces. Cited from Ref. [7]. 
+ 
+2.2.2 Non-Graphitic Carbon 
+Non-graphitic (disordered) carbonaceous materials consist of carbon atoms 
+that are mainly arranged in a planar hexagonal network but no crystallographic 
+order in the c-direction compared to graphite, as shown in Figure 2.5c [7,9]. The 
+22 
+ 
+structure of those carbons is characterized by amorphous areas embedded and 
+cross-linked in the network. Non-graphitic carbons are mostly prepared by 
+pyrolysis of organic polymer or hydrocarbon precursors at temperature below 
+~1500°C [10-12].  
+      (a) graphite      (b) graphitizable carbon   (c) non-graphitizable carbon 
+Figure 2.5. Schematic indications of (a) graphite and (b) non-
+graphitic (disordered) carbonaceous material. 
+ 
+Heat treatment of most non-graphitic carbons (from ~1500 to ~3000°C) 
+allows us to further classify non-graphitic carbon into two sub-categories: soft 
+carbon and hard carbon. In the case of soft carbons, crosslinking between the 
+carbon layers is weak and therefore the layers are mobile enough to form 
+graphite-like crystallites and develop the graphite structure continuously during 
+the heating process, as shown in Figure 2.5b [9]. In the case of hard carbons, 
+since the carbon layers are immobilized by crosslinking, they show no real 
+development of the graphite structure even at temperatures of 2500 ~ 3000 °C 
+[10]. The representative figure is shown in Figure 2.5c. 
+23 
+ 
+2.3 Lithium Intercalation into Carbonaceous Materials 
+2.3.1 Lithium Intercalation into Graphitic Carbon Materials 
+2.3.1-1 Description 
+Lithium-intercalated graphitic carbon compounds (GICs) are known with 
+the configuration LixCn. It is well known that Li intercalation reaction occurs 
+only at the edge plane of graphite. Through the basal plane, intercalation is 
+possible only at defect sites [13-16]. The maximum lithium content for highly 
+crystalline graphitic carbons is one Li guest atom per six carbon host atoms (i.e. 
+$n \geq 6$ in LiC$_n$ or $x \leq 1$ in Li$_x$C$_6$) at ambient pressure [17]. That is to say, it follows 
+the equation below:  
+ 
+6C + $x$Li$^+$ + $x$e$^-$ $\rightleftharpoons$ Li$_x$C$_6$, where $x = 1$ in Li$_x$C$_6$ (the maximum Li content). 
+ 
+In LiC6, lithium avoids occupying the nearest neighbor sites due to the 
+Coulombic repulsive force of Li, as shown in Figure 2.6. Two major changes in 
+the graphite structure occur when Li intercalates into graphite layers: (1) 
+the stacking order of the carbon layers (i.e. graphene layers) shifts to AA stacking, 
+see Figure 2.6a and Figure 2.6c. (2) The interlayer distance between the 
+graphene layers increases moderately (10.3% has been calculated for LiC6) due 
+to the lithium intercalation, as indicated in the right panel in Figure 2.6a [18-21]. 
+24 
+ 
+      
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 2.6. Structure indications of LiC6. (a) Left: schematic 
+drawing showing the AA layer stacking sequence with Li 
+intercalation. Right: simplified representation. (b) Perpendicular 
+view to the basal plane of LiC6. (c) Enlarged schematic of AA 
+stacking order. Cited and modified from Ref. [20-21]. 
+ 
+An important feature of Li intercalation into graphite is the “stage 
+formation”. Stage formation means a stepwise formation of a periodic pattern of 
+unoccupied graphitic layer gaps at low concentrations of Li [23-31]. This 
+stepwise process can be described by the stage index, s (s = I, II, III, IV) which is 
+equal to the number of graphene layers between two nearest guest layers as 
+shown in Figure 2.7. Note that stage IV is not indicated in the figure because Li 
+concentration is too low in graphene layers. It is also known as a dilute stage 
+25 
+ 
+when s > IV [32]. Two factors determine the formation of stages during Li 
+intercalation into graphite i) the energy required to expand van der Waals gap 
+between two graphene layers [31,33] and ii) the repulsive interactions between 
+guest species. Therefore, compared to a random distribution of Li in the graphitic 
+layers during charge process, Li ions prefer to occupy van der Waals gaps with 
+high density first to reach an energetically stable state [7]. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+      
+     Figure 2.7. Schematic indication of stage formation during Li ion      
+     intercalation into graphite layers. 
+ 
+2.3.1-2 Charge/Discharge Profile of Graphitic Carbon Materials 
+Stage formation as mentioned above is one of the most important 
+characteristics of the charge profile for graphitic carbon. It can be easily observed in 
+the form of plateaus by constant current measurement (i.e. in charge/discharge 
+curve), as indicated in Figure 2.8. The associated stages are marked in bottom 
+26 
+ 
+panel of the figure. The plateaus indicate the coexistence of two phases [24,34]. 
+The formation of stages II, IIL (a transition stage of stage II and stage III), III, 
+and IV have been identified from experimental electrochemical curves [18,35,37-
+40] and confirmed by X-ray diffraction and Raman spectroscopy [17,25,27-
+28,35-38]. A schematic potential / composition curve for galvanostatic reduction 
+of graphite to LiC6 is shown in the bottom panel in Figure 2.8.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 2.8. Constant current charge/discharge curves of the graphite 
+(Timrex KS 44, Cirr is the irreversible specific charge, and Crev is the 
+reversible specific charge). Modified and replotted from Ref. [7]. 
+27 
+ 
+Ideally, Li$^+$ intercalation into carbons should be fully reversible and the 
+maximum Li storage capacity should not exceed 372 mAh/g according to the LiC6 
+configuration. However, the charge accumulated in the first cycle is usually larger 
+than the maximum theoretical specific capacity, as shown in Figure 2.8. 
+Compared to the first charge, the first discharge capacity is much smaller. The 
+excess charge generated in the first cycle which cannot be recovered can be 
+ascribed to the film formation of the solid electrolyte interface (SEI) which is 
+caused by the decomposition of the Li$^+$-containing electrolyte, such as propylene 
+carbonate and ethylene carbonate [41-46]. The decomposition of electrolyte 
+usually takes place at less than 1 V vs. Li/Li$^+$ and appears as the first plateau in 
+the charge curve, as indicated in Figure 2.8 [47]. The advantage of the SEI 
+formation is that it can prevent further electrolyte decomposition and create a 
+rather stable state for the surface of GIC [48-53]. On the other hand, the 
+formation of SEI is a charge-consuming side reaction in the first few Li$^+$ 
+intercalation/deintercalation cycles, especially in the 1$^{st}$ charge cycle. 
+Considering that the positive electrode is responsible to provide the Li ion in LIB, 
+the charge and lithium losses are detrimental to the specific energy of the whole 
+cell and have to be minimized. Because of the irreversible consumption of 
+lithium and electrolyte, a corresponding charge loss exists, so called “irreversible 
+specific charge” as indicated in Figure 2.8. The reversible lithium intercalation is 
+called “reversible specific charge”.  
+ 
+28 
+ 
+2.3.2 Lithium Intercalation into Non-Graphitic Carbon Materials 
+According to the capability of reversible lithium storage, non-graphitic 
+carbons can be further classified into two categories: high specific charge carbon 
+and low specific charge carbon.  
+ 
+2.3.2-1 Low Specific Charge Carbon 
+(i) Definition 
+Low specific charge carbons are carbonaceous materials which incorporate 
+only a considerably lower amount of lithium than graphite. That is to say, it follows 
+the equation below:  
+ 
+6C + $x$Li$^+$ + $x$e$^-$ $\rightleftharpoons$ Li$_x$C$_6$, where $x$ = 0.5~0.8 in Li$_x$C$_6$ at the maximum 
+stoichiometry.  
+ 
+(ii) Examples of Low Specific Charge Carbon 
+Cokes [68,77-83] and carbon blacks [81,84-85] are typical disordered 
+carbons with low specific charges. During the charge process, Li intercalation-
+induced formation of AA stacking is hindered due to the existence of crosslinking 
+of carbon sheets as mentioned in Section 2.2.2. This will eventually affect the 
+accommodation of a higher Li amount into graphitic sites and deliver a lower 
+specific charge [86-88].  
+  
+29 
+ 
+Turbostratic carbon [43,86-90] which can also be classified into the category 
+of graphitizing/soft carbon is one type of low specific charge carbon. The lower 
+amount of Li intercalation than graphite is due not only to the effect of 
+crosslinking as mentioned for cokes and carbon blacks, but also to the larger amount of 
+wrinkled and buckled structural segments existing in the structure. Thus, the number of 
+available lithium intercalation sites is rather low, and therefore the specific charge is 
+lower than that of graphite [91-92]. 
+ 
+(iii) Charge/Discharge Profile of Low Specific Charge Carbon 
+Figure 2.9 shows the first Li$^+$ intercalation/deintercalation cycle of a coke-
+containing electrode. The potential profile of low specific charge carbon differs 
+considerably from that of graphite, as the reversible intercalation of Li$^+$ begins at 
+around 1.2 V vs. Li/Li$^+$, and the curve slopes without distinguishable plateaus. 
+This behavior is a consequence of the disordered structure providing 
+electronically and geometrically nonequivalent sites, whereas for a particular 
+intercalation stage in highly crystalline graphite, the sites are equivalent [93-94]. 
+30 
+ 
+  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 2.9. Constant current charge/discharge curves of a coke (Conoco). 
+(Cirr is the irreversible specific charge, Crev the reversible specific charge). 
+Cited and redrawn from Ref. [7]. 
+ 
+2.3.2-2 High Specific Charge Carbon 
+(i) Definition 
+High specific charge carbons can store more lithium than graphite. That is to 
+say it follows the equation as below:  
+31 
+ 
+6C + $x$Li$^+$ + $x$e$^-$ $\rightleftharpoons$ Li$_x$C$_6$, where $x > 1$ in Li$_x$C$_6$.  
+ 
+Li storage capacity of high specific charge carbons could vary from 400 
+Ah/kg to ~2000 Ah/kg which corresponds to x = ~1.2 to ~5 in LixC6. The 
+difference in the capacity depends on the heat treatment temperature, organic 
+precursor, and electrolyte. Even though the higher specific capacity (in terms of 
+Ah/kg) is desired in LIB, a larger volume of the carbonaceous matrix is usually 
+needed to accommodate the excess intercalated Li which indicates lower charge 
+density in terms of Ah/L [7].  
+ 
+(ii) Origin of the Excess Charges 
+Several different scenarios have been proposed in order to explain 
+the origin of excess charges. These different models provide an intuitive 
+understanding even though some of them are still debatable [54-58]. A few 
+well known examples are listed below. Extra capacity can be realized 
+through: (1) The formation of Li2 molecules between layers which indicates 
+that lithium molecules occupy the nearest neighbor sites in intercalated 
+carbons [59]. (2) The presence of charged Li$^+$ clusters in the cavities [60]. 
+(3) The “adsorption” of lithium on both sides of single-layer sheets that are 
+arranged like “falling cards” [61]. All of these mechanisms are indicated in 
+Figure 2.10.  
+32 
+ 
+  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 2.10. a) Storage mechanisms of Li ions in graphite. b) Li 
+storage in a form of Li2 covalent molecules. c) Schematic model of Li 
+storage in cavities and nanopores. d) Li adsorption on the two sides of 
+an isolated graphene sheet. Cited from Ref. [3]. 
+ 
+(iii) Charge/discharge Profile of High Specific Charge Carbon 
+For both graphitizing (soft) and non-graphitizing (hard) carbons prepared at < 
+1000 °C, the typical charge/discharge profile is shown in Figure 2.11. 
+33 
+ 
+  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 2.11. Constant current charge/discharge curves (1$^{st}$ and 2$^{nd}$ cycle) of 
+a high specific charge carbon material after heat treatment at 700 °C. (Cirr 
+is the irreversible specific charge, Crev the reversible specific charge). Cited 
+and redrawn from Ref. [7]. 
+ 
+It is clear that an SEI-related plateau appears at around 0.6 V and a high 
+specific charge of around 3720 Ah/kg was achieved during the first charge, as 
+34 
+ 
+shown in the top panel in Figure 2.11. The special feature of this kind of carbon 
+material is that it exhibits a larger voltage hysteresis between charge and 
+discharge processes compared to that of graphite (Figure 2.8). To be more 
+specific, the second charge/discharge is shown at the bottom of Figure 2.11 
+which does not show the effect of SEI. The potential for Li insertion is close to 0 
+V vs. Li/Li$^+$ whereas the one for Li de-insertion is much more positive [54-55,62-
+65] in the second charge/discharge process. According to the previous study, it 
+has been shown that the extent of hysteresis is proportional to the hydrogen 
+content in the carbon since Li is somehow bound near the hydrogen [66-67]. 
+ 
+Since hydrogen can be removed with increasing temperature, the specific 
+charges achieved after the removal of hydrogen need to be evaluated. It was 
+found that the value of specific charge after high temperature annealing strongly 
+depends on the structure of the non-graphitic material [55,65,68-75]. (i) In the 
+case of soft carbon, it will deliver a lower value of specific charge (x < ~0.5 in 
+LixC6) which is similar to the low specific charge carbon [54,75-76], when heat 
+treated at ~1000 °C. And the specific charge again increases when the 
+temperature is > 1000 °C [73,74]. (ii) In the case of hard carbon, it can still 
+display a specific charge of several hundred Ah/kg when heat-treated at ~1000 °C. 
+But Li inserts at a very low potential of a few millivolts versus Li/Li$^+$ and a 
+smaller hysteresis is shown in the charge/discharge profile. In contrast to soft carbon, 
+a drastic reduction of specific charge is observed when the temperature is > 
+35 
+ 
+1000 °C [72,76].  
+ 
+Although the high specific charge carbons show much higher specific 
+capacity than graphite, they have some serious drawbacks such as higher 
+irreversible specific charges, larger hysteresis and poorer cycling performance 
+than graphite [54-55,62,95-96,98,100-101,103-104]. Although the cycling 
+performance of non-graphitizing (hard) carbons heat-treated at ~1000 °C is 
+reasonable and almost no hysteresis occurs, the end of the charge potential of the 
+carbons is very close to metallic lithium [62,75,102]. Under such a charging 
+regime, lithium deposition occurs, which will induce safety issue like Li-metal 
+battery [7]. 
+ 
+2.4 Summary of Chapter Two 
+The operation mechanism of Li-ion battery and the charge/discharge 
+behavior based on different types of carbonaceous materials were generally 
+reviewed in this chapter. This kind of information provides fundamental 
+knowledge to characterize and understand the anodic behavior of nanoscaled 
+carbon materials which will be covered in Chapter 3. 
+ 
+Based on this chapter, it is clear that there are still many unsolved 
+issues related to carbonaceous materials. In the case of graphite, it exhibits good 
+cyclic performance and structure stability but the capacity is limited. On the 
+36 
+ 
+contrary, in the case of high specific charge carbon, the capacity is higher than that of 
+graphite but the long-term stability and safety issues remain unsolved.  
+ 
+Although the current understanding of the origins of excess charge is limited, 
+it is clear that numerous factors such as surface area, crystallinity, defect 
+population, basal/edge plane effects and so on could affect the storage capacity. 
+Compared to graphite, the analysis of non-graphitic carbon is more complicated 
+since so many unpredictable factors exist. Before the Li storage mechanisms can 
+be understood and high capacity anode materials realized, one preliminary 
+issue still remains unclear: the Li diffusion pathway in carbonaceous 
+materials. Therefore, further understanding of the Li diffusion pathway through 
+the graphene plane and of the role of defects in Li diffusion is required to 
+provide more information to reveal the mystery of the Li-C system. In order to 
+improve the limited capacity of graphite and also to overcome various problems 
+in non-graphitic carbons, incorporation of a second material which contains 
+higher Li storage capacity on rather stable carbon matrix could be an alternative 
+way to satisfy the requirements on anode part. The related issues will be further 
+discussed in Chapter 4.  
+ 
+ 
+ 
+37 
+ 
+Bibliography of Chapter Two 
+[1] S. L. Candelaria, Y. Y. Shao, W. Zhou, X. L. Li, J. Xiao, J. G. Zhang, Y. 
+Wang, J. Liu, J. H. Li, G. Z. Cao, Nano Energy 2012, 1,195. 
+[2] J. M. Tarascon, M. Armand, Nature 2001, 414, 359. 
+[3] D. S. Su, R. Schlögl, ChemSusChem 2010, 3, 136. 
+[4] B. Xu, D. Qian, Z. Wang, Y. Meng, Materials Science and Engineering 
+R 2012, 73, 51.. 
+[5] T. Ohzuku, A. Ueda, N. Nagayama, Y. Iwakoshi, H. Komori, 
+Electrochim Acta 1993, 38, 1159. 
+[6] J. O. Besenhard, J. Yang, M. Winter, J. Power Sources 1997, 68, 87. 
+[7] M. Winter, J. O. Besenhard, M. E. Spahr, P. Novák, Adv. Mater. 1998, 
+10, 725 
+[8] H. O. Pierson, Handbook of Carbon, Graphite, Diamond and Fullerenes, 
+Noyes, Park Ridge, NJ 1993, 43. 
+[9] I. Mochida, S. Yoon, W. Qiao, J. Braz. Chem. Soc. 2006, 17 (6), 1059. 
+[10] R. E. Franklin, Proc. R. Soc. London A 1951, 209, 196.. 
+[11] K. Kinoshita, Carbon: Electrochemical and Physicochemical Properties 
+1987 Wiley, New York.. 
+[12] K. Inada, K. Ikeda, Y. Sato, A. Itsubo, M. Miyabashi, H. Yui, in Primary 
+and Secondary Ambient Temperature Lithium Batteries (Eds: J.-P. 
+Gabano, Z. Takehara, P. Bro), Electrochemical Society, Pennington, NJ 
+1988, 88-6, 530. 
+[13] T. Tran, K. Kinoshita, J. Electroanal. Chem. 1995, 386, 221. 
+[14] K. Persson, A. V. Sethuraman, J. L. Hardwick, Y. Hinuma, S. Y. Meng,   
+38 
+ 
+A. Ven, V. Srinivasan, R. Kostecki, G. Ceder, Phys. Chem. Lett. 2010, 1,  
+1176. 
+[15] T. Placke, V. Siozios, R. Schmitz, S. F. Lux, P. Bieker, C. Colle, H.-W. 
+Meyer, S. Passerini, M. Winter, J. Power Sources 2012, 200, 83. 
+[16] B. Jungblut, E. Hoinkis, Phys. Rev. B 1989, 40, 10810. 
+[17] T. D. Tran, K. Kinoshita, J. Electroanal. Chem. 1995, 386, 22. 
+[18] D. Billaud, E. McRae, A. Hérold, Mater. Res. Bull. 1979, 14, 857. 
+[19] X. Y. Song, K. Kinoshita, T. D. Tran, J. Electrochem. Soc. 1996, 143, 
+L120. 
+[20] H. H. Lee, C. C. Wan, Y. Y. Wang, Journal of Power Sources 2003,1,7. 
+[21] C. Casas, W. Li, Journal of Power Sources 2012, 208, 74. 
+[22] E. Jomehzadeh, A. R. Saidi, N. M. Pugno, Physica E: Low-dimensional 
+Systems and Nanostructures 2012, 44 (10), 1973. 
+[23] J. O. Besenhard, H. P. Fritz, Angew. Chem. Int. Ed. 1983, 95,950. 
+[24] A. Hérold, Chemical Physics of Intercalation 1987 (Eds: A. P. 
+Legrand,S. Flandrois), NATO ASI Series B, 172, 3. 
+[25] A. Hérold, Bull. Soc. Chim. Fr. 1955, 187, 999. 
+[26] W. Rüdorff, U. Hofmann, Z. Anorg. Allg. Chem. 1938, 238, 1. 
+[27] N. Daumas, A. Hérold, C. R. Acad. Sci. Paris 1969, 268C, 373. 
+[28] N. Daumas, A. Hérold, Bull. Soc. Chim. 1971, 5, 1598. 
+[29] L. B. Ebert, Annu. Rev. Mater. Sci. 1976, 6, 181. 
+[30] W. Rüdorff, Advances in Inorganic Chemistry and Radiochemistry 1959, 
+39 
+ 
+(Eds: H. J. Eméleus, A. G. Sharpe), Academic, New York, 1, 223. 
+[31] R. Schlögl, Progress in Intercalation Research 1994 (Eds: W. Müller-
+Warmuth, R. Schöllhorn), Kluwer, Dordrecht, The Netherlands, 83. 
+[32] D. Billaud, F. X. Henry, M. Lelauraint, P. Willmanns, J. Phys. Chem. 
+Solids 1996, 57(6-8), 775. 
+[33] J. O. Besenhard, M. Winter, Proc. of the 2. Ulmer Elektrochemische 
+Tage, Ladungsspeicherung in der Doppelschicht 1995 (Ed: W. 
+Schmickler), Universitätsverlag Ulm, Germany, 47. 
+[34] J. R. Dahn, Phys. Rev. B 1991, 44, 9170. 
+[35] J. E. Fisher, Chemical Physics of Intercalation 1987 (Eds: A. P. Legrand, 
+S. Flandrois), NATO ASI Series B, 172, 59. 
+[36] M. Bagouin, D. Guerard, A. Hérold, C. R. Acad. Sci. Paris 1966, 262C, 
+557. 
+[37] C. Casas, W. Li, Journal of Power Sources 2012, 208, 74. 
+[38] P. Pfluger,V. Geiser, S. Stolz, H.-J. Güntherodt, Synth. Met. 1981, 3, 27. 
+[39] D. Billaud, F. X. Henry, P. Willmann, Mater. Res. Bull. 1993, 28, 477. 
+[40] D. Billaud, F. X. Henry, P. Willmann, Mol. Cryst. Liq. Cryst. 1994, 245, 
+159. 
+[41] J. R. Dahn, A. K. Sleigh, H. Shi, B. M. Way, W. J. Weydanz, J. N. 
+Reimers, Q. Zhong, U. von Sacken, Lithium Batteries: New Materials, 
+Developments and Perspectives 1994 (Ed: G. Pistoia), Elsevier, 
+Amsterdam, 1. 
+[42] R. Fong, U. von Sacken, J. R. Dahn, J. Electrochem. Soc. 1990, 137, 
+40 
+ 
+2009. 
+[43] K. Yokoyama, N. Nagawa, New Sealed Rechargeable Batteries and 
+Supercapacitors 1993 (Eds: B. M. Barnett, E. Dowgiallo, G. Halpert, 
+Y.Matsuda, Z. Takehara), Electrochemical Society, Pennington, NJ, 
+PV93-23, 270. 
+[44] R. Kanno, Y. Kawamoto, Y. Takeda, S. Ohashi, N. Imanishi, O. 
+Yamamoto, J. Electrochem. Soc. 1992, 139, 3397. 
+[45] M. Winter, P. Novák, A. Monnier, J. Electrochem. Soc. 1998, 145, 428. 
+[46] F. Joho, P. Novák, O. Haas, A. Monnier, F. Fischer, Mol. Cryst. Liq. 
+Cryst., in press. 
+[47] P. G. Bruce, B. Scrosati, J. M. Tarascon, Angew. Chem. Int. Ed. 2008, 47, 
+2930. 
+[48] S. Mori, H. Asahina, H. Suzuki, A. Yonei, E. Yasukawa, J. Power 
+Sources 1997, 68, 59. 
+[49] Y. Ein-Eli, B. Markovsky, D. Aurbach, Y. Carmeli, H. Yamin, S. Luski, 
+Electrochim. Acta 1994, 39, 2559. 
+[50] D. Aurbach, Y. Ein-Eli, B. Markovsky, A. Zaban, A. Schechter, S. Luski, 
+Y. Carmeli, H. Yamin, Rechargeable Lithium and Lithium- Ion Batteries 
+1995 (Eds: S. Megahed, B. M. Barnett, L. Xie), Electrochemical Society, 
+Pennington, NJ, PV94-28, 26. 
+[51] D. Aurbach, Y. Ein-Eli, B. Markovsky, A. Zaban, S. Lusky, Y. Carmeli, 
+H. Yamin, J. Electrochem. Soc. 1995, 142, 2882. 
+[52] D. Aurbach, Y. Ein-Eli, O. Chusid, Y. Carmeli, M. Babai, H. Yamin, J. 
+Electrochem. Soc. 1994, 141, 603. 
+41 
+ 
+[53] D. Aurbach, Y. Ein-Eli, J. Electrochem. Soc. 1995, 142, 1746. 
+[54] T. Zheng, J. S. Xue, J. R. Dahn, Chem. Mater. 1996, 8, 389. 
+[55] T. Zheng, Y. Liu, E. W. Fuller, S. Tseng, U. von Sacken, J. R. Dahn, J. 
+Electrochem. Soc. 1995, 142, 2581. 
+[56] L. B. Ebert, Carbon 1996, 34, 671. 
+[57] J. R. Dahn, T. Zheng, Y. Liu, J. S. Xue, Science 1995, 270, 590. 
+[58] P. Zhou, P. Papanek, C. Bindra, R. Lee, J.E. Fischer, J. Power Sources 
+1997, 68, 297. 
+[59] K. Sato, M. Noguchi, A. Demachi, N. Oki, M. Endo, Science 1994, 264, 
+556. 
+[60] M. Winter, J. O. Besenhard, Lithium Ion Battery: Fundamentals and 
+Performance 1998 (Eds.: M. Wahihara, O. Yamamoto), Wiley-VCH, 
+Weinheim. 
+[61] T. Zheng, W. Xing, J. R. Dahn, Carbon 1996, 34, 1501.. 
+[62] J. S. Xue, J. R. Dahn, J. Electrochem. Soc. 1995, 142, 3668. 
+[63] J. R. Dahn, J. S. Xue,W. Xing, A. M.Wilson, A. Gibaud, Extended 
+Abstracts of the 8th Int. Mtg. on Lithium Batteries 1996, Nagoya, Japan, 
+89. 
+[64] T. Zheng, J. R. Dahn, J. Power Sources 1997, 68, 201. 
+[65] T. Zheng, W. R. McKinnon, J. R. Dahn, J. Electrochem. Soc. 1996, 143, 
+2137. 
+[66] S. Wang, Y. Zhang, L. Yang, Q. Liu, Solid State Ionics 1996, 86, 919. 
+[67] P. Zhou, P. Papanek, R. Lee, J.E. Fisher, W. A. Kamitakahara, J. 
+42 
+ 
+Electrochem. Soc. 1997, 144, 1744. 
+[68] A. Satoh, N. Takami, T. Ohsaki, Solid State Ionics 1995, 80, 291. 
+[69] A. Satoh, N. Takami, T. Ohsaki, M. Kanda, Rechargeable Lithium 
+and Lithium-Ion Batteries 1995 (Eds: S. Megahed, B. M. Barnett, L. 
+Xie), Electrochemical Society, Pennington, NJ, PV94-28,143. 
+[70] K. Tatsumi, A. Mabuchi, N. Iwashita, H. Sakaebe, H. Shioyama, H. 
+Fujimoto, S. Higuchi, Batteries and Fuel Cells for Stationary and 
+Electric Vehicle Applications1993 (Eds: A. R. Landgrebe, Z. Takehara) 
+Electrochemical Society, Pennington, NJ, PV 93-8, 64. 
+[71] A. Mabuchi, H. Fujimoto, K. Tokumitsu, T. Kasuh, J. Electrochem. 
+Soc. 1995, 142, 3049. 
+[72] K. Tokumitsu, A. Mabuchi, H. Fujimoto, T. Kasuh, Rechargeable 
+Lithium and Lithium-Ion Batteries1995 (Eds: S. Megahed, B. M. Barnett, 
+L. Xie), Electrochemical Society, Pennington, NJ, PV94-28,136. 
+[73] K. Tatsumi, T. Akai, T. Imamura, K. Zaghib, N. Iwashita, S. Higuchi,Y. 
+Sawda, J. Electrochem. Soc. 1996, 143, 1923. 
+[74] K. Tatsumi, N. Iwashita, H. Sakaebe, H. Shioyama, S. Higuchi, A. 
+Mabuchi, H. Fujimoto, J. Electrochem. Soc. 1995, 142, 716. 
+[75] Y. Liu, J. S. Xue, T. Zheng, J. R. Dahn, Carbon 1996, 34, 193. 
+[76] H, Iomoto, A. Omaru, A. Azuma, Y. Nishi, Lithium Batteries 1993 (Eds: 
+S. Surampudi, V. R. Koch), Electrochemical Society, Pennington, NJ, 
+PV93-24, 9. 
+[77] J. R. Dahn, A. K. Sleigh, H. Shi, J. N. Reimers, Q. Zhong, B. M. Way, 
+43 
+ 
+Electrochim. Acta 1993, 38, 1179. 
+[78] M. Jean, C. Desnoyer, A. Tranchant, R. Messina, J. Electrochem. Soc. 
+1995, 142, 2122. 
+[79] R. V. Moshtev, P. Zlatilova, B. Puresheva, V. Manev, J. Power Sources 
+1995, 56, 137. 
+[80] J. M. Chen, C. Y. Yao, C. H. Cheng, W. M. Hurng, T. H. Kao, J. Power 
+Sources 1995, 54, 494. 
+[81] A. K. Sleigh, U. von Sacken, Solid State Ionics 1992, 57, 99. 
+[82] S. Ma, J. Li, X. Jing, F. Wang, Solid State Ionics 1996, 86-88, 911. 
+[83] R. Alcántara, J. M. Jiménez-Mateos, P. Lavela, J. Morales, J. L. Tirado, 
+Mater. Sci. Eng. 1996, B39, 216. 
+[84] K. Takei, N. Terada, K. Kumai, T. Iwahori, T. Uwai, T. Miura, J. Power  
+Sources 1995, 55, 191. 
+ 
+[85] K. Takei, K. Kumai, Y. Kobayashi, H. Miyashiro, T. Iwahori, T. Uwai, 
+T. Miura, J. Power Sources 1995, 54, 171. 
+[86] T. Zheng, J. R. Dahn, Synth. Met. 1995, 73, 1. 
+[87] T. Zheng, J. R. Dahn, Phys. Rev. B 1996, 53, 3061. 
+[88] T. Zheng, J. N. Reimers, J. R. Dahn, Phys. Rev. B 1995, 51, 734. 
+[89] B. Di Pietro, M. Patriarca, B. Scrosati, J. Power Sources 1982, 8, 289. 
+[90] K. Sawai, Y. Iwakoshi, T. Ohzuku, Solid State Ionics 1994, 69, 273. 
+[91] J. O. Besenhard, Progress in Intercalation Research 1994 (Eds: W. 
+44 
+ 
+Müller-Warmuth, R. Schöllhorn), Kluwer, Dordrecht, The Netherlands,    
+457. 
+[92] J. O. Besenhard, Soft Chemistry Routes to New Materials1994 (Eds: J. 
+Rouxel, M. Tournoux, R. Brec), Materials Science 152, Trans Tech, 
+Aedermannsdorf, Switzerland, 13. 
+[93] J. R. Dahn, A. K. Sleigh, H. Shi, B. M. Way, W. J. Weydanz, J. N. 
+Reimers, Q. Zhong, U. von Sacken, Lithium Batteries: New Materials, 
+Developments and Perspectives1994 (Ed: G. Pistoia), Elsevier, 
+Amsterdam, 1. 
+[94] J. O. Besenhard, M. Winter, Proc. of the 2. Ulmer Elektrochemische 
+Tage, Ladungsspeicherung in der Doppelschicht 1995 (Ed: W. 
+Schmickler), Universitätsverlag Ulm, Germany, 47. 
+[95] O. Yamamoto, Y. Takeda, N. Imanishi, R. Kanno, New Sealed 
+Rechargeable Batteries and Supercapacitors1993 (Eds: B. M. Barnett, E. 
+Dowgiallo, G. Halpert, Y. Matsuda, Z. Takehara), Electrochemical 
+Society, Pennington, NJ, PV93-23,302. 
+[96] H. Fujimoto, A. Mabuchi, K. Tokumitsu, T. Kasuh, J. Power Sources 
+1995, 54, 440. 
+[97] K. Tokumitsu, A. Mabuchi, H. Fujimoto, T. Kasuh, J. Power Sources 
+1995, 54, 444. 
+[98] S. Yata, H. Kinoshita, M. Komori, N. Ando, T. Kashiwamura, T. Harada, 
+K. Tanaka, T. Yamabe, Synth. Met. 1994, 62, 153. 
+ 
+[99] S. Yata, K. Sakurai, T. Osaki, Y. Inoue, K. Yamaguchi, Synth. Met. 1990, 
+45 
+ 
+33, 177. 
+[100] S. Yata, Y. Hato, H. Kinoshita, N. Ando, A. Anekawa, T. Hashimoto, M. 
+Yamaguchi, K. Tanaka, T. Yamabe, Synth. Met. 1995, 73, 273. 
+[101] Y. Mori, T. Iriyama, T. Hashimoto, S. Yamazaki, F. Kawakami, H. 
+Shiroki, T. Yamabe, J. Power Sources 1995, 56, 205. 
+[102] T. Zheng, Q. Zhong, J. R. Dahn, J. Electrochem. Soc. 1995, 142, L211. 
+[103] M. Alamgir, Q. Zuo, K. M. Abraham, J. Electrochem. Soc. 1994, 141, 
+L143. 
+[104] T. Iijima, K. Suzuki, Y. Matsuda, Synth. Met. 1995, 73, 9. 
+ 
+46 
+ 
+                  Outline of Chapter Three 
+ 
+Silicon-Coated Carbon Nanofiber Mat for Anode of Lithium 
+Ion Battery 
+ 
+3.1   One Dimensional Carbon Materials as an Anode Material for 51 
+LIB 
+3.1.1  General Introduction of CNFs and CNTs 51 
+3.1.2  CNFs and CNTs Using as an Anode Material for LIB 56 
+3.1.3  Fabrication Methods of CNFs and CNTs 58 
+3.1.3-1  Chemical Vapor Deposition for Both CNFs and CNTs 58 
+3.1.3-2  Electrospinning Method for CNFs Mat 63 
+3.2   Electrospinning Fabricated CNFs Mat as an Anode Material 66 
+for LIB 
+3.2.1  SEM and Raman Characterization of CNFs Synthesized 67 
+ Through Electrospinning 
+3.2.2  Anode Performance of CNFs Synthesized Through 69 
+ Electrospinning 
+3.3   Silicon-Coated Carbon Nanofiber Mat for Anode of Lithium 71 
+47 
+ 
+Ion Battery 
+3.3.1 Introduction 72 
+3.3.2  Characterizations of CNF-Si Mat 76 
+3.3.3 Anode Performance of CNF-Si Mat 83 
+3.4 Summary of Chapter Three 95 
+Bibliography of Chapter 3 97 
+48 
+ 
+CHAPTER THREE 
+Silicon-Coated Carbon Nanofiber Mat for Anode of Lithium 
+Ion Battery 
+Owing to the current performance deficiencies of micron-sized carbon 
+anode materials such as graphites and hard carbons, researchers have been 
+struggling a long time to develop new materials and new structures to meet the 
+ever-growing market demands. As Richard Feynman indicated in 1959, 
+“there is plenty of room at the bottom” [1]: the emergence of nanoscience 
+and nanotechnology, which has led to a revolution in basic materials science and 
+engineering, has provided new opportunities to improve carbonaceous anode 
+performance. The nanoscaled carbon materials discovered so far include carbon 
+nanotubes (CNTs), carbon nanofibers (CNFs), and graphene (Gr), which have had a 
+profound impact on the development of clean energy storage and conversion 
+systems. Compared to bulk carbon materials, low dimensional carbons exhibit 
+novel properties which are often superior to their bulk counterparts associated 
+with decreased size, unique shape, and defects. Therefore, Li storage mechanism 
+and anodic behavior could be very different from bulk graphite.  
+ 
+Nanocarbon materials enable electrode reactions to occur that cannot take 
+place for materials composed of micrometer-sized particles. The diffusion time 
+constant for Li ions is given by $t = L^{2}/D$, where L is the diffusion length and D the 
+49 
+ 
+diffusion constant [2]. The reduced dimensions increase significantly the rate of 
+lithium insertion/removal and also the electron transport because of the short 
+distances for Li ion transport within the particles [3]. High surface area permits 
+high contact area with electrolyte and hence high Li ions flux across the interface. 
+The strain associated with intercalation is expected to be better accommodated 
+[4] in nanosized carbons. Due to the advantages as mentioned above, nanocarbon 
+materials have been extensively investigated as an anode of LIB.  
+ 
+However, it was found that nanocarbon materials can only provide a certain 
+degree of capacity improvement, which is still far lower than expected. 
+Thus, incorporation of another cheap and high capacity material such as silicon, 
+whose specific capacity can reach 3572 mA h g$^{-1}$ at room temperature, provides a 
+new way to overcome the above issue [5]. Nevertheless, severe structural 
+pulverization induced by the large volume expansion during charge/discharge 
+makes this material impractical [5]. Therefore, anode capacity improvement by 
+Si while maintaining the structural stability is another big challenge. Thus, the Si-
+coated CNF mat was synthesized by combining electrospinning and 
+electrochemical deposition in this work. The original idea is to improve the Si 
+structure stability by taking advantage of the entangled three dimensional CNF 
+network, which offers good conductivity and porosity. The structure-related 
+characterization and anode performance of CNF/Si mat will be given in detail. 
+Before that, the relatively popular one dimensional carbon materials such as 
+50 
+ 
+CNFs and CNTs will be discussed and compared based on their general 
+properties and the potential to be applied as an anode in LIB. Then the detailed 
+fabrication process of CNF mat through electrospinning method and the anodic 
+performance of as-fabricated CNF mats will be provided in this chapter. 
+ 
+3.1 One Dimensional Carbon Materials as an Anode Material for LIB 
+One dimensional carbon materials, carbon nanofibers (CNFs) and carbon 
+nanotubes (CNTs) are of great practical and scientific importance. Owing to their 
+similar cylinder shapes, the definitions of CNTs and CNFs are often misleading. 
+Due to the material and structural similarity, common features do exist in their 
+basic properties and Li storage mechanisms. Nevertheless, they are similar in 
+form but distinct in (1) general physical properties, (2) Li storage mechanisms 
+and (3) means of production which will eventually affect the practical application 
+in anode. Therefore, before the detailed discussion of electrospinning fabricated 
+CNF mat, the main anode material applied in this chapter, the general 
+comparison between CNFs and CNTs based on these three different factors is 
+provided here for comprehensive understanding of one dimensional anode 
+materials.  
+ 
+3.1.1 General Physical Property of CNFs and CNTs   
+If one takes a close look at the basic structure of CNTs and CNFs, the 
+51 
+ 
+geometry differences can be easily observed between them. CNFs can be 
+visualized as regularly stacked truncated conical or planar layers along the 
+filament length without hollow core [5–8] whereas, CNTs are formed by rolling 
+up graphene sheets to form concentric tubes containing an entire hollow core. In 
+fact, some of the carbon nanotubes being investigated actually qualify as carbon 
+nanofibers because they lack the long-range order of graphitic materials and/or 
+have imperfectly rolled graphene sheets. Generally, the diameters of CNFs and 
+CNTs can be used as a criterion to distinguish these two kinds of materials, as 
+shown in Figure 3.1 [9]. The diameter of CNTs is around a few tens of nanometers, 
+whereas the diameter of CNFs is usually larger than a hundred nanometers. Both 
+nanomaterials are available in various lengths and could be up to several hundred 
+micrometers depending on the feedstock and the production method.  
+ 
+ 
+ 
+ 
+ 
+Figure 3.1 Schematic comparison of the diameter dimensions on a log 
+52 
+ 
+scale for various types of fibrous carbons. Cited from Ref. [9]. 
+In the case of CNFs, the most important feature is that it exposes large 
+portion of graphene edge planes on its surfaces. In the case of CNTs, since it was 
+formed by rolling up graphene sheets, the basal plane of graphene is exposed, as 
+shown in Figure 3.2 [10]. This general difference in structure will eventually 
+affect the Li storage mechanism which will be discussed later. Compared to the 
+rather simple configuration of CNFs, CNTs display several different structures 
+based on the number of graphene layers and the rolling direction.  
+ 
+ 
+ 
+ 
+ 
+Figure 3.2 Wrapping of graphene sheet to form SWNT. Cited and 
+modified from Ref. [10]. 
+ 
+According to the number of graphene layers, CNTs can be further 
+distinguished into SWNTs and MWNTs. SWNT is a single graphene sheet rolled 
+into a form of a tube, whereas MWNTs are composed of several concentric tubes 
+53 
+ 
+of graphenes. The diameter of CNTs varies from a few nanometers in the case of 
+SWNTs to several tens of nanometers in the case of MWNTs. The representative 
+TEM figures of SWNT and MWNT are shown in Figure 3.3 [11].  
+ 
+Figure 3.3 Schematic indications of (a) SWCNT, (b) MWCNT, and 
+the corresponding TEM images in (c) and (d). Cited and replotted 
+from Ref. [11]. 
+ 
+According to the rolling directions, SWNTs can be completely described by 
+a single vector $\vec{C}_h$ (called the chiral vector), as shown in Figure 3.4. Two atoms in 
+a planar graphene sheet are chosen and one is set to be the origin. The chiral vector $\vec{C}_h$ 
+is pointed from the first atom toward the second one and is defined by the 
+relation $\vec{C}_h = n\vec{a}_1 + m\vec{a}_2$, where n and m are integers and $\vec{a}_1$ and $\vec{a}_2$ are the unit 
+cell vectors of the two-dimensional lattice formed by the graphene sheets. The 
+54 
+ 
+direction of the nanotube axis is perpendicular to this chiral vector. The angle 
+between the chiral vector and zigzag nanotube axis is the chiral angle θ 
+(Figure 3.4). With the integers n and m already introduced, this angle 
+can be defined by $\theta = \tan^{-1}\left[\,|n-m| / \left(\sqrt{3}\,(n+m)\right)\right]$. SWNTs can be described by 
+the pair of integers (n,m) which is related to the chiral vector. Three types of 
+SWNTs are revealed with these values: when n = m, the nanotube is called 
+“armchair” type (θ = 0°); when m = 0, then it is of the “zigzag” type (θ = 30°). 
+Otherwise, when n ≠ m, it is a “chiral” tube and θ takes a value between 0° 
+and 30°. The value of (n,m) determines the chirality of the nanotube and affects 
+the electronic property. SWNTs with |n-m| = 3q are metallic and those with |n-
+m| = 3q±1 are semiconducting (q is an integer) [12].  
+ 
+Figure 3.4. Chiral vector $\vec{C}_h$ and chiral angle θ definition for a (2, 
+4) nanotube on graphene sheet. $\vec{a}_1$ and $\vec{a}_2$ are the unit cell vectors 
+55 
+ 
+of the two-dimensional hexagonal graphene sheet. The circumference 
+of nanotube is given by the length of chiral vector. The chiral angle 
+θ is defined as the angle between chiral vector and the zigzag axis. 
+Cited and modified from Ref. [12]. 
+ 
+Compared to SWNTs, which display complex structure-determined 
+electronic properties, MWNTs are multi-surface graphene structures with various 
+chiral angles and lose these special electronic properties; they reveal an 
+average effect of all chiral tubes and thus usually exhibit a metallic property 
+since their diameters are large [11]. In comparison with CNTs, CNFs show 
+relatively low conductivity. As a result, in terms of material conductivity, 
+CNTs could be a better choice for the LIB anode. 
+ 
+3.1.2 CNFs and CNTs Using as an Anode Material for LIB  
+The limited capacity of graphite as introduced in chapter two has hindered 
+the further development of battery technology. The interesting properties of one 
+dimensional carbon materials therefore have been widely studied to substitute 
+graphite as an anode material of LIB. Generally, CNTs and CNFs show advanced 
+properties similar to those of graphite. On the one hand, they preserve or even 
+exceed common graphite in terms of high chemical stability and low resistance; 
+on the other hand, they show other favorable characteristics which could further 
+56 
+ 
+benefit the performance of anode. For example, CNTs and CNFs exhibit high 
+specific area which increases the contact area of electrode and electrolyte leading 
+to higher charge/discharge rates. The high mechanical strength and flexibility is 
+again superb for a long cycle life [13-16] and potential application in flexible 
+electronics, respectively.  
+ 
+The storage mechanisms of Li in CNFs and CNTs are similar to each other 
+and resemble that of bulk carbon materials, combining the characteristics of 
+graphite and non-graphitic carbon. Li ions could be stored through: (1) 
+intercalation (LiC6 stoichiometry); (2) adsorption and accumulation on the outer 
+surface; (3) void space between bundles; (4) defect sites, cavities and nanopores. 
+These kinds of storage mechanisms have been well illustrated in chapter two, see 
+Figure 2.10 [17-18].  
+ 
+However, one main difference does exist between CNFs and CNTs. In the 
+case of CNTs, lithium insertion through the walls (basal plane of graphene sheet) 
+or the capped ends is energetically not favorable as suggested by Kar et al. who 
+investigated lithium insertion into CNTs by ab initio and DFT methods [19]. On 
+the other hand, lithium ions can be inserted through CNF walls since it is mainly 
+composed of edge plane of graphene sheets [5-9]. More comprehensive 
+information related to Li insertion through these two kinds of graphene planes 
+will be provided in chapter 4. Thus, in the aspect of feasibility of Li penetration 
+57 
+ 
+which is closely related to the storage capacity and charge/discharge rate, CNFs 
+used as an anode material could be more advantageous than CNTs.  
+ 
+In addition to the differences in basic material properties and Li storage 
+mechanisms as mentioned above, one more important factor that needs to be 
+considered is the means of fabrication of one dimensional carbon materials. As a 
+matter of fact, the form of the produced carbon materials, the feasibility of further 
+processing into an LIB anode, and also the cost all have a huge influence on the real 
+application of CNFs and CNTs. Thus, the following section will mainly focus on 
+discussion of two popular fabrication methods of CNFs and CNTs. 
+ 
+3.1.3 Fabrication Methods of CNFs and CNTs 
+3.1.3-1 Chemical Vapor Deposition for CNFs and CNTs 
+Owing to material and structure similarity, both CNFs and CNTs can be 
+synthesized through chemical vapor deposition (CVD). CVD is a well known 
+production method for carbon based materials. One dimensional CNF/CNT and 
+two dimensional graphene can be fabricated using this method. Three basic 
+elements for CVD growth are catalyst, carbon precursor, and sufficient thermal 
+energy for gas decomposition and reaction to occur. Briefly, the CVD method 
+involves the decomposition of a gaseous or volatile compound of carbon, 
+catalyzed by metallic nanoparticles with external energy supply, which will also 
+58 
+ 
+serve as nucleation sites for the initiation of low dimensional carbon growth. The 
+most frequently used catalysts are transition metals, primarily Fe, Co, or Ni. The 
+energy source is heat from the CVD furnace [11]. By varying the conditions, 
+powder-like samples or film-like samples consisting of vertically aligned CNTs or 
+networks of CNFs/CNTs, which are supposed to benefit the fabrication process of 
+LIB electrodes, can be easily obtained, as shown in Figure 3.5. The length, 
+diameter, and morphology of CNFs and CNTs also can be controlled during the 
+synthesis process.  
+Figure 3.5 CVD process-fabricated (a) CNT powder, (b) vertically 
+aligned CNTs, and (c) CNF planar network. Cited from Ref. [11]. 
+ 
+One dimensional carbon anode usually consists of a thin layer of 
+CNFs/CNTs which is mounted onto a metal current collector. Compared to 
+vertically aligned CNFs/CNTs electrode, planar network-like (film or mat) 
+morphology is preferred not only because it is suitable to the conventional coin 
+cell battery fabrication but also the short circuit problem triggered by material 
+59 
+ 
+piercing through the separator can be avoided. In the case of as-grown CNFs or 
+CNTs network, the remaining impurities such as catalyst for growth and also an 
+appropriate substrate for growth need to be considered before anode preparation. 
+Combining all of the factors, powder-like CNFs/CNTs samples are widely used 
+nowadays. In order to form a network style CNFs or CNTs film from the as-
+synthesized powder, material functionalization and dispersion in liquid are 
+usually required before the electrode fabrication.  
+ 
+Since CNFs expose graphene edge planes on their surfaces, the surface state 
+can be easily modified through chemical functionalization or thermal treatments 
+whenever necessary. Functionalizing and dispersing the CNFs can be 
+performed using traditional, scalable, and fast processing methods. On the other 
+hand, the CNT functionalization was usually performed before dispersion by first 
+creating defect sites along the side walls of tubes, which can then be utilized for 
+attaching functional groups. This kind of method usually reduces the 
+conductivity and mechanical strength of CNTs and requires several processing 
+steps. Thus CNTs are more difficult and more costly to scale-up with respect to 
+CNFs.  
+ 
+Furthermore, in the case of CNTs, due to their smaller sizes than CNFs, van 
+der Waals forces are stronger which induce the formation of ropes or reassemble 
+after being dispersed. Therefore, chemical dispersants or functionalization 
+60 
+ 
+techniques are usually required to aid and maintain dispersion. Unlike CNTs, 
+CNFs with a stacked-cup style are less affected by van der Waals forces and tend 
+to stay dispersed for a longer period of time. This difference enables CNFs to be 
+dispersed through purely mechanical processing techniques without the need for 
+additional, and costly, processing steps, making CNFs easier and cheaper to 
+process. 
+ 
+Finally, the prices of CNTs and CNFs are very different depending on the 
+producer but in general, the cost of CNFs is typically an order-of-magnitude 
+lower than that of CNTs. CNFs are available in large volumes (up to 70,000 
+pounds per year) and range in price from as low as $ 100 per pound to as high as 
+$ 500 per pound. As to CNTs, the price varies widely and is strongly dependent 
+on the quality and purity of the products. One can find commercialized CNT 
+powder with the price as low as $100 per pound to as high as $ 750 per gram or 
+more. Therefore, the cost of the raw material plus the extra cost 
+of additional processing steps (such as purification and functionalization) is 
+much higher for CNTs than for CNFs. The series of post-treatment procedures also 
+significantly increases the complexity of the application of CNTs.  
+ 
+To conclude all of the factors as mentioned above, it is clear that CNFs 
+could be simpler and more cost effective material to be adopted in LIB compared 
+to CNTs. However, CVD method for the production of CNFs still remains 
+61 
+ 
+unsolved in many aspects. The complex experimental setup such as certain 
+vacuum level, toxic gases protection, and even plasma or microwave 
+involvement makes it less cost effective. Also, metals that are introduced as 
+catalysts during the synthesis usually remain in the sample, which interferes with 
+the desired properties of CNFs and causes a serious impediment to detailed 
+characterization and applications [10-12,20].  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 3.6 Typical anode assembling based on CVD process 
+fabricated carbon powder. Cited and modified from Ref. [20] 
+ 
+Furthermore, it is worth noting that a metal current collector and binders are 
+required to complete the final assembly of CVD-grown CNFs powder electrode, 
+as shown in Figure 3.6 [20]. The use of metal substrate not only increases the 
+mass of electrode which decreases the specific capacity but also causes a 
+62 
+ 
+corrosion-related issue in the long run. As for the use of binder, the conductivity 
+and effective mass of the electrode will also be affected. Therefore, a mature 
+CNF network fabrication method which is catalyst-free, easy, and cost-effective, 
+and which yields a mat/film style sample as the final product so that multiple 
+post-treatment steps are avoided, is in high demand in the industrial field of anode fabrication.  
+ 
+3.1.3-2 Electrospinning Method for CNF Mat 
+Fortunately, free-standing CNF mats can be fabricated by electrospinning as 
+an alternative to CVD. Electrospinning uses an electrical charge to draw 
+very fine (typically on the micro or nano scale) fibers from a liquid. This 
+traditional method usually combines electrospinning of organic polymers and 
+thermal treatment in an inert atmosphere. The electrospinning technique has been 
+considered to be one of the advanced fiber formation techniques from polymer 
+solution by using electrostatic forces [21-24]. Electrospun-based nanofibers 
+exhibited noticeable properties, such as nanosized diameter, high surface area, 
+and thin web morphology, which make them applicable to the fabrication of 
+high-performance nanocomposites and energy storage devices [25-31]. The 
+simple experimental setup and rather easy process compared to CVD are 
+particularly suitable for the production of CNFs on a large scale. Since this method 
+was adopted in the research part of this work, the fundamental mechanism and 
+detailed experimental procedures will be further explained as follows.   
+ 
+63 
+ 
+In the electrospinning process, a polymer solution held by its surface tension 
+at the end of a capillary tube is subjected to an electric field. Charge is induced 
+on the liquid surface by an electric field. Mutual charge repulsion causes a force 
+directly opposite to the surface tension. As the intensity of the electric field is 
+increased, the hemispherical surface of the solution at the tip of the capillary tube 
+elongates to form a conical shape known as the Taylor cone [32]. When the 
+electric field reaches a critical value in which the repulsive electric force 
+overcomes the surface tension force, a charged jet of the solution is ejected from 
+the tip of the Taylor cone. Since this jet is charged, its track can be controlled by 
+an electric field. As the jet travels in air, the solvent evaporates, leaving behind a 
+charged polymer fiber which lays itself randomly on a collecting metal screen. 
+Thus, continuous fibers are laid to form a fabric film [32].  
+ 
+The above description of the process suggests that the following parameters 
+affect the process: solution properties including viscosity, conductivity, and 
+surface tension; controlled variables including hydrostatic pressure in the 
+capillary, electric potential at the tip, and the distance between the tip and the 
+collection screen; and ambient parameters including temperature, humidity, and 
+air velocity in the electrospinning chamber. By appropriately varying one or 
+more of the above parameters, fibers with desired properties can be successfully 
+produced [32].  
+ 
+64 
+ 
+  
+ 
+ 
+Figure 3.7. Schematic of CNF mat fabrication processes: (a) 
+schematic of electrospinning apparatus and (b) the fabricated 
+nanofiber network. 
+ 
+To be more specific, the fabrication process of the polyimide (PI)-based CNFs, 
+which are also characterized as an LIB anode in the following section, is 
+taken as an example here. The apparatus used in the electrospinning process is shown 
+in Figure 3.7. It consists of a glass syringe with a maximum volume of 20 mL. 
+The glass syringe was filled with a poly(amic acid) (PAA) solution, in which 
+a metal needle (not shown in the figure) was embedded at the tip. A 
+syringe pump (not shown in the figure) was used to keep the solution at the tip of the 
+tube and also to control the flow rate (injection rate) of the solution. The solution was 
+65 
+ 
+charged by connecting the metal electrode to a high voltage power supply. A 
+cylindrical collector wrapped with aluminum foil was used as the collecting device 
+for the charged fibers.  
+ 
+The poly(amic acid) (PAA) was synthesized from pyromellitic dianhydride 
+(PMDA, Sigma Aldrich) and oxydianiline (ODA). PMDA (4.4 g) was added 
+to a DMF solution (21 g) in which ODA (4.0 g) had been pre-dissolved. The mixture 
+was stirred for 30 min with a magnetic bar. Triethylamine (TEA, 413 μL) was then 
+added to control the molecular weight. The as-prepared solution was then electrospun into 
+PAA nanofibers. The separation distance between the needle and collector, DC 
+bias voltage, and solution flow rate were 15 cm, 20 kV, and 0.2 mL h$^{-1}$, 
+respectively. The PAA nanofiber mat with aluminum foil was then put into a 
+stabilization oven and converted into a polyimide (PI) mat after seven different 
+oxidation steps at a rate of 1 °C min$^{-1}$ [52]. The PI mat was then peeled off from 
+the aluminum foil and transferred into a high-temperature furnace. The CNF mat was 
+formed by annealing the PI mat in a three-step annealing procedure 
+(first from room temperature to 600 °C in 1 h, then from 600 °C to 1000 °C in 1.3 
+h, and finally holding at 1000 °C for 1 h) under an argon gas environment, 
+following the previous publication [33].  
+ 
+3.2 Electrospinning Fabricated CNFs Mat as an Anode Material for 
+LIB 
+66 
+ 
+3.2.1 SEM and Raman Characterization of CNFs Synthesized Through 
+Electrospinning 
+The as-fabricated CNF mat was a free-standing film with a large area up to 
+15 x 15 cm$^{2}$. The CNF mat was carefully weighed using the A&D BM-22 
+microbalance located inside the dry room after being cut into a round shape of 
+1.5 cm diameter. The average mass of the film was around 1 mg with a thickness of 
+25 ± 3 μm. Typical SEM images of the CNF mat are shown in Figure 3.8. The average 
+diameter of the fibers was around 180 nm and the surface of the CNFs was smooth 
+and clean. The micro-Raman spectrum is shown in Figure 3.9. It clearly shows 
+a G-band near 1592 cm$^{-1}$, which is related to the optical E2g phonon at the 
+Brillouin zone center and indicates sp$^{2}$ hybridization of the carbon network, and a 
+D-band near 1352 cm$^{-1}$, which corresponds to the transverse optical phonon near the K 
+point and indicates sp$^{3}$ hybridization of the carbon network [34]. The intensity ratio 
+of D band to G band (ID/IG) was around 0.83. This fairly high value of ID/IG 
+indicates the existence of a large amount of disordered carbon phase and rather poor 
+conductivity of the CNFs. This could lead to poor electrochemical cycle 
+performance. Further extensive high temperature (> 1000 °C) and high vacuum 
+treatment could improve the crystallinity of the as-synthesized CNF mat, but the 
+loss of flexibility and the extra cost need to be considered. 
+ 
+ 
+ 
+67 
+ 
+  
+ 
+ 
+ 
+ 
+Figure 3.8. SEM images of as-synthesized CNFs with (a) top view and (b) 
+cross-sectional images. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 3.9. Micro-Raman spectra of CNFs mat fabricated by 
+electrospinning method. 
+ 
+This kind of free-standing CNF mat fabricated through a simple 
+electrospinning method is of great interest to be studied as an anode material in 
+LIB because not only the sample exhibits a film-like nature right after the 
+68 
+ 
+fabrication, which avoids the use of binder and metal substrate, but also the well-
+interconnected three-dimensional network structure provides a good porosity and 
+reasonable conductivity compared to common graphite. Therefore, the as-
+fabricated CNF mat was applied and tested as an anode in the following section. 
+ 
+3.2.2 Anode Performance of CNFs Synthesized Through 
+Electrospinning 
+The electrospinning-fabricated CNF mat was directly used as an anode for 
+the LIB test in this section. Electrochemical measurements were carried out with a 
+CR 2032 coin cell using a VMP3 instrument (BioLogic Science Instruments). The 
+cell was assembled in a dry room using a CR 2032 cell case with the bare CNF mat as 
+the working electrode, lithium metal foil as the counter/reference electrode, and 1 M 
+LiPF6 in a 1:1 (v/v) mixture of ethylene carbonate (EC) and diethyl carbonate 
+(DEC) as the electrolyte. No extra metal current collector, binder or conducting agent 
+was used. A glassy carbon microfiber was used as a separator. The cells were 
+charged and discharged galvanostatically between 2.0 and 0.01 V vs. Li/Li$^{+}$. Here, 
+we defined 1 C to be 372 mA h g$^{-1}$. The general charge/discharge profile is shown 
+in Figure 3.10a. 
+ 
+The charge/discharge (CD) profiles of CNF mat show a gradual change in a 
+broad voltage window during charge/discharge, revealing a V-shape feature. This 
+is in good contrast with a U-shaped graphite CD curve due to the existence of 
+69 
+ 
+disordered carbon phase in our CNF mat [35-36]. In the 1st charge of CNF, a 
+plateau near 0.7 V vs. Li/Li$^{+}$ can be attributed to the formation of the solid-
+electrolyte interface (SEI) via electrolyte decomposition [35]. In the discharge 
+process, the slope of the curve started at approximately 0.3 V vs. Li/Li$^{+}$ and 
+delivered a specific capacity of around 100 mA h g$^{-1}$ below 0.1 V vs. Li/Li$^{+}$. The 
+capacity from the potential region above 0.1 V may be ascribed to the faradaic 
+capacitance on the surface of the CNFs, and the capacity from the region lower than 
+0.1 V can be related to lithium intercalation into the CNFs [36-38]. This is in 
+good agreement with the combined effect of graphite and non-graphitic carbon as 
+analyzed in chapter two. The CNF mat delivered a charge and discharge capacity 
+of 776 and 458 mA h g$^{-1}$ in the 1st cycle and nearly saturated to 280 and 281 mA 
+h g$^{-1}$ after 50 cycles. The related capacity of each cycle, the rate performance  
+ 
+Figure 3.10. (a) Voltage profiles of the electrospinning-fabricated CNF mat 
+between 0.01 and 2 V at a charging rate of 0.1 C. The cycle numbers 
+70 
+ 
+are indicated in the figure. (b) Rate performance and Coulombic 
+efficiency of the above sample. 
+ 
+with higher current, and the Coulombic efficiency are summarized in Figure 3.10b. 
+The Coulombic efficiency, which is defined as the discharge capacity 
+divided by the charge capacity, was only 60 % in the first cycle and increased to 
+almost 100 % in the following cycles. The low Coulombic efficiency is caused by 
+the large irreversible capacity, which is related to the SEI formation as mentioned 
+in chapter two. 
+In summary, although both lithium intercalation and other storage 
+mechanisms are possible in the CNF mat, its lithium storage capacity, which is only 
+slightly higher than that of graphite at the beginning of cycling, is far lower than we 
+expected. Furthermore, problems similar to those of the non-graphitic carbon discussed 
+in chapter two, namely solid-electrolyte interface (SEI) formation and a rather large 
+Li insertion potential window, still exist. As a result, CNFs do not seem to offer 
+a major route to improve the anode performance. Thus, searching for 
+nanomaterial-based alternatives for graphite that combine inherent protection 
+against lithium deposition, low cost, low toxicity, fast lithium insertion/removal 
+speed and also higher capacity still remains challenging. 
+ 
+3.3 Silicon-Coated Carbon Nanofiber Mat for Anode of Lithium Ion 
+71 
+ 
+Battery 
+3.3.1 Introduction 
+In order to improve the capacity of conventional carbon based materials, 
+researchers have been focusing on the discovery of high capacity materials. 
+Recently, silicon, a high lithium storage capacity material (specific capacity of 
+3572 mA h g$^{-1}$ at room temperature, corresponding to Li15Si4) has been proposed 
+[39]. Yet, large volume expansion up to 400 % during charge/discharge causes a 
+severe structural pulverization, making this material impractical. For instance, a 
+simple deposition of Si thin film on metal substrate leaves crack formation during 
+cycling and therefore a contact loss between active material and current collector 
+occurs, leading to a poor cyclability, as shown in Figure 3.11 [40]. Si 
+nanowires/nanotubes (NWs/NTs) fabricated by various methods on metal 
+substrate could be an ideal approach to accommodate the volume change due to 
+existence of sufficient empty space between adjacent NWs/NTs [41-42]. 
+However, poor root adhesion with substrate and its brittle nature usually create 
+troubles in traditional coin cell fabrication process. On the other hand, the major 
+issue for Si nanoparticles, compared to Si NWs/NTs, is the formation and 
+preservation of electrical contact between each nanoparticle and substrate [43]. 
+This means that additional binder and conductive additives are usually needed, 
+which is similar to carbon based powder materials as mentioned in section 3.1.3-
+1 and will in turn increase the dead mass and thus reduce the capacity of the 
+72 
+ 
+electrode.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 3.11. (a) Schematic illustration of the structural deformation of Si-based 
+film/particles before and after charge/discharge cycling. (b) SEM 
+images of CVD-deposited Si thin film on Cu substrate after the 1st and 
+30th cycles of charge/discharge. Cited and modified from Ref. [20]. 
+Owing to these difficulties, several Si/nanocarbon composites have been 
+proposed. Silicon has been successfully deposited onto carbon fibers or CNFs 
+through chemical vapor deposition or sputtering [44-53]. Although Li storage 
+capacity was improved due to the contribution of deposited Si layers, 
+inhomogeneous deposition of Si atoms on fibers along the depth of the film 
+diminishes the effect of Si layers. Si nanoparticles have been deposited on CNFs 
+73 
+ 
+by dispersing them in organic solution and then co-spinning onto metal substrate 
+followed by heat treatment [50-53]. This causes again undefined nature of 
+adhesion between Si nanoparticles and CNFs, which is closely related to the 
+efficiency of charge transport across the interface. Electrochemical deposition of 
+silicon onto CNF substrate is rather promising, since the liquid reaction is easy to 
+handle with low cost and also the shape of silicon can be controlled by the 
+deposition conditions. Apart from the fabrication benefits, the CNF mat is a free-
+standing three dimensional skeleton and is conductive and porous so that the use 
+of binders and conductive additives can be avoided.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 3.12. Schematic of the apparatus for electrodeposition of Si. 
+The cell consists of three electrodes: working electrode (as-fabricated 
+CNF mat), counter electrode (Pt wire) and reference electrode 
+74 
+ 
+(Ag/Ag$^{+}$). During the deposition, a Si-containing electrolyte (SiCl4 in 
+PC) was added into the cell and a cyclic voltage scan (20 mV s$^{-1}$) was 
+applied to the electrodes. 
+ 
+In this study, the free-standing CNF mat was fabricated by using 
+electrospinning of polymer solution followed by stabilization and carbonization, 
+as introduced in section 3.1.3-2. Si was deposited on the surface of CNFs by 
+electrodeposition method through a home-made three-electrode cell. The cell 
+configuration was shown in Figure 3.12. By varying the deposition conditions, a 
+spaghetti-like Si layer with high surface area and porosity was formed. Si layer 
+was uniformly coated over nanofibers independent of the depth of the film. More 
+importantly, volume expansion was easily accommodated on the cylindrical 
+fibers and highly porous network of CNF mat. High temperature annealing of 
+1000 °C was performed to improve material purity and construct stable Si and 
+CNF interface by forming Si-C bond. This free-standing Si-coated CNF mat was 
+directly used as an anode material for LIB without using any additional metal 
+substrate or extra binder materials. The capacity of Si/CNF mat anode was 
+clearly improved by almost twice compared to that of graphite material. The 
+detailed electrochemical analysis was provided in conjunction with structural 
+properties.  
+ 
+75 
+ 
+3.3.2 Characterizations of CNF-Si Mat 
+Figure 3.13a shows typical cyclic voltammograms (CVs) at a scan rate of 
+20 mV s$^{-1}$ for CNF in PC electrolyte with/without adding SiCl4. A 
+reduction peak centered at around -2.0 V is clearly seen only in the case of the 
+electrolyte containing SiCl4. This suggests that Si ions are reduced into Si and 
+deposited onto the CNF mat during the CV test following the electrochemical reaction 
+$\mathrm{SiCl_4 + 4e^- \rightarrow Si + 4Cl^-}$. 
+The Si loading amount on the CNF mat was controlled by varying the number of CV 
+deposition cycles, as shown in Figure 3.13b. The mass (thickness) of the Si/CNF mat 
+kept increasing from ~ 1 mg to ~ 4 mg (from ~ 25 μm to 130 μm) as the 
+number of Si deposition cycles increased to 1000 cycles.  
+ 
+  
+Figure 3.13. (a) Cyclic voltammograms of silicon electrodeposition 
+in PC solution with/without SiCl4 at a scan rate of 20 mV s$^{-1}$. (b) 
+Mass and thickness of Si/CNF mat with respect to different silicon 
+76 
+ 
+deposition cycles. The error bar is added in the figure. 
+ 
+ A series of structural characterizations of the Si/CNF mat with 200 cycles of 
+CV deposition is shown in Figure 3.14. Micro-Raman spectra of bare CNF mat 
+(also shown in Figure 3.9) and pristine Si/CNF mat (without annealing, indicated 
+as Si-200-p) in Figure 3.14a shows intensity ratio of D band to G band (ID/IG) 
+remained unchanged (∼ 0.83) between bare CNF and Si-200-p after 
+electrodeposition of Si, indicating that carbon material is remarkably stable 
+compared to traditional metal substrate in severe electrochemical environment 
+[37]. However, in the case of Si/CNF mat after 1000 °C annealing (indicated as 
+Si-200-a), the value of ID/IG slightly decreased to ~ 0.79, suggesting an improved 
+graphitization in the CNF network. It is of note that no Si related peak can be 
+found in Si-200-p. This could be ascribed to the highly disordered nature of the 
+deposited Si which is caused by electrostatic clustering with alkyl terminators 
+and also the presence of deposited electrolyte residues on the surface, as shown 
+in Figure 3.15a [54]. On the other hand, three additional Si related peaks were 
+shown in the spectrum of Si-200-a. It is known that the first-order transverse-optical 
+(TO) phonon mode of crystalline Si (c-Si) displays a sharp peak at 520 cm$^{-1}$, 
+which usually becomes broadened and is downshifted when the long-range order in 
+Si is lost [55]. In our case, the peak located at around 500 cm$^{-1}$ was assigned to 
+microcrystalline or nanocrystalline (c/nc) Si and a broad band at the low energy 
+side originated from the presence of amorphous Si (a-Si). The peak near 300 cm$^{-1}$ 
+77 
+ 
+resembles the transverse acoustic (TA) phonon mode of c-Si and could be softened in 
+a-Si [55-57]. In addition, c-Si usually exhibits a small peak at 950 cm$^{-1}$, which is 
+related to the chemisorption of atomic/molecular oxygen species [58]. Here, we 
+also found a softened peak at 920 cm$^{-1}$ in Si-200-a. The red shift of 30 cm$^{-1}$ is 
+possibly caused by the existence of a-Si [57]. All of these factors demonstrate 
+that the as-deposited Si is completely disordered and evolves into more distinct a-Si 
+and c/nc-Si with additional oxygen species after high temperature annealing.  
+ 
+ 
+ 
+Figure 3.14. (a) Micro-Raman spectra of bare CNF mat and Si/CNF 
+mat with 200 cycles of Si deposition before/after annealing, indicated 
+as Si-200-p and as Si-200-a in the figure. (b) XPS spectra of the 
+electrode surface with active materials consisting of Si-200-p and Si-
+200-a, respectively. 
+   
+Figure 3.14b plots the XPS spectra of Si/CNF mat with 200 cycles 
+78 
+ 
+deposition before and after 1000 °C annealing. It is evident that the 
+intensities of Si 2s and Si 2p peaks increased clearly while the C 1s peak 
+relatively decreased. In addition, Cl 2p peak which appeared in Si-200-p 
+disappeared after annealing. After Si electrodeposition, certain amount of 
+electrolyte could be decomposed and remained on the Si surface. After annealing, 
+the residual film which mainly contained C, O, and Cl was removed, as seen in 
+Figure 3.15. This is also in good corroboration with Figure 3.14a. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 3.15. SEM images of (a) Si-200-p and (b) Si-200-a samples. 
+Dark color portion indicates electrolyte residues on the surface of 
+CNF mat. After 1000 °C annealing, the uniform mat surface was 
+observed by the removal of electrolyte, as shown in (b).  
+ 
+Figure 3.16a is the SEM image of the bare CNF mat, which was already 
+described in Figure 3.8. On the other hand, the Si-200-a sample displayed a 
+79 
+ 
+rough spaghetti-like surface, as shown in Figure 3.16b. The cross sectional view 
+of Si-CNF core-shell structure was shown in the inset of Figure 3.16b. It is of 
+note that the core-shell structure was formed uniformly independent of the depth 
+over hundred micrometers, which is in good contrast with other methods such as 
+sputtering and CVD, in which Si is not uniformly deposited along the depth of 
+the sample. AFM morphology of the same sample was provided in Figure 3.16c 
+with an amplified phase image in Figure 3.16d, again demonstrating rough Si 
+surface on the surface of CNFs. This unique spaghetti-like Si structure provided 
+large surface area compared to the flat Si thin film which can facilitate the charge 
+transfer at the electrolyte/Si interface. Moreover, the volume expansion can be 
+accommodated to certain degree by the high porosity of Si under the condition of 
+200 cycles deposition which is certainly better than the thick Si layers.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+80 
+ 
+Figure 3.16. (a) SEM images of as-synthesized bare CNFs and (b) 
+Si-200-a. The cross-sectional images are shown in the insets. (c) 
+AFM image of Si-200-a. The high resolution image of dashed square 
+in (c) is shown in (d). 
+ 
+Figure 3.17a is the TEM image of the Si-200-a sample. The layer thickness 
+of deposited Si was ~ 20 nm in this case. The existence of Si on the surface of 
+CNF was again confirmed by EDS line profile along the dashed line in the TEM 
+figure, as shown in Figure 3.17b. The spaghetti shape of Si was not visible here 
+probably due to the sample damage during TEM sample preparation process with 
+sonication. Since the thin film of electrodeposited silicon is highly active and 
+therefore can be oxidized immediately upon exposure to air during transfer from 
+the glove box to TEM, or X-ray diffraction (XRD) measurements, the crystalline 
+nature of the electrodeposited Si film is unlikely to be directly observed [59].  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+81 
+ 
+Figure 3.17. (a) TEM image of Si-200-a. The EDS line profile 
+along the dashed line is shown in (b). 
+ 
+To obtain information on the interface between CNF and Si, the C 1s and Si 2p 
+peaks in XPS were deconvoluted, as shown in Figure 3.18. The C 1s peaks before 
+and after annealing were clearly distinct from each other. A clear Si-C peak near 
+283 eV was visible in addition to small sp$^{2}$ and sp$^{3}$ peaks after annealing, while 
+only intense sp$^{2}$ and sp$^{3}$ peaks were shown before annealing [60-61]. It is of note 
+that the ratio of the sp$^{3}$ to the sp$^{2}$ peak was slightly reduced after annealing (from 
+62 % to 48 %), revealing a trend similar to the change of the D/G ratio in the Raman 
+spectra shown in Figure 3.14a. In addition, the COx peak near 288 eV slightly 
+increased after annealing [62]. A similar phenomenon was observed in the Si 2p peak 
+(Figure 3.18c, d). Before annealing, the main peak near 102.2 eV was the SiOx peak 
+with an additional Si-Si peak near 99.3 eV [62]. After annealing, the SiOx content was 
+slightly increased due to ambient oxidation, in good agreement with the C 1s peak 
+analysis. More importantly, a Si-C peak near 100.8 eV appeared after annealing 
+[60]. The Si-C peak shown in C 1s and Si 2p after annealing comes from 
+chemical bonding between CNF and Si at the interface. This peak is small due to 
+the narrow interface region, which is hardly observable by Raman spectroscopy, as 
+shown in Figure 3.14a. The presence of such Si-C bonds at the interface may not 
+contribute to Li storage but plays an important role in strengthening adhesion of 
+the Si layer to the CNFs and furthermore efficient charge transfer at the interface during 
+82 
+ 
+lithiation/delithiation process [63-64].  
+ 
+Figure 3.18. High-resolution XPS spectra of Si/CNF with 200 
+cycles of Si deposition before and after annealing. Figure (a) and (c) 
+are C 1s and Si 2p fitted peaks before annealing. (b) and (d) are C 
+1s and Si 2p fitted peaks after 1000 °C annealing. Peak positions 
+and relative ratios are shown in the figure. 
+3.3.3 Anode Performance of CNF-Si Mat 
+The electrochemical performance of bare CNF and Si/CNF mat was 
+investigated in LiPF6/EC+ DEC solution. For better comparison, the bare CNF 
+83 
+ 
+mat was annealed (indicated as CNF-a) under the same conditions as the composite 
+mat. The electrochemical performance comparison between CNF-a and non-
+annealed CNF is shown in Figure 3.19. In Figure 3.19a, lithiation/delithiation 
+occurred below ~ 0.3 V in the cathodic/anodic scan, which resembles the 
+characteristic of hard carbon, in the case of CNF [35,38]. However, the cathodic 
+peak below 0.1 V and the anodic peak at ~ 0.1 V belong to the characteristic of Li 
+intercalation/deintercalation into graphitic layers in CNF-a [65-66]. This 
+shows that our as-fabricated CNF mat contains a certain degree of 
+graphitization and disordered phase, which is consistent with Figure 3.14a and 
+Figure 3.18 and also with the improved graphitization degree of the CNFs after 1000 °C 
+annealing. In Figure 3.19b, the impedance profiles show a decrease of both the series 
+resistance (the starting point) and the charge transfer resistance (the radius of the 
+semicircle) after 1000 °C annealing. This again can be attributed to the higher 
+graphitization degree of CNF after annealing. 
+ 
+84 
+ 
+Figure 3.19. (a) CV profile comparison between bare CNF mat and 
+CNF mat after 1000 °C annealing. The curves were recorded after the 
+1st CV scan between 0.01 and 2 V at a scan rate of 0.1 mV s$^{-1}$. (b) AC 
+impedance spectra of the above two electrodes. The spectra were 
+recorded right after cell assembly, before cycling. 
+ 
+The CV curves of CNF-a and Si/CNF mat with 200 cycles of Si deposition 
+were shown in Figure 3.20a. In the case of Si/CNF mat, no appreciable peaks 
+related to LixSi alloy formation were observed in Si-200-p (dashed line). On the 
+contrary, two pairs of redox reaction peaks were observed in Si-200-a (solid line). 
+The sharp cathodic peak at ~ 0.01 V can be attributed to a combination effect of 
+CNF mat and c-Si/a-Si. The cathodic peak (Li alloy) at 0.2 V and anodic peaks 
+(Li dealloy) at 0.37 V and 0.52 V are due to the formation of amorphous LixSi 
+phase and delithiation back to a-Si, respectively [67-68]. The increase of the peak 
+intensities of a-Si with increasing the scan cycle numbers can be ascribed to the 
+conversion of the c/nc-Si into amorphous phase during the repeated CV scans. 
+The electrochemical analysis in Figure 3.20a provides us further understanding 
+of the Si crystallinity which is again in good agreement with Figure 3.14a.  
+85 
+ 
+Figure 3.20. (a) The 2nd and 10th cyclic voltammograms of CNF-a 
+(square), Si-200-p (dashed line) and Si-200-a (solid line) mats 
+between 0.01 and 2 V at a scan rate of 0.1 mV s$^{-1}$. (b) and (c) are 
+voltage profiles of Si-200-p/Si-200-a and CNF-a/Si-200-a between 
+0.01 and 2 V at a charging rate of 0.1 C. The cycle numbers are 
+indicated in the figure. (d) Charge/discharge capacity and Coulombic 
+efficiency of Si-200-a for the first 80 cycles. 
+ 
+The 1st, 2nd, 10th, 30th, and 50th galvanostatic charge/discharge (CD) profiles between 
+86 
+ 
+0.01 and 2 V of the Si/CNF mat with 200 cycles of deposition before/after 1000 °C 
+annealing are plotted in Figure 3.20b. The CD rate was 0.1 C, where 1 C is 
+defined to be 372 mA h g$^{-1}$. Compared to Si-200-p, which delivers a capacity of 
+around 300 mA h g$^{-1}$, Si-200-a exhibited a much higher capacity of almost 900 mA 
+h g$^{-1}$ at the 1st discharge and 730 mA h g$^{-1}$ at the 50th discharge, based on the total 
+mass of Si and CNF, with an average fading rate of 0.34 % per cycle. This can be 
+attributed to the presence of a mixed phase of Si (c-Si and a-Si) and also the 
+improved material purity after annealing by removing the electrolyte residues, as 
+discussed. Figure 3.20c shows the galvanostatic CD profiles of the CNF-a mat and Si-
+200-a. The CD profiles of the CNF-a mat have already been explained in Figure 3.10. 
+Compared to the CNF-a mat, the Si-200-a sample showed a large capacity of 1650 
+mA h g$^{-1}$ in the 1st charge and a capacity higher by almost three times (730 mA h 
+g$^{-1}$) after 50 cycles, since Si has a higher Li storage capacity than carbon. 
+However, a large capacity loss in the first cycle, related to the formation of 
+the SEI layer, was observed. Figure 3.20d shows the capacity retention of the Si-200-
+a sample at the specified charging rates. The discharge capacity at the 2nd cycle 
+was 710 mA h g$^{-1}$ at 0.2 C, 637 mA h g$^{-1}$ at 1 C and 565 mA h g$^{-1}$ at 2 C. The 
+Coulombic efficiency is defined as the ratio of the discharge to charge capacity 
+and is plotted in the same figure. The Coulombic efficiency of the Si-200-a sample 
+was approximately 54 % at the 1st cycle due to the SEI formation and increased to 
+99 % after 20 cycles at 0.1 C rate. The value was smaller than the ideal efficiency 
+because of the reformation of the SEI layer on newly exposed Si during cycling with 
+87 
+ 
+  
+a cost of Li consumption [69]. Compared to the Si thin film on the two 
+dimensional Cu substrate, the improved cyclic life was attributed to the highly 
+porous three dimensional CNF substrate and also the unique Si spaghetti 
+structure, which can both accommodate Si volume expansion. The comparison 
+between our work and previous publications with respect to the different 
+fabrication methods of Si/CNF composite structure was shown in Table 3.1. It is 
+clear to see that our result showed reasonable capacity and also capacity retention. 
+More importantly, our structure involved no metal substrate compared to others.  
+ 
+Table 3.1. Anode performance comparison of silicon/CNF composites 
+fabricated by different methods. CNF film is usually fabricated by 
+mixing CNF powder with a binder. CNF mat is binder-free 
+freestanding film fabricated by electrospinning method. 
+ 
+ 
+ 
+ 
+88 
+ 
+| Structure | Si deposition method | Mass [mg cm$^{-2}$] | Si mass ratio | Current density [mA g$^{-1}$] | Capacity@cycles [mA h g$^{-1}$][a] | Capacity retention | Structural features | Remarks |
+|---|---|---|---|---|---|---|---|---|
+| Si@CNF [44] | CVD | 2 | 75 % | 500 | 1600@55 | 80 % | film | Metal substrate |
+| Si@CNF [45] | CVD | 4 | 37 % | 50 | 766@20 | 80.3 % | film | CF mesh as a substrate |
+| Si@Hollow CNF [46] | CVD | — | 25 % | 0.5C[b] | 750@100 | 68.2 % | film | Metal substrate |
+| Si@CNFs [47] | Sputtering | 0.4 | 16 % | 50 | 1200@105 | 90 % | film | Metal substrate |
+| Si@VACNFs [48] | Sputtering | 0.2 | 49 % | 323 | 2752@100[c] | 89 % | — | VACNFs grown on metal substrate |
+| SiNWs@CNF [49] | VLS | 3.6 | 80 % | 342 | 1400@40 | 77 % | film | — |
+| Si/CNF [50] | Si NPs in DMF & electrospinning | — | 16 % | 100 | 773@20 | 90.4 % | mat | Metal substrate |
+| Si/CNF [51] | As above | 1.6 | 26 % | 50 | 726@40 | 46.8 % | mat | Metal substrate |
+| Si-CNF core-shell [52] | As above | — | 50 % | 240 | 1300@100 | 1 | film | Metal substrate |
+| Si/CNF [53] | Si NPs in DI & electrospinning | — | 41 % | 35 | 892@50 | — | mat | Metal substrate |
+| Si/CNF (Ours) | Electro-deposition | 1 | 43 % | 37 | 730@50 | 85 % | mat | No substrate; no binder |
+ 
+[a] Capacity is calculated based on silicon & carbon mass. [b] C rate is not mentioned in the reference. [c] Capacity is 
+calculated based on silicon mass.  
+ 
+89 
+ 
+  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 3.21. (a) Charge (filled symbols)/discharge (open symbols) 
+capacity in terms of different numbers of silicon deposition cycles 
+after high temperature annealing. Capacity was calculated based on 
+silicon mass only. Sample indications are shown in the right dashed 
+square. (b) AC impedance spectra of the above five electrodes. The 
+spectra were recorded right after the cell assembling before cycling. 
+The equivalent circuit is shown in the inset. The related resistance 
+value in Figure (b) was plotted in Figure (c) with respect to different 
+silicon deposition cycles. 
+90 
+ 
+For a better understanding of the structure-related Li storage capacity, 
+different amounts of Si were deposited on the CNF mat by varying the number of 
+electrodeposition cycles. The capacity retention of the Si/CNF mats (all after 
+1000 °C annealing) for the different Si deposition cycle numbers is 
+summarized in Figure 3.21a. Here, the specific capacity is expressed in terms 
+of net Si mass excluding carbon mass. The specific capacity with respect to net 
+Si mass from the composite was calculated from the following equation: 
+$$Q_{\mathrm{Si}} = \frac{m_{\mathrm{CNF}}}{m_{\mathrm{Si}}} \left\{ Q_{\mathrm{composite}} \left( 1 + \frac{m_{\mathrm{Si}}}{m_{\mathrm{CNF}}} \right) - Q_{\mathrm{CNF}} \right\}$$ 
+ 
+where “Qcomposite” is the total capacity of the CNF-Si composite according to the total 
+mass of the Si+CNF electrode. QSi (QCNF) is the specific capacity based on the net 
+mass of Si (CNF). Here mSi (mCNF) is the mass of deposited Si (CNF) in the 
+composite. The values of specific capacity were ~ 1545 mA h g$^{-1}$ at the beginning 
+of charge/discharge and were similar to each other regardless of the Si deposition 
+cycle numbers. However, capacity retention became poorer as the Si loading 
+amount increased; for example, the capacities for 200 and 1500 Si electrodeposition 
+cycles were 1354 mA h g$^{-1}$ and 873 mA h g$^{-1}$, respectively. As the Si thickness 
+increases, the deformation energy of Si increases as well, inducing more crack 
+initiation and propagation. In other words, in the case of thicker Si layers, crack 
+generation caused by volume variation is more significant [43]. Therefore, a 
+thicker Si layer peels off easily and eventually the capacity degradation occurs 
+more severely than that of a thinner Si layer. The cohesive energy of Si-C bonds at 
+91 
+ 
+the interface between Si and CNF is helpful for structure stabilization against the 
+increased deformation energy. Deformation energy is proportional to the 
+thickness, while interfacial energy is constant. When deformation energy exceeds 
+interfacial cohesive energy at critical layer thickness of Si, the structure of Si 
+breaks down. On the other hand, Si shape transformation was observed from 
+spaghetti-like to granule-like when CV deposition cycles keep increasing from 
+200 to 1500, as shown in Figure 3.22. The thin Si layer fabricated with 200 
+cycles CV deposition revealed a highly porous structure (See Figure 3.16), and 
+therefore the volume expansion can be minimized compared to the thick granular 
+shape Si layers.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+   
+ 
+ 
+ 
+92 
+ 
+Figure 3.22. SEM images of (a-b) Si-1500-p and (c-d) Si-1500-a 
+samples.  
+ 
+Nyquist plots of Si/CNF mat with different Si loading masses are plotted in 
+Figure 3.21b. The curves were collected right before electrochemical 
+charge/discharge cycling. All of the curves showed a depressed semicircle and a 
+tail, which indicates the mixed kinetics and diffusion process. The semicircle in 
+the high frequency range indicates the charge transfer resistance (Rct) at the 
+interface between electrode and electrolyte. The tail at low frequency region 
+implies a diffusion-controlled process. An equivalent circuit is shown in the inset 
+where Rs, Cdl, and Zw represent, respectively, the series resistance of the 
+electrode/electrolyte contact, double layer capacitance, and Warburg impedance 
+related to the diffusion of ions in the bulk electrode [70-71]. The value of Rs (first 
+point) and Rct (diameter of semicircle) were extracted from Figure 3.21b and 
+replotted in Figure 3.21c. As the Si loading amount increased, Rs slightly 
+increased due to lower conductivity of Si. The Rct decreased sharply with Si 
+deposition and then increased gradually as the Si coating amount increased. The 
+origin of large value of Rct observed in bare CNF-a sample compared to the Si-
+coated CNF sample could be the morphology difference between CNF-a and Si. 
+The Si shell exhibited much rougher surface than that of bare CNF-a (See Figure 
+3.16), which benefited the charge transfer process through large surface area. The 
+different lithiation mechanisms between silicon and carbon may also play a role 
+93 
+ 
+here. The increase of Rct in Si/CNF mat with increasing Si deposition cycles is 
+attributed to the larger granular size and less porosity of the deposited Si layers 
+(See Figure 3.22a). The straight line can be interpreted as the resistance for the 
+diffusion process of lithium ions into the electrode. The smaller angle between 
+real axis and the straight line as the Si loading amount increases simply indicates 
+again the limited diffusion of Li ions with increasing Si loading amount.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 3.23. Characterizations of Si-200-a electrode after 80 cycles 
+charge/discharge. (a) Top-view SEM image, (b) Cross-sectional SEM 
+image, (c) High resolution TEM image, and (d) AFM image. The SEI 
+layer was selectively removed by washing the sample with acetonitrile 
+94 
+ 
+and diluted HCl. 
+  
+ Figure 3.23a and b show SEM images for the structural changes of Si-
+200-a after cycling test. The SEI layer was selectively removed by using 
+acetonitrile and then HCl prior to imaging [72]. Si layer became rough hairy and 
+highly porous, compared to the one before cycling test in Figure 3.16. The lower 
+density of Si suggested that some spaghetti type Si at the outermost surface was 
+removed, as can be seen in the TEM image of Figure 3.23c. This is why capacity 
+was degraded during cycling. Nevertheless, compared to the sample with higher 
+Si loading amount (Figure 3.22c,d), the major portion of Si remained after 
+cycling test (See AFM image of Figure 3.23d), retaining relatively high capacity 
+and reasonable capacity retention. This is in fact corroborated to the robust Si-C 
+bonds formed at the interface between Si and CNF which was achieved by 
+1000 °C annealing. Free-standing CNF mat assembled through electrospinning 
+process without a binder or a metal substrate is a good platform to provide such 
+robust Si-C bonds due to abundant existence of sp$^{3}$ bonds at the surface of CNF, 
+as discussed in Figure 3.14 and Figure 3.18. 
+ 
+3.4 Summary of Chapter Three 
+In this chapter, general introduction of common one dimensional carbon 
+materials like CNFs and CNTs has been given. Compared to higher conductivity 
+of CNTs, CNFs exhibit an easier Li insertion pathway and a cost effective 
+95 
+ 
+property which make them a good candidate for anode of LIB. Especially, the 
+electrospinning method synthesized free-standing CNF mat has been intensively 
+studied in this work since it prevents the use of metal substrate, binder and 
+conducting polymers which usually increase the mass of electrode, degrade the 
+long term stability and reduce the anode capacity. Due to the unsatisfied capacity 
+of as-fabricated CNF mat, Si, a high capacity media was introduced into the three 
+dimensional CNF network through electrochemical deposition. Once again, the 
+structure involves neither a metal substrate nor binders. This could help us in 
+designing anode structures with high capacity and long cycle life in an economic 
+way. Thermal annealing of the combined mat at 1000 °C was necessary to 
+remove undesired residues formed during electrodeposition process and to form 
+strong Si-C bonds at the interface between Si layer and CNFs, which eventually 
+improved adhesion of Si to CNF and furthermore facilitated efficient charge 
+transfer between Si and CNF during lithiation/delithiation. This resulted in clear 
+improvement of the capacity of carbon materials more than twice for most of 
+cases. Optimization to improve composite structures for capacity, charge transfer, 
+and cycle life is further required for industry applications.  
+ 
+ 
+ 
+ 
+96 
+ 
+Bibliography of Chapter Three 
+[1] R. Feynman, Caltech's Engineering and Science Magazine 1960. 
+[2] Y. Ren, R. A. Armstrong, F. Jiao, G. P. Bruce, J. Am. Chem. Soc. 
+2010,132, 996. 
+[3] D. S. Su, R. Schlögl, ChemSusChem 2010, 3, 136. 
+[4] A. S. Aricò, P. Bruce, B. Scrosati, J. Tarascon, W. V. Schalkwijk, Nature 
+Mater. 2005, 4, 365. 
+[5] N.M. Rodriguez, A. Chambers, R.T.K. Baker, Langmuir 1995, 11, 3862. 
+[6] M. Endo, Y.A. Kim, T. Fukai, T. Hayashi, K. Oshida, M. Terrones, T. 
+Yanagisawa, S. Higaki, M.S., Appl. Phys. Lett. 2002, 80, 1267. 
+[7] S.H. Yoon, S. Lim, Y. Song, Y. Ota, W.M. Qiao, A. Tanaka, I. Mochida , 
+Carbon 2004, 42, 1723. 
+[8] S.H. Yoon, C.W. Park, H.J. Yang, Y. Korai, I. Mochida, R.T.K. Baker, 
+N.M. Rodriguez, Carbon 2004, 42, 21. 
+[9] Springer Handbook of Nanomaterials 2011, 
+chapter 7. 
+[10] J. Prasek, J. Drbohlavova, J. Chomoucka, J. Hubalek, O. Jasek, V. 
+Adamc, R. Kizek, J. Mater. Chem. 2011, 21, 15872. 
+[11] N. Saifuddin, A. Z. Raziah, A. R. Junizah, J. Mater. Chem. 2013, 
+http://dx.doi.org/10.1155/2013/676815.  
+[12] T. Belin, F. Epron, Materials Science and Engineering B 2005, 119,105. 
+[13] J. Zhao, A. Buldum, J. Han, Phys. Rev. Lett. 2000, 85, 1706. 
+[14] A.S. Claye, J.E. Fischer, C.B. Huffman, A.G. Rinzler, R.E. Smalley, J. 
+97 
+ 
+Electrochem. Soc. 2000, 147, 2845. 
+[15] W. Lu, D.D.L. Chung, Carbon 2001, 39, 493–496. 
+[16] H. Shimoda, B. Gao, X.P. Tang, A. Kleinhammes, L. Fleming, Y.Wu, O. 
+Zhou, Phys. Rev. Lett. 2002, 88, 015502. 
+[17] H. H. Lee, C. C. Wan, Y. Y. Wang, Journal of Power Sources 2003,1,7. 
+[18] C. Casas, W. Li, Journal of Power Sources 2012, 208, 74. 
+[19] T. Kar, J. Pattanayak, S. Scheiner, J. Phys. Chem. A 2001, 105, 10397. 
+[20] C. K. Chan, H. Peng, G. Liu, K. McIlwrath, X.Zhang, R. A. Huggins, 
+Y.Cui. Nature Nanotech. 2007, 3, 31. 
+[21] S. Ramakrishna, K. Fujihara, W.-E. Teo, T.-C. Lim, Z. Ma, World 
+Scientific, Singapore 2005. 
+[22] D.H. Renecker, A.L. Yarine, H. Fong, S. Koombhongse, J. Appl. Phys. 
+2000, 87, 4531. 
+[23] Y.M. Shin, M.M. Hohman, G.C. Martin, Polymer 1999, 40, 7397. 
+[24] I.D. Norris, M.M. Shaker, F.K. Ko, A.G. MacDiarmid, Synth. Met. 2000, 
+114, 109–114. 
+[25] F. Ko, Y. Gogotsi, A. Ali, N. Naguib, H. Ye, G. Yang, C. Li, P. Willis, 
+Adv. Mater. 2003, 15, 1161. 
+[26] C. Vozzi, C.J. Flaim, F. Bianchi, A. Ahluwalia, S. Bhatia, Sci. Eng. 2002, 
+20, 43. 
+[27] C. Kim, K.S. Yang, Appl. Phys. Lett. 2003, 83, 1216. 
+[28] R. Dersch, M. Steinhart, U. Boudriot, A. Greiner, J.H. Wendorff, Polym. 
+Adv. Technol. 2005, 16, 276. 
+98 
+ 
+[29] K. Aoki, Y. Usui, N. Narita, N. Ogiwara, N. Iashigaki, K. Nakamura, H. 
+Kato, K. Sano, N. Ogiwara, K. Kametani, C. Kim, S. Taruta, Y.A. Kim, 
+M. Endo, N. Saito, Small 2009, 5, 1540. 
+[30] C. Kim, K.S. Yang, M. Kojima, K. Yoshida, Y.J. Kim, Y.A. Kim, M.  
+Endo Adv.Funct. Mater. 2006, 16, 2393. 
+[31] R. Bacon: Production of graphite whiskers, J. Appl. Phys. 1960, 31, 283. 
+[32] J. Doshi, D. H. Reneker, Journal of Electrostatics 1995, 35, 151. 
+[33] N. T. Xuyen, E. J. Ra, H. Z. Geng, K. K. Kim, K. H. An, Y. H. Lee, J. 
+Phys. Chem. B 2007, 111, 11350. 
+[34] K. Nakamoto, in Infrared and Raman spectra of inorganic and 
+coordination compounds. Part A: theory and applications in inorganic 
+chemistry – 6th ed. Wiley 2009 
+[35] P. G. Bruce, B. Scrosati, J. M. Tarascon, Angew. Chem. Int. Ed. 2008, 47, 
+2930. 
+[36] E. J. Yoo, J. Kim, E. Hosono, H. S. Zhou, T. Kudo, I. Honma, Nano Lett.  
+2008, 8, 2277. 
+[37] F. Yao, F. Günes, H. Q. Ta, S. M. Lee, S. J. Chae, K. Y. Sheem, C. S. 
+Cojocaru, S. S. Xie, Y. H. Lee, J. Am. Chem. Soc. 2012, 134, 8646. 
+[38] C. C. Li, X. M. Yin, L. B. Chen, Q. H. Li, T. H. Wang, J. Phys. Chem. C 
+2009, 113, 13438. 
+[39] T. D. Hatchard, J. R. Dahn, J. Electrochem. Soc. 2004, 151, A838. 
+[40] J. P. Maranchi, A. F. Hepp, A. G. Evans, N. T. Nuhfer, P. N. Kumta, J.  
+Electrochem. Soc. 2006, 153, A1246. 
+99 
+ 
+[41] C. K. Chan, H. L. Peng, G. Liu, K. Mcilwarth, X. F. Zhang, R. A. 
+Huggins, Y. Cui, Nature Nanotechnology 2008, 3, 31. 
+[42] H. Wu, G. Chan, J. W. Choi, I. Ryu, Y. Yao, M. T. McDowell, S. W. 
+Lee, A. Jackson, Y. Yang, L. B. Hu, Y. Cui, Nature Nanotechnology 
+2012, 7, 310. 
+[43] H. Wua, Y. Cui, Nano today 2012, 7, 414. 
+[44] L. F. Cui, Y. Yang, Ch. M. Hsu, Y. Cui, Nano Lett. 2009, 9, 3370. 
+[45] G. K. Simona, B. Maruyama, M. F. Durstock, D. J. Burton, T. Goswami, 
+J. Power Sources 2011, 196, 10254. 
+[46] J. Y. Howe, D. J. Burton, Y. Qi, H. M. Meyer III, M. Nazri, G. A. Nazri, 
+A. C. Palmer, P. D. Lake, J. Power Sources 2013, 221, 455. 
+[47] P. C. Chen, J. Xu, H. T. Chen, C. W. Zhou, Nano Res. 2011, 4, 290 
+[48] S. A. Klankowski, R. A. Rojeski, B. A. Cruden, J. W. Liu, J. Wu, J. Li,  
+DOI: 10.1039/c2ta00057a. 
+[49] J. W. Choi, L. B. Hu, L. F. Cui, J. R. McDonough, Y. Cui, J. Power 
+Sources 2010, 195, 8311. 
+[50] L. W. Ji, K. H. Jung, A. J. Medford, X. W. Zhang, J. Mater. Chem. 2009, 
+19, 4992 
+[51] L. W. Ji, X. W. Zhang, Energy Environ. Sci. 2010, 3, 124. 
+[52] T. H. Hwang, Y. M. Lee, B. S. Kong, J. S. Seo, J. W. Choi, Nano Lett. 
+2012, 12, 802. 
+[53] X. Fan, L. Zou, Y. P. Zheng, F. Y. Kang, W. C. Shen, Electrochemical and 
+Solid-State Lett. 2009, 12, A199. 
+100 
+ 
+[54] H. J. Kim, M. H. Seo, M. H. Park, J. P. Cho, Angew. Chem. Int. Ed. 2010, 
+49, 2146. 
+[55] M. Holzapfel, H. Buqa, L. J. Hardwick, M. Hahn, A. Würsig, W. 
+Scheifele, P. Novák, R. Kötz, C. Veit, F. M. Petrat, Electrochimica Acta 
+2006, 52, 973. 
+[56] G. Kanellis, J. F. Morhange, M. Balkanski, Physical Review B 1980, 21,  
+1543. 
+[57] J. E. Smith, Jr., M. H. Brodsky, B. L. Crowder, M. I. Nathan, A. Pinczuk,  
+Phys. Rev. Lett. 1971, 26,642. 
+[58] K. Nakamoto, in Infrared and Raman spectra of inorganic and 
+coordination compounds. Part A: theory and applications in inorganic  
+chemistry – 6th ed. Wiley 2009. 
+[59] X. Chen, K. Gerasopoulos, J. Guo, A. Brown, C. Wang, R. Ghodssi, J. N.  
+Culver, Adv. Funct. Mater. 2011, 21, 380.  
+[60] S. Contarini, S. P. Howlett, C. Rizzo, B. A. De Angelis, Applied Surface  
+Science 1991, 51, 177. 
+[61] M. Rybachuk, J. M. Bell, Carbon 2009, 47, 2481. 
+[62] N. Fourches, G. Turban, B. Grolleau, Applied Surface Science 1993, 68, 
+149. 
+[63] A. M. Wilson, J. R. Dahn, J. Electrochem. Soc. 1995, 142, 326. 
+[64] W. Wang, P. N. Kumta, J. Power Sources 2007, 172, 650. 
+[65] K. A. Striebel, A. Sierra, J. Shim, C. W. Wang, A. M. Sastry, J. Power  
+Sources 2004, 134, 241. 
+101 
+ 
+[66] M. D. Levi, C. Wang, J. S. Gnanaraj, D. Aurbach, J. Power Sources 
+2003, 119–121, 538. 
+[67] X. L. Chen, X. L. Li, F. Ding, W. Xu, J. Xiao, Y. L. Cao, P. Meduri, J. 
+Liu, G. L. Graff, J. G. Zhang, Nano Lett. 2012, 12, 4124. 
+[68] Y. Yao, M. T. McDowell, I. Ryu, H. Wu, N. Liu, L. B. Hu, W. D. Nix, 
+Y. Cui,  Nano Lett. 2011, 11, 2949. 
+[69] P. R. Abel, Y. M. Lin, H. Celio, A. Heller, C. B. Mullins, ACS Nano 
+2012, 6, 2506. 
+[70] K. Naoi, N. Ogihara, Y. Igarashi, A. Kamakura, Y. Kusachi, K. Utsugi, J.  
+Electrochem. Soc. 2005, 152, A1047. 
+[71] J. B. Gong, H. Q. Wu, Electrochimica Acta 2000, 45, 1753. 
+[72] H. Wu, G. Y. Zheng, N. Liu, T. J. Carney, Y. Yang, Y. Cui, Nano Lett. 
+2012, 12, 904. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+102 
+ 
+Outline of Chapter Four 
+ 
+Diffusion Mechanism of Lithium Ions through Basal Plane of 
+Layered Graphene 
+ 
+4.1 Brief Introduction of Two Dimensional Graphene 105 
+4.1.1 General Physical Properties of Graphene 105 
+4.1.2 Synthesis Methods of Graphene 110 
+4.2 Diffusion Mechanism of Lithium Ions through Basal Plane of 113 
+Layered Graphene 
+4.2.1 Material Preparation 116 
+4.2.2 Transfer Process of Graphene 116 
+4.2.3 Characterization of Graphene 117 
+4.2.4 Anode Performance of Graphene 121 
+4.3 Summary of Chapter Four 140 
+Bibliography of Chapter 4 141 
+ 
+ 
+ 
+ 
+ 
+103 
+ 
+CHAPTER FOUR 
+Diffusion Mechanism of Lithium Ions through Basal Plane of 
+Layered Graphene 
+Recently, graphene, composed of monolayer of carbon atoms arranged in a 
+honeycomb network, has emerged explosively and attracted much attention in the 
+fields of materials science and condensed-matter physics. High mobility of 
+graphene is probably the most fascinating property for physicists and engineers, 
+which is attributed to the linear band dispersion, leading to massless Dirac 
+quasiparticle feature. On the other hand, as the thinnest carbon material, 
+graphene and graphene-based materials have promising applications in numerous 
+energy sciences, for instance, Li-ion batteries (LIBs), fuel cells, and solar cells. 
+In particular, these materials have superior electrical conductivities to graphitic 
+carbons and higher surface area of over 2600 m$^{2}$/g than CNTs, and a broad 
+electrochemical window that would be more advantageous in energy storage. 
+Thus, a series of research works on LIB based on graphene were performed 
+intensively with the similar routes to the CNTs-based electrode materials for LIB 
+[1-6]. Some scientists used graphene sheets directly as an anode material for LIB 
+and found that they had improved electrochemical properties. For example, the 
+first reversible specific capacity of the prepared graphene sheets with a specific 
+surface area of 492.5 m$^{2}$/g was as high as 1264 mAh g$^{-1}$ at a current density of 
+100 mA/g. After 40 cycles, the reversible capacity was still kept at 848 mAh g$^{-1}$ 
+at a current density of 100 mA/g, higher than that of CNTs or CNF electrodes [7].     
+104 
+ 
+The interesting single atomic layer structure of Gr can also be used for 
+fundamental science and a good candidate for the fundamental study of Li ion 
+diffusion pathway in addition to its real applications as an anode in LIB. Large 
+area single layer graphene (SLG) which consists of a clean basal plane for the 
+study of Li insertion prevents the coexistence of both edge plane and basal plane 
+in graphite that often hinders the understanding of lithium ion diffusion 
+mechanism. Therefore, in this chapter, after a brief introduction which includes 
+the general properties and production methods of Gr, the diffusion mechanism of 
+lithium ion through basal plane of layered graphene has been intensively studied. 
+In this case, two types of graphene samples were prepared by chemical vapor 
+deposition (CVD): i) well-defined basal plane single layer graphene grown on Cu 
+foil, ii) edge plane-enriched graphene layers grown on Ni film. Electrochemical 
+performance of graphene electrodes has been examined based on different number 
+of graphene layers and also different defect population on graphene basal plane. 
+Density functional theory calculations were also provided to clarify the diffusion 
+barrier heights for various types of defects.  
+ 
+4.1 Brief Introduction of Two Dimensional Graphene 
+4.1.1 General Physical Properties of Graphene   
+Graphene is a two-dimensional (2D) honeycomb lattice structure consisting of 
+sp$^{2}$-hybridized carbon atoms in the form of a one-atom-thick planar sheet. This 
+105 
+ 
+unique material is a basic building block for many other carbon-based graphitic 
+materials such as zero-dimensional (0D) fullerenes, one-dimensional (1D) carbon 
+nanotubes, and three-dimensional (3D) graphite and is an excellent basic model 
+for many other 2D materials (Figure 4.1). With its unique structure, graphene 
+exhibits extraordinary thermal, mechanical, and electrical properties, which 
+makes it a popular material in many different research areas, theoretically and 
+experimentally.  
+ 
+Figure 4.1. Graphene is a basic 2D building block for other carbon 
+allotropes with different dimensionalities. Cited from Ref.[8]. 
+ 
+The unusual electronic properties of graphene are originated from its unique 
+106 
+ 
+band structure. In the lattice of graphene, carbon atoms are located at each corner 
+of hexagons binding with three neighboring carbon atoms. Carbon atom has four 
+valence electrons, three of which are used for covalent σ-bonding with 
+adjacent carbon atoms in graphene lattice. The remaining π-orbital determines 
+the electronic structure of graphene which is "coupled" with the other π-electrons 
+on adjacent carbon atoms. Each π-electron is delocalized, i.e., has a "field of 
+influence" of 360 degrees around its own carbon atom within an individual 
+graphene layer. The unit cell of graphene contains two π-orbitals (π and π*), 
+which disperse to form two π-bands that can be considered as bonding (the lower 
+energy valence band) and anti-bonding (the higher energy conduction band) in 
+nature.  
+ 
+Figure 4.2. a) Honeycomb lattice of graphene with two carbon atoms 
+per unit cell. b) Tight-binding band structure of graphene π-bands, 
+considering only nearest neighbor hopping. c) Band structure near K 
+point showing the linear dispersion relation. Cited from Ref. [9]. 
+107 
+ 
+   The bonding-antibonding gap closes at the corners of the Brillouin zone, or 
+the K points. (See Figure 4.2) As a result, the π-band dispersion is approximately 
+linear around the K points: $E = \hbar v_F |k|$, where $k$ is the wave vector measured from 
+K, $\hbar$ is Planck’s constant $h$ divided by $2\pi$, and $v_F$ is the Fermi velocity in 
+graphene, approximately $10^{6}$ m/s. Since the electrons in graphene have kinetic 
+energies exceeding their mass energy, electrons behave like photons or ultra-
+relativistic particles with an energy-independent velocity vF that is approximately 
+300 times smaller than the speed of light in vacuum, allowing relativistic effects 
+to be observed in graphene without using particle accelerators [9]. These 
+quasiparticles, called massless Dirac fermions, can be seen as electrons that have 
+lost their rest mass m0 or as neutrinos that acquired the electron charge e [10]. 
+Owing to this linear (or “conical”) dispersion relation at low energies, electrons and holes 
+near these six points, two of which are inequivalent, behave 
+like relativistic particles described by the Dirac equation for spin 1/2 particles 
+[11]. Dirac fermions behave in unusual ways when compared to ordinary 
+electrons if subjected to magnetic ﬁelds, leading to new physical phenomena [12-
+14] such as the anomalous integer quantum Hall effect (IQHE) measured 
+experimentally [14-15]. The IQHE in graphene can be observed at room 
+temperature because of the large cyclotron energies for “relativistic” electrons 
+[16]. In fact, the anomalous IQHE is the signature of Dirac fermion behavior. 
+With these properties, graphene is a perfect mixture of semiconductor (zero 
+density of states) and a gapless metal which is quite different from other metals 
+108 
+ 
+and semiconductors with its very long mean free paths (Figure 4.3).  
+Figure 4.3. Electronic Structure of: a) Metal: Finite Density of States 
+(DOS) at Fermi energy. b) Semiconductor: Gap at Fermi energy. c) 
+Graphene: Zero gap Semiconductor. Zero DOS metal. Cited from Ref. 
+[18]. The interesting 2D structure of graphene makes it a good 
+candidate for electronic device applications [17]. Unlike an ordinary 
+metal, in which any impurities in the crystal scatter electrons and so 
+lead to energy loss, the electrical resistance in graphene is independent 
+of the number of impurities. This means that electrons can travel for 
+several microns without colliding with impurities, making graphene a 
+promising material for potential high-speed electronic switching 
+devices called “ballistic transistors”. Experimental transport 
+measurements show that graphene has an unusually high electron 
+mobility even at room temperature, in excess of 15,000 cm$^{2}$ V$^{-1}$ s$^{-1}$, of 
+which mobilities for holes and electrons are nearly the same [9,14,18-19]. 
+Graphene has a number of other extraordinary properties such as strong 
+109 
+ 
+mechanical properties and high flexibility allowing strain based graphene 
+electronics [20-21]. Another important aspect of graphene is its high thermal 
+conductivity up to 5000 W/mK at room temperature, 20 times higher than that of 
+copper, which could be exploited to applications in microelectronics and thermal 
+management structures [22]. Its optical properties are strongly related to its 
+electronic properties such as its low energy electronic structure where conical 
+bands of electron and hole meet at the Dirac point resulting in unexpected high 
+opacity. An atomic monolayer of graphene absorbs πα ≈ 2.3% of white light, 
+where α is the fine-structure constant [23]. It has been shown that graphene 
+system exhibits electrochromic behavior, allowing tuning of both linear and 
+ultrafast optical properties [24-25]. 
+ 
+4.1.2 Synthesis Methods of Graphene 
+First attempts to understand the basic properties of graphene were made by the micro-
+cleavage method, which is a simple method to isolate graphitic layers from 
+graphite into monolayer graphene flakes with the help of a cohesive tape [26]. 
+Although many basic electronic properties of graphene such as the bipolar 
+transistor effect, ballistic transport of charges, large quantum oscillations, etc., 
+were explored by this method, for the large area graphene applications it was 
+necessary to find other synthesis methods (Figure 4.4). For this purpose, 
+epitaxial synthesis of graphene on different substrates was realized. Many 
+110 
+ 
+important graphene properties have been identified in graphene produced by SiC 
+substrate. In this method, the face of SiC, silicon or carbon-terminated, is used 
+for graphene formation in ultra high vacuum furnaces at very high temperatures 
+(>1100 °C) to decompose SiC into graphene [27]. Another approach for epitaxial 
+growth of graphene is studied on metal substrates, such as ruthenium, iridium, 
+and nickel [28-30]. Although these substrates have been employed to obtain 
+graphene, the interaction of graphene with underlying substrate and conducting 
+behavior of these substrates necessitated the transfer of graphene layers onto 
+other substrates for the application. Synthesis of large area few-layered graphene 
+together with transferring onto another substrate has been realized by chemical 
+vapor deposition (CVD) method on polycrystalline metallic substrates such as Ni 
+and Cu [31-33]. Unlike the epitaxial growth techniques, CVD method has been 
+realized by decomposition of carbon gases such as ethylene and methane 
+followed by either carburization-precipitation, or surface adsorption of carbon 
+gases. To fabricate devices, graphene, then, can be transferred by 
+polymethylmethacrylate (PMMA) as a supporting layer after dissolving the 
+underlying metallic substrate in a metal etchant and “fishing” the single-layer 
+graphene up onto a desired substrate (e.g., SiO2/Si). This method will be 
+explained in detail later. Graphene has been also derived from graphite oxide by 
+thermal annealing or chemical reduction by hydrazine [34-35]. This method 
+combining with the typical powder process (involves metal current collector and 
+binders) as mentioned in chapter three has been considered as one of the most 
+111 
+ 
+popular one used in battery electrode fabrication. However, graphene produced 
+by graphite oxide reduction is lower in quality compared to graphene obtained by 
+aforementioned production methods due to incomplete removal of various 
+functional groups by existing reduction methods.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 4.4 Production techniques of graphene: a) Micro-cleavage 
+method, isolating graphitic layers from graphite into monolayer 
+graphene flakes with the help of a cohesive tape, b) epitaxial growth 
+of graphene by decomposition of SiC into graphene, c) chemical 
+vapor deposition method by decomposition of hydrocarbon gases on 
+metal substrates, and d) chemical exfoliation of graphite oxide by 
+weakening van der Waals cohesive force via insertion of reactants 
+into interlayer space.     
+112 
+ 
+4.2 Diffusion Mechanism of Lithium Ions through Basal Plane 
+of Layered Graphene 
+Graphite has been widely used for anode material in lithium ion battery due 
+to its well defined layered structure for lithium intercalation, low operating 
+potential, and remarkable interfacial stability [36]. Graphite has two 
+characteristic planes: basal plane and edge plane which are parallel and 
+perpendicular to the c-axis, respectively. It is known in general that the basal 
+plane and edge plane exhibit different physical and chemical activities in many 
+aspects, leading to different lithiation capabilities in graphite [37-38]. The 
+diffusion time constant for Li ion insertion within the active graphitic flakes is 
+governed by the formula $\tau = L^{2}/2D$, where $L$ is the diffusion length (or radius of 
+spherical flake) and $D$ is the diffusion coefficient [39]. Although lithium diffusion 
+through basal plane is rather limited, lithium diffusion may still occur through 
+several defect sites such as vacancies and grain boundaries [40-41]. Lithium 
+diffusion through edge plane of graphitic flakes can be easily facilitated but 
+further complicated by the presence of different functional groups such as 
+hydroxyl and carboxyl groups. In other words, lithiation through these two 
+different planes is highly anisotropic [42-46].  
+One ambiguity in understanding diffusion pathway of lithium ions in 
+graphite is the coexistence of both edge plane and basal plane in the sample. The 
+presence of these two different interfaces is unavoidable in conventional graphite 
+[32,47]. Currently available highly oriented pyrolytic graphite (HOPG), which is 
+113 
+ 
+well known as highly ordered crystallographic structure, has a finite size of 
+flakes whose edge planes are still abundant in addition to basal planes. Therefore, 
+lithium ion diffusion through basal plane cannot be observed exclusively [40-
+43]. Thus, a well defined basal plane of graphite with large area is required to 
+have a comprehensive picture of lithium diffusion mechanism in lithium ion 
+battery. 
+ 
+Recently large area monolayer and multi-layer graphene have been 
+synthesized by chemical vapor deposition (CVD) [32,47]. This paves a new route 
+for exploring numerous new fundamental sciences and moreover developing 
+numerous technological breakthroughs in electronics and energy storage [48-50]. 
+Large area graphene can be transferred onto any substrate by a simple transfer 
+process and therefore an anode electrode with layered graphene without leaving 
+edge plane (or negligible portion of edge plane) is easily attainable. This provides 
+an opportunity to study diffusion of lithium ions exclusively through the basal 
+plane of graphene. 
+ 
+On the other hand, in lithium ion battery, corrosion of conventional current 
+collectors such as Al, Cu, and stainless steel (SUS) can adversely affect life time 
+and safety through increased internal resistance, passivation of active materials, 
+and consumption of electrolyte/ active electrode materials [51-57]. Anode 
+performance of thin graphene layers can be misguided by the strong substrate 
+114 
+ 
+reaction since the most reactive lithium ions exist in electrolyte [58-59]. It has 
+been proposed that monolayer graphene can be used as a protective layer for 
+ 
+substrate against air oxidation and mild electrochemical reaction [60-61].
+Therefore, information on the critical layer thickness of graphene (lc) to minimize 
+the substrate effect and the influence of defects to lc are key ingredients to 
+understand electrochemical reaction and protective nature of graphene layers 
+under severe electrochemical condition.   
+ 
+The main purpose of this work is twofold: i) To clarify lithium diffusion 
+pathway through basal plane of graphene layers and ii) to investigate the 
+influence of defect population to lithium ion diffusion and the protective ability 
+of graphene layers. In this article, we prepared Cu-grown monolayer graphene 
+(SLG) samples and Ni-grown multi-layered graphene (MLG) samples that are 
+dominated with graphene basal plane and edge plane, respectively. We found that 
+the electrochemical performance of few-layer graphenes (FLGs) which are 
+overlapped up to three layers of SLG is strongly affected by the substrate 
+reaction. Experiments with Ar plasma treatment indicated that 6 layers of basal 
+plane-enriched large area graphene were needed to provide sufficient substrate 
+protection. Combining the experimental results and density functional theory 
+calculations, we proved that basal plane hindered lithium ion diffusion with a 
+high diffusion barrier height, whereas divacancies and higher order defects can 
+be shortcuts for lithium ion diffusion. 
+115 
+ 
+4.2.1 Material Preparation 
+Large area SLG was synthesized on copper foil by atmospheric pressure 
+(AP) CVD. Cu foil purchased from Nilaco (Lot No. 113321, 99.96 %, 100 μm in 
+thickness) was preannealed to 1060 °C for two hours with 100 sccm of Ar gas 
+and 200 sccm of H2 gas to enlarge Cu grain size and then chemico-mechanically 
+polished with FeCl3 solution for flattening. The prepared Cu foil was then 
+brought into the growth chamber. The temperature of the chamber was heated up 
+to 1060 °C with 1000 sccm of Ar gas and 200 sccm of H2 gas for 20 min. 
+Methane (5 sccm) was then introduced with 10 sccm H2 gas for 5 min. After 
+growth, the sample was cooled down to room temperature naturally in the same 
+atmosphere. In the case of MLG synthesis, Ni thin film (300 nm) was deposited 
+on SiO2 (300 nm)/Si by a thermal evaporator. This was placed in rapid thermal 
+CVD chamber. Temperature was increased to 1000 °C in 5 min in vacuum. Ni 
+surface was reduced by flowing 45 sccm H2 gas at 1000 °C. The gas mixing ratio 
+of C2H2:H2 was optimized to 2:45 sccm and flown for a minute. After completion 
+of growth, the gas supply was terminated and the chamber was cooled down to 
+ 
+room temperature. The detail has been described elsewhere [62-63].
+ 
+4.2.2 Transfer Process of a Graphene  
+    PMMA (e-beam resist, 950 k C4, Microchem) was spin-coated on the 
+graphene/Cu foil (Ni film) at 1000 rpm for 60 s. To etch away Cu foil (Ni film), 
+the sample was submerged in a copper etchant (CE-100, Transene) for ∼30 min 
+116 
+ 
+(4 hours for Ni film). After rinsing by deionized water for a few times, 
+PMMA/graphene layer was fished onto the CR 2032 cell case coated with 
+lithium-reaction resistive polymer, as shown in Figure 4.5. PMMA was removed 
+by acetone later after graphene was completely dried and attached onto the cell 
+case. The transferred sample was then annealed up to 650 °C for 5 h in high 
+vacuum ($1 \times 10^{-6}$ Torr) for further removal of PMMA [63-64].  
+ 
+Figure 4.5. Schematic of fabrication process with Cu-grown SLG 
+or Ni-grown MLG (left panel). Bilayer and trilayer graphene can be 
+fabricated by transferring monolayer graphene repeatedly. 
+Photograph of as-prepared monolayer graphene (PMMA on top) 
+floating in water and CR 2032 coin cell case (right panel). 
+  
+4.2.3 Characterization of a Graphene 
+117 
+ 
+Figure 4.6 shows a schematic of the CR 2032 coin cell type battery. The 
+half cell was then fabricated with a counter/reference electrode of Li foil for the 
+test of Li diffusion through well defined basal graphene plane (Figure 1f). 
+Bilayer and trilayer graphene coin cells were also fabricated by transferring 
+monolayer graphene repeatedly. MLG was synthesized on Ni film to represent 
+graphene where the edge plane was enriched and the half cell was fabricated 
+similarly. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 4.6. Schematic of a coin cell structure with Cu-grown SLG 
+or Ni-grown MLG. Bilayer and trilayer graphene coin cells were 
+fabricated by transferring monolayer graphene repeatedly. 
+ 
+In order to clarify the quality and layer number of graphene, a series of 
+characterization was done, as shown in Figure 4.7. Figure 4.7a and b are optical 
+118 
+ 
+micrographs of the transferred SLG and MLG on SiO2/Si substrate, respectively. 
+The SLG grown on Cu foil was rather flat except small portion (~ 4%) of bilayer 
+and trilayer graphene domains represented by the dark spots (arrows) in the 
+image (Figure 4.7a). Some wrinkles indicated by the white dashed lines 
+introduced during transfer process were also visible. Contrary to this, Ni-grown 
+MLG showed multi-layered flakes represented by the white spots (arrows) in 
+Figure 4.7b, creating numerous edge planes, as can be visualized in Figure 4.7c. 
+Micro-Raman spectra in Figure 4.7d clearly show G-band near 1590 cm$^{-1}$, 
+which is related to optical $E_{2g}$ phonon at the Brillouin zone center indicating sp$^2$ 
+hybridization of carbon network, and G’-band around 2694 cm$^{-1}$, which is also 
+ 
+known as 2D-band, an overtone of D-band, in both samples [66]. Large G’/G 
+intensity ratio (~ 2) with a small D-band near 1350 cm$^{-1}$, which corresponds to 
+transverse optical phonon near the K point and indicates sp$^3$ hybridization of 
+carbon network, was observed in SLG, indicating high quality monolayer 
+graphene. On the other hand, the intensity ratio of G’/G which is less than one 
+reveals multi-layered properties of Ni-grown graphene. Defect distribution was 
+shown in the images of confocal Raman mapping of D/G intensity ratio in 
+Figure 4.7e and Figure 4.7f. Defects indicated by bright spots were scattered 
+uniformly over the surface, while grain boundary lines were faintly visible in 
+SLG. Small flakes were visible in MLG (Figure 4.7f). Although D-band 
+intensity was barely visible in Figure 4.7d, we clearly observed from D/G band 
+mapping that some defects were distributed in both samples. Transmittance of 
+119 
+ 
+each graphene layer transferred onto PET substrate was provided in Figure 4.7g. 
+The transmittance of SLG was 96.5%, slightly smaller than HOPG value of 
+97.7%, which may be attributed to some portion of multi-layered domains 
+formation as described in Figure 4.7a [67]. Correspondingly, bilayer and trilayer 
+graphene samples revealed a systematic reduction in the transmittance. The Ni-
+grown MLG showed 63.6% of transmittance, corresponding to 15 layers in 
+average by assuming 2.3 % absorption per each layer [68]. Optical photographs 
+were provided to visualize different transmittances with different number of 
+graphene layers in Figure 4.7h.  
+ 
+Figure 4.7. Optical micrographs of (a) Cu-grown SLG and (b) Ni-
+grown MLG on SiO2/Si substrate. White dashed lines indicate 
+wrinkles. Some portion of thicker graphene is indicated by arrows. 
+(c) Schematic of (i) SLG with a well defined basal plane and (ii) 
+edge plane enriched MLG. (d) Micro-Raman spectra of SLG and 
+120 
+ 
+MLG. Confocal Raman mapping of D/G intensity ratio of (e) SLG 
+and (f) MLG from squared positions of (a) and (b). The contrast is 
+normalized to 0.4 to visualize the defect distribution for both 
+images. (g) Wavelength-dependent transmittance (values are 
+provided at a wavelength of 550 nm) and (h) optical photographs of 
+different number of graphene layers on PET substrate. 
+ 
+4.2.4 Anode Performance of a Graphene 
+Electrochemical measurements of different layers of Gr samples were 
+performed with a CR2032 coin cell using VMP3 instrument (BioLogic Science 
+Instruments). The cell was assembled in a dry room using CR 2032 cell case with 
+different number of graphene layers and bare foil (SUS 316) as a working 
+electrode, lithium metal foil as a counter/reference electrode, and a 1 M of LiPF6 
+in a 1:1 (v/v) mixture of ethylene carbonate (EC) and diethyl carbonate (DEC) as 
+an electrolyte. A glassy carbon microfiber was used as a separator. The cells 
+were charged and discharged galvanostatically between 3.0 and 0.01 V at a 
+constant current of 5 µA/cm$^2$. The AC impedance spectra were obtained by 
+applying a sine wave with an amplitude of 10 mV over a frequency range of 100 
+kHz to 10 mHz [69]. Figure 4.8a shows cyclic voltammograms (CV) of different 
+number of graphene layers at a scan rate of 0.1 mV/s from 0.01 V to 3 V. The 
+bare SUS electrode showed an anodic peak near 1.03 V (SO) and a cathodic peak 
+around 0.78 V (SR). These redox peaks involve chemical reactions with Li ions 
+121 
+ 
+and possibly electrolytes. Both anodic and cathodic peaks were reduced in the 
+monolayer graphene electrode. These peaks were reduced consecutively in 
+bilayer and trilayer graphene electrodes. It is obvious to see that the redox 
+reaction of the bare SUS electrode was suppressed by the coated graphene layers. 
+An additional cathodic peak appeared near 0.28 V in bilayer and trilayer samples. 
+Origin of these peaks could be ascribed to defect-associated lithium adsorption 
+[41]. At MLG (15 layer graphenes) sample, a sharp cathodic peak near 0.01 V 
+(LiIn) is identified as lithium intercalation and a rather broad peak near 0.12 V 
+(LiDe) is related to decomposition of graphitic intercalation compound (GIC) 
+stages [58]. It is of note that the bare SUS-related peak was nearly suppressed in 
+this case. Both LiDe and LiIn peaks appeared in this case, in good contrast with 
+FLG samples in which only a clear LiIn peak was observed, suggesting that no 
+GIC stages were formed in FLGs. The distinct CV behavior of FLGs and MLG 
+demonstrates that lithium ion intercalation becomes more effective in MLG 
+induced by the considerable amount of edge planes, as shown in Figure 4.7b. 
+122 
+ 
+ Figure 4.8. (a) Cyclic voltammograms of different number of 
+graphene layers samples at a scan rate of 0.1 mV/s. SUS-related 
+redox reaction peaks (SO, SR) and lithium 
+intercalation/deintercalation related peaks (LiIn/LiDe) are marked in 
+the figure. (b) 1$^{st}$ and (c) 2$^{nd}$ galvanostatic charge/discharge profiles 
+of different number of graphene layers at a current density of 5 
+123 
+ 
+µA/cm$^2$. (d) The related layer-dependent capacities. Two regimes of 
+corrosion-dominant and lithiation-dominant are indicated. 
+ 
+Figure 4.8b shows the 1$^{st}$ galvanostatic charge/discharge profile with a 
+voltage sweeping range of 0.01 ~ 3 V at a constant current of 5 µA/cm$^2$. As the 
+number of graphene layers increased, long tail appeared in the charge curve at 
+low voltage region. At MLG sample, a plateau appeared in the range of 1.25 - 0.6 
+V. In graphitic material, the solid-electrolyte interface (SEI) formation via 
+electrolyte decomposition takes place in the range of less than 1.0 V [43, 68, 70-
+71]. The SEI formation potential varies with types of graphite planes. In general, 
+SEI forms at higher potential in edge plane than in basal plane [72-74]. 
+Therefore, we ascribed this plateau in MLG to edge plane-related SEI formation. 
+In the 2$^{nd}$ cycle, the voltage profile shows a gradual change in a wide range of 
+voltages during charge/discharge, revealing a V-shape curve, i.e., no plateau 
+region, as shown in Figure 4.8c. This is in good contrast with a U-shape curve in 
+graphite electrode, where the edge plane intercalation is dominant in the plateau 
+region of low voltage within 0.1 V [68,75]. Capacities of graphene coated 
+electrodes in Figure 4.8c were consistently smaller than that of the bare electrode, 
+and furthermore much smaller by about 30 times than the recently reported 
+graphene battery result [51]. The huge capacity difference comes from the use of 
+different substrates, as shown in Figure 4.9. 
+124 
+ 
+ Figure 4.9. Cyclic voltammograms at a scan rate of 0.1 mV/s (a) 
+and 2$^{nd}$ galvanostatic charge/discharge profiles (b) at a current 
+density of 5 µA/cm$^2$ of bare CR2032 coin cell case and foil SUS 
+316. 
+ 
+Abundant reaction peaks and larger area of CV curve indicate that more 
+severe corrosion reaction occurs in the case of foil SUS 316 in Figure 4.9a. The 
+capacity indicating substrate corrosion intensity obtained from the cell case in 
+Figure 4.9b shows almost 8 times smaller than that of the SUS 316. This huge 
+capacity difference can be attributed to the corrosion resistive polymer coated on 
+the cell case. The capacity of bare foil SUS (~14 µAh/cm$^2$) is still smaller than 
+the reported value for graphene on Cu substrate (~ 40 µAh/cm$^2$) in Ref. 53, i.e., 
+Cu reaction is much stronger than SUS 316 reaction. Therefore, the relative 
+higher capacity can be understood by the effect of Cu substrate. This also implies 
+125 
+ 
+that in spite of graphene layers coated on the electrode with well defined basal 
+plane, the reaction with electrode did occur inevitably.   
+ 
+The related layer-dependent capacities are summarized in Figure 4.8d. As 
+the number of graphene layers increased, the 1$^{st}$ charge capacity increased rapidly 
+up to trilayer graphene electrode and saturated at the MLG electrode. As 
+described in the schematic of Figure 4.7c, the basal plane is exposed during 
+lithiation up to three layers, whereas both edge plane and basal plane are present 
+in 15 layers. Two different types of SEI are formed: i) basal-plane associated SEI 
+(b-SEI) which is formed up to 3 graphene layers and ii) edge-plane associated 
+SEI (e-SEI) which is formed in MLG sample. It has been known that b-SEI 
+formed at lower potential is associated with solvent reduction, while e-SEI 
+ 
+formed at higher potential is associated with salt ions [72-74, 43]. Since our basal 
+plane contains abundant defect sites, as observed from Figure 4.7d and e, some 
+decomposed solvent molecules may further diffuse into the subjacent layers 
+along with Li ions or in a form of lithium solvation and form additional b-SEI 
+layer. This is why b-SEI increases as the number of graphene layers increases at 
+FLG samples. At MLG electrode, both b-SEI and e-SEI are formed. Although e-
+SEI increases in this case, b-SEI is reduced compared to FLG electrodes due to 
+the decrease of effective basal plane area of 15 layers (See Figure 4.7c) and 
+therefore the capacity from SEI formation is saturated in the 1$^{st}$ charge.  
+ 
+126 
+ 
+    On the other hand, the 1$^{st}$ discharge capacity decreased gradually up to 
+three layer graphene electrode and increased at 15 layer electrode. Similar trend 
+was also observed in the 2$^{nd}$ charge/discharge profile. The discharge capacities of 
+the 2$^{nd}$ cycle were not much different from those of the 1$^{st}$ cycle. Large capacity 
+of the bare SUS electrode was reduced by coating graphene layers up to three 
+layers. This gradual reduction was also expected from the reduced areas of CV 
+curves in FLGs (Figure 4.8a). This implies several facts: i) SUS substrate 
+reaction is systematically suppressed with increasing number of graphene layers 
+ii) Because lithium ions can diffuse through basal plane of graphene, monolayer 
+graphene is not sufficient to prohibit substrate reaction. Since the pure basal 
+plane presumably does not allow Li diffusion, the diffusion may be provoked 
+through some defect sites that exist on the graphene plane, as observed from the 
+D/G intensity ratio of confocal Raman mapping in Figure 4.7e. This will be 
+described later in detail. In FLG samples, if we presume capacity only to be 
+contributed from intercalation (0.028 μAh/cm$^2$ per interlayer in the case of LiC$_6$), 
+the intercalation capacity reaches 0.056 μAh/cm$^2$ at trilayer graphene sample. 
+This value is negligible compared to the capacity (0.73 μAh/cm$^2$) observed in our 
+experiment. This tells us that even if intercalation of lithium ions was invoked, 
+the observation was still obscured by the dominant SUS redox reaction. By 
+noting a linear decrease of the capacity and hence extrapolating to a minimum 
+capacity, lc to sufficiently prohibit the SUS redox reaction is predicted to be ~ 6 
+127 
+ 
+layers. As the number of graphene layers increases, the capacity from the SUS 
+redox reaction decreases, while the capacity reduction will be compensated by 
+the intercalation capacity between graphene layers. After 6 layers, the capacity 
+starts increasing by the pure intercalation. We can define substrate corrosion-
+dominant region up to 6 layers and lithiation-dominant region after 6 layers, as 
+visualized in Figure 4.8d.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 4.10. AC impedance spectra obtained by applying a sine 
+wave with an amplitude of 10 mV over a frequency range from 100 
+kHz to 10 mHz. The inset shows impedance at higher frequency 
+region to demonstrate charge transfer resistance. 
+128 
+ 
+In order to get the complete image of substrate-related corrosion behavior, 
+we performed AC impedance measurement to 6 layers of graphene in the full 
+frequency range of 100 kHz to 10 mHz by applying a sine wave with an 
+amplitude of 10 mV, as shown in Figure 4.10. All of the impedance spectra 
+consisted of a depressed semicircle in higher frequency (Figure 4.10 inset) and a 
+straight line with different angles to the real axis in the lower frequency range. 
+The depressed semicircle usually can be deconvoluted into two semicircles, 
+resulting from SEI formation and charge transportation. Since this measurement 
+was carried out without any charge/discharge test, the formation of the SEI 
+would be minimized. Therefore, the main contribution of this semicircle could be 
+attributed to the charge transport. The charge transport resistances of graphene-
+coated samples were obviously larger than that of bare SUS coin cell case which 
+can be indicated by the increased diameters of semicircles. Smaller angles of 
+graphene electrodes than SUS electrode in the straight line region again 
+demonstrated difficulty of lithium ion diffusion into graphene electrodes. All of 
+these proved that graphene can be a good protective layer by limiting the ion 
+diffusion process at the SUS/graphene interface. Especially, at six layers of 
+graphene electrode, the charge transport resistance is largest and the angle of 
+straight line is smallest compared to the electrodes coated with one, two, and 
+three layers of graphene. This is because further overlapping of larger area 
+129 
+ 
+graphene can further minimize lithium ion diffusion which will provide much 
+better protective ability compared to less number of graphene layers.  
+ 
+Figure 4.11. Theoretically estimated capacity based on LiC6 
+intercalation. No absorption of Li ions occurs at monolayer 
+graphene. 
+The theoretically estimated capacity at 15 layers (or effectively 9 layers, see 
+Figure 4.11), is 0.2 μAh/cm$^2$. However, this value is still far smaller than the 
+observed value of 1.30 μAh/cm$^2$. This extra capacity could be ascribed to the 
+lithium adsorption on defects of the graphene surface, which can be supported by 
+the widely distributed defects observed from confocal Raman mapping in our 
+experiments (Figure 4.7f). In the 2$^{nd}$ cycle, the discharge capacity was smaller 
+130 
+ 
+than the charge capacity consistently, nearly independent of the thickness of 
+graphene layers. This difference of 0.35 μAh/cm$^2$ in the charge/discharge 
+capacity is irreversible capacity and can be ascribed to strongly adsorbed lithium 
+ions on defects such as vacancies or grain boundaries formed on the graphene 
+layers. This will be discussed in the theory section later.  
+ 
+Since defects on graphene basal plane seem to play an important role in 
+lithium diffusion, a systematic study is required for comprehensive analysis. 
+Thus, structural defects of graphene were created by Ar$^+$ bombardment with 
+different plasma powers (15W, 100W) for one minute. The transferred graphene 
+was brought into vacuum chamber with a base pressure of $1 \times 10^{-6}$ Torr and then 
+filled with Ar gas of 100 sccm for a minute, followed by the plasma ignition. 
+This was repeated layer by layer to obtain Ar$^+$ plasma-treated FLG samples. 
+Figure 4.12a shows Raman spectra of Ar plasma-treated monolayer graphene. At 
+15 W plasma power, D/G intensity ratio was increased to 0.56 from 0.19 in no 
+plasma-treated pristine graphene, implying structural defect formation in the 
+graphene plane. At 100 W, one additional peak near 1620 cm$^{-1}$ (D’) appeared in 
+addition to further increase of D-band intensity (D/G intensity ratio is 1.66), 
+indicating plausible formation of structural defects. No peak splitting of G-band 
+into G$^+$ and G$^-$ peaks indicates that our process does not involve strain-induced 
+effect. Figure 4.12b shows CV diagrams for SLG electrode with different 
+plasma powers at a scan rate of 0.1 mV/s. It is obvious to see that the redox 
+131 
+ 
+reaction peak intensities of SO and SR related peaks were enhanced and the 
+related peak positions were also shifted after plasma treatment. Those peaks are a 
+combination of defect-associated adsorption and SUS substrate reaction, as 
+mentioned in Figure 4.8a. Additional redox reaction due to the generated basal 
+plane defects by plasma treatment is provoked. Since the protective layer is 
+monolayer graphene, extra lithium ions adsorbed on defects could easily reach 
+the SUS substrate, thus increasing the substrate redox reaction. The 2$^{nd}$ 
+galvanostatic charge/discharge capacity of SLG increased accordingly compared 
+to the pristine graphene sample, as shown in Figure 4.12c. The enhanced 
+capacity was attributed to the increased adsorption of Li ions on defects and 
+increased substrate reaction, as mentioned in Figure 4.12b. The 2$^{nd}$ charge 
+capacity kept increasing with increasing plasma power, independent of the 
+number of graphene layers, as summarized in Figure 4.12d. The substrate redox 
+reaction was also suppressed, which is identified by the capacity decrease with 
+increasing number of graphene layers similar to that of pristine graphene samples.  
+ 
+Smaller capacity was increased in FLG electrodes compared to that of SLG 
+after plasma treatment and generated different slopes, as shown in Figure 4.12d. 
+The absolute slope increased from 0.26 to 0.56 with increasing the plasma power. 
+Extrapolation of these slopes, which determines the critical layer thickness to 
+prohibit substrate reaction, gave rise to lc of ~ 6 layers independent of the plasma 
+power, i.e., defect population. This is rather surprising, because creation of more 
+132 
+ 
+defects in the basal plane is expected to increase basal-plane diffusion of Li ions 
+which will eventually increase substrate redox reaction (See Figure 4.12b, c) and 
+thereby larger critical layer thickness should be required after strong plasma 
+treatment. In order to explain this contradictory phenomenon, a schematic of Li 
+diffusion through defects in the basal plane is provided in Figure 4.12e. In the 
+case of SLG, Li ion diffusion is allowed through defect sites and no lateral 
+diffusion limitation is expected, since the graphene layer is fully surrounded by 
+Li ions in electrolyte. Therefore, higher defect population will enhance Li ion 
+adsorption and also substrate reaction. In the case of FLGs where large area basal 
+plane is dominant, graphene layers are overlapped with each other so that Li ions 
+will diffuse through defects perpendicular to the plane of top layer first and 
+diffuse along the plane of subjacent graphene layer until they meet another defect 
+site. Since these Li ions may accumulate near the defect sites generated by Ar 
+plasma, Li diffusion along the plane direction will be limited by the steric 
+hindrance from aggregated Li atoms, which is different from the SLG case. 
+Therefore further Li diffusion through graphene basal planes in FLGs is 
+constrained severely by the lateral diffusion at higher defect density. Thus, when 
+FLGs are used as a protective layer, the defects-related lithium adsorption on 
+subjacent graphene layers and actual lithium ion reaction with substrate are 
+suppressed, which is again consistent with the reduction of the 
+peaks in CV diagram. As a consequence of these phenomena, the critical layer 
+133 
+ 
+thickness gives rise to the same value, independent of the defect population. It 
+will be worth mentioning the possibility of forming oxygen-related functional 
+groups on defect sites. Li ions can be also adsorbed on such sites and thus our 
+argument of lateral diffusion suppression by the steric hindrance is still valid.  
+ 
+ 
+ 
+ 
+134 
+ 
+Figure 4.12. (a) Raman spectra, (b) cyclic voltammograms at a scan 
+rate of 0.1 mV/s, and (c) 2$^{nd}$ galvanostatic charge/discharge 
+profiles at a current density of 5 µA/cm$^2$ for monolayer graphene 
+treated by Ar plasma with different plasma powers (15 W and 100 
+W). (d) Capacity of 2$^{nd}$ charge as a function of number of 
+graphene layers under different Ar plasma powers. Absolute slopes 
+according to different plasma powers and critical layer thickness (lc) 
+are indicated in the figure. (e) Schematics of proposed Li diffusion 
+mechanism through defects on the basal plane with different defect 
+population. Broad down arrows indicate Li ion diffusion through 
+defect sites of basal plane. Red glows represent steric hindrance for 
+Li ion diffusion formed by the accumulated Li ions or functional 
+groups. The inset in the right indicates the relative magnitude of 
+diffusion coefficient. (f) Relationship of D/G ratio with the 
+extracted slope from (d). 
+ 
+It is intriguing to see the relationship between D/G intensity ratio from 
+Raman spectra and the slope extracted from charge/discharge profiles, as shown 
+in Figure 4.12f. The slope which indicates Li diffusion through graphene layers 
+is correlated to the population of defects in the graphene plane. The larger slope 
+implies the slower diffusion rate and vice versa. Li ion diffusion is limited by the 
+Li aggregates adsorbed on the increased defect sites described in the schematic 
+135 
+ 
+Figure 4.12e. Thus, information of Li diffusion obtained from electrochemical 
+test could be used as a metric for evaluating the graphene crystallinity, an 
+important material parameter of graphene.  
+ 
+In order to understand what type of defects allows Li ion diffusion through 
+basal plane of graphene, we conducted density functional theory calculations for 
+various defects: ideal hexagonal site (H site), Stone-Wales defect (SW), 
+monovacancy (V1), and divacancy (V2). The density functional theory 
+calculations were performed within generalized gradient approximation as 
+implemented in DMol3 code. All electron Kohn-Sham wave functions were 
+expanded in a local atomic orbital basis set with each basis function defined 
+numerically on an atomic centered spherical mesh. A double numeric polarized 
+basis sets (DNP) were used for all elements. The dangling bonds of graphene 
+edge were saturated by hydrogen atoms and the atomic cluster structure which 
+consists of 120 carbon atoms and 48 hydrogen atoms was relaxed fully until the 
+force on each atom is less than $10^{-4}$ eV/Å and the total energy change is less than 
+$5 \times 10^{-5}$ eV. The damped atom-pairwise dispersion corrections of the form $C_6R^{-6}$ 
+were also considered for calculations. Li adsorption energy was calculated by 
+$E_{ad}(\mathrm{Li}) = E_{tot}(\mathrm{Li+carbon}) - E_{tot}(\mathrm{Li}) - E_{tot}(\mathrm{carbon})$, where $E_{tot}(\mathrm{Li})$ is the self energy 
+of lithium atom and $E_{tot}(\mathrm{carbon})$ is the total energy of carbon system. Various 
+local charges were also calculated using Mulliken, Hirshfeld, and electrostatic 
+potential (ESP).  
+136 
+ 
+  
+ 
+ 
+137 
+ 
+Figure 4.13. Side and top views of atomic configurations (top 
+panel), isosurface images of electrostatic potential (second panel), 
+bond lengths and local charge distributions at the barrier states 
+(third panel), and the diffusion barrier profiles of Li (bottom panel) 
+through (a) graphene hexagonal site (H site), (b) Stone-Wales (SW) 
+defect (c) monovacancy (V1), and (d) divacancy (V2). Isovalue for 
+rendering isosurfaces is 0.25 e/Å$^3$. The insets in the third panel 
+show isosurface image of electrostatic potential for each 
+corresponding structure without Li ion. Bond lengths (yellow color) 
+and electrostatic potential charges (white color) are in units of Å 
+and electrons, respectively. 
+ 
+Li atom adsorbs on the H site with a bond length of 2.35 Å above the 
+graphene plane and with an adsorption energy of -1.69 eV, as shown in the upper 
+panel of Figure 4.13a and Table 4.1. Li ESP charge at H site is partially depleted 
+to 0.62 e. The ESP charge of Li atom at barrier state is 0.28 e, much less 
+compared to that at the binding site. This charge difference between adsorption 
+and barrier state is an important variable in determining the Coulomb interaction 
+energy. As the Li approaches to the barrier site, the available space for Li is 
+narrow with a short separation distance of 1.52 Å, invoking severe charge 
+overlapping between Li and adjacent carbon atoms, as can be seen in the 
+electrostatic potential contour in the second panel of Figure 4.13a. This increases 
+138 
+ 
+repulsive forces, giving rise to large diffusion barrier height of 10.2 eV, similar to 
+the previous report (Table 4.1) validating our approaches. Similar situation takes 
+place in the SW defect which is abundant in the graphene grain boundary. The Li 
+adsorption energy near the heptagon is -1.94 eV, slightly stronger than that of H 
+site. Although the charge overlapping is still severe, a longer separation distance 
+of 1.60 Å and also much less charge difference between adsorption and barrier 
+state (0.04 e) forms a relatively smaller activation barrier height of 6.35 eV than 
+that of H site, as shown in Figure 4.13b. In the case of V1, Li adsorbs at the 
+vacancy site with an adsorption energy of -3.12 eV, keeping closer distance (2.03 
+Å), as shown in the top panel of Figure 4.13c. The excess charge difference of Li 
+atom between adsorption and barrier site is 0.18 e and the closest separation 
+distance at the barrier site is 1.36 Å. Charges are distributed not only on the Li 
+and carbon sites but also between them, implying both covalent bonding and 
+ionic bonding characters due to charge depletion from Li atom. This produces a 
+large diffusion barrier height of 8.86 eV. On the other hand, V2 provides a rather 
+large open space with an adsorption energy of -2.36 eV near the middle of the 
+two dimers (top panel of Figure 4.13d) such that a large separation distance of 
+2.90 Å is maintained. This gives minimized electrostatic charge overlapping and 
+a large bond length of 1.83 Å at the barrier state, i.e., steric hindrance is 
+minimized, as shown in the second and third panels in Figure 4.13d. The charge 
+difference between the adsorption and the barrier states is 0.04 e. All of these 
+factors induced a smallest diffusion barrier height (2.36 eV) among the defects 
+139 
+ 
+we studied. This barrier height can be overcome under the typical charging 
+conditions of the battery. 
+ 
+4.3 Summary of Chapter Four 
+We have studied lithium diffusion pathways with two types of graphene 
+samples prepared by CVD; i) well-defined basal plane graphene grown on Cu 
+foil and ii) edge plane-enriched graphene layers grown on Ni film. We have 
+discovered that electrochemical reaction of electrode (substrate/graphene) not 
+only is related to the number of graphene layers but also relies on the defect sites 
+on the basal plane of graphene. The experimental and calculated results related to 
+the specific type of defects such as divacancies and higher order defects that can 
+assist lithium ion diffusion through basal plane could help us in designing high 
+capacity and highly conductive corrosion-free electrode for lithium ion battery. It 
+would be reasonable to expect that substrate protective nature of few-layer 
+graphenes could be the basis of further investigation of preparing original 
+substrate which remains unaltered properties and has longer lifetime under severe 
+electrochemical corrosion conditions for battery. Furthermore, by correlating the 
+lithium diffusion in graphene layers to the D/G intensity ratio from Raman 
+spectra, we developed a way of predicting the graphene crystallinity from 
+electrochemical method.  
+140 
+ 
+Bibliography of Chapter Four 
+[1] K.S. Novoselov, et al., Science 2004, 306, 666.  
+[2] Y.B. Zhang, Y.W. Tan, H.L. Stormer, P. Kim, Nature 2005, 438, 201. 
+[3] A. Altland, Phys. Rev. Lett. 2006, 97, 236802. 
+[4] D. Chen, L.H. Tang, J.H. Li, Chem. Soc. Rev. 2010, 39, 3157. 
+[5] D.A.C. Brownson, D.K. Kampouris, J. Power Sources 2011, 196, 4873. 
+[6] M. Pumera, En. Env. Sci. 2011, 4, 668. 
+[7] P. Lian, et al., Electrochimica Acta 2010, 55, 3909. 
+[8] A.K. Geim, K.S. Novoselov, Nat. Mater. 2007, 6, 183. 
+[9] M.S. Fuhrer, C.N. Lau, A. H. MacDonald, MRS Bull. 2010, 35, 289. 
+[10] A. K. Geim, K. S. Novoselov, Nature Mater. 2007, 6, 183. 
+[11] G. W. Semenoff, Phys. Rev. Lett. 1984, 53, 5449. 
+[12] V. P. Gusynin, S. G. Sharapov, Phys. Rev. Lett. 2005, 95, 146801. 
+[13] N. M. R. Peres, A. H. Castro Neto, F. Guinea, Phys. Rev. B 2006, 73, 
+195411. 
+[14] K. S. Novoselov, A. K. Geim, S. V. Morozov, D. Jiang, M. I. Katsnelson, 
+I. V. Grigorieva, S. V. Dubonos, A. A. Firsov, Nature 2005, 438, 197. 
+[15] Y. Zhang, Y.-W. Tan, H. L. Stormer, P. Kim, Nature 2005, 438, 201. 
+[16] K. S. Novoselov, Z. Jiang, Y. Zhang, S. V. Morozov, H. L. Stormer, U. 
+Zeitler, J. C. Maan, G. S. Boebinger, P. Kim, A. K. Geim, Science 2007, 
+315, 1379. 
+[17] J.-C. Charlier, P. C. Eklund, J. Zhu, A. C. Ferrari, Ed. Jorio, A., G. 
+141 
+ 
+Dresselhaus, M. S. Dresselhaus, Berlin/Heidelberg: Springer-Verlag, 
+2008. 
+[18] Ph.D. Thesis, Dr. Vladimiras Gavriusinas, Faculty of Physics, Vilnius 
+University, Lithuania, 2008. 
+[19] A. H. C. Neto, F. Guinea, N. M. R. Peres, K. S. Novoselov, A. K. Geim, 
+Rev. Mod. Phys. 2009, 81, 109. 
+[20] C. Lee, X. D. Wei, J. W. Kysar, J. Hone, Science 2008, 321, 385. 
+[21] V. M. Pereira, A.H. Neto, 2008, arXiv:0810.4539v1. 
+[22] A. A. Balandin, S. Ghosh, W. Bao, I. Calizo, D. Teweldebrhan, F. Miao,  
+C. N. Lau, Nano Lett. 2008, 8, 902. 
+[23] R. R. Nair,  P. Blake,  A. N. Grigorenko, K. S. Novoselov,  T. J. 
+Booth,  T. Stauber,  N. M. R. Peres, A. K. Geim, Science 2008, 
+320, 1308. 
+[24] U. Kürüm, O. Ö. Ekiz; H. G. Yaglioglu, A. Elmali,  M. Ürel, H. Güner, 
+A. K. Mızrak,  B. Ortaç, A. Dâna, Appl. Phys. Lett. 2011, 98, 141103. 
+[25] Q. Bao, H. Zhang, Y. Wang, Z. Ni, Y. Yan, Z. X. Shen, K. P. Loh, D. Y. 
+Tang, Adv. Funct. Mater. 2009, 19, 3077. 
+[26] K. S. Novoselov, A. K. Geim, S. V. Morozov, D. Jiang,  Y. Zhang, S. V. 
+Dubonos, I. V. Grigorieva, A. A. Firsov, Science 2004, 306, 666.  
+[27] P. Sutter, Nat. Mater. 2009, 8, 171. 
+[28] P. W. Sutter, J.-I. Flege, E. A. Sutter, Nat. Mater. 2008, 7, 406. 
+[29] I. Pletikosić, M. Kralj,  P. Pervan,  R. Brako,  J. Coraux, A. T.   
+N’Diaye,   C. Busse, T. Michely, Phys. Rev. Lett. 2009, 102, 056808. 
+142 
+ 
+[30] M. Eizenberg, J. M. Blakely, Surf. Sci. 1970, 82, 228. 
+[31] A. Reina, X. Jia, J. Ho, D. Nezich, H. Son, V. Bulovic, M. S. 
+Dresselhaus, J. Kong, Nano Lett. 2009, 9, 30. 
+[32] K.S. Kim, Y. Zhao, H. Jang, S.Y. Lee, J.M. Kim, J.H. Ahn, P. Kim, J.Y. 
+Choi, B.H. Hong, Nature 2009, 457, 706. 
+[33] F. Güneş, G. H. Han, K. K. Kim, E. S. Kim, S. J. Chae, M. H. Park, H.-K. 
+Jeong, S. C. Lim, Y. H. Lee, Nano 2009, 4, 83. 
+[34] X. Li, W. Cai,  J. An,  S. Kim,  J. Nah,  D. Yang,  R. Piner, A. 
+Velamakanni,  I. Jung, E. Tutuc, S. K. Banerjee, L. Colombo,  R. S. 
+Ruoff, Science 2009, 324, 1312. 
+[35] H. P. Boehm, A. Clauss, G. O. Fischer, U. Hofmann, Zeitschrift für 
+anorganische und allgemeine Chemie 1962, 316, 119. 
+[36] X. Gao, J. Jang, S. Nagase, J. Phys. Chem. C 2010, 114, 832. 
+[37] M.Winter, O. J.Besenhard, E. M. Spahr, P. Novák, Adv. Mater. 1998, 10, 
+725. 
+[38] M.Winter, P. Novák, A. Monnierb, J. Electrochem. Soc. 1998, 145, 428.  
+[39] D. Bar-Tow, E. Peled, L. Bursteinb, J. Electrochem. Soc. 1999, 146, 824. 
+[40] Y. Ren, R. A. Armstrong, F. Jiao, G. P. Bruce, J. Am. Chem. Soc. 2010, 
+132, 996. 
+[41] T. Tran, K. Kinoshita, J. Electroanal. Chem. 1995, 386, 221. 
+[42] K. Persson, A. V. Sethuraman, J. L. Hardwick, Y. Hinuma, S. Y. Meng,  
+A. Ven, V. Srinivasan, R. Kostecki, G. Ceder, Phys. Chem. Lett. 2010, 1, 
+1176.  
+143 
+ 
+[43] Meyer, S. Passerini, M. Winter, J. Power Sources 2012, 200, 83. 
+[44] B. Jungblut, E. Hoinkis, Phys. Rev. B 1989, 40, 10810. 
+[45] Y. Yamada, K. Miyazaki, T. Abe, Langmuir 2010, 26(18), 14990. 
+[46] J. M. Tarascon, D.G. Guyomard, Extended Abstracts, Spring Meeting of  
+the Electrochemical Society, May 16-21, 1993, 93-1, Honolulu, HI, no. 
+69. 
+[47] T. Takamura, K. Endob, L. Fuc, Y. Wu, K. J. Lee, T. Matsumoto, 
+Electrochim. Acta, 2007, 53, 1055. 
+[48] X. S. Li, W. W. Cai, J. H. An, S. Kim, J. Nah, D. X. Yang, R. D. Piner,  
+A.Velamakanni, I. Jung, E. Tutuc, S. K. Banerjee, L. Colombo, R. S.     
+Ruoff, Science 2009, 324, 1312. 
+[49] C. Biswas, Y. H. Lee, Adv. Func. Mater. 2011, 21, 3806. 
+[50] W. J. Yu, S. H. Chae, S. Y. Lee, D. L. Duong, Y. H. Lee, Adv. Mater. 
+2011, 23(16), 1889. 
+[51] A. L. M. Reddy, A. Srivastava, R. S. Gowda, H. Gullapalli, M. Dubey, 
+M. P. Ajayan, ACS Nano 2010, 4, 6337. 
+[52] J. Vetter, P. Novák, M.R. Wagner, C. Veit, K.- C. Möller, J.O. Besenhard, 
+M. Winter, M. Wohlfahrt-Mehrens, C. Vogler, A. Hammouche, J. Power 
+Sources 2005, 147, 269. 
+[53] P. Arora, E. R. White, J. Electrochem. Soc. 1998, 145, 3647. 
+[54] T. Wijesinghe, D. Blackwood, Corrosion Science 2007, 49, 1755. 
+[55] S. Kadry, European. J. Scientific Research 2008, 22, 508. 
+[56] C.T. Hyams, J. Go, M.T. Devinea, J. Electrochem. Soc. 2007, 154, C390. 
+144 
+ 
+[57] S.-W. Song, J. T. Richardson, V. G. Zhuang, M. T. Devine, W. J. Evans,  
+Electrochim. Acta 2004, 49, 1483. 
+[58] X. Zhang, B. Winget, M. Doeff, W. J. Evans, M. T. Devine, J.  
+Electrochem. Soc. 2005, 152, B448. 
+[59] E. Pollak, B. Geng, K.-J. Jeon, T. I. Lucas, J. T. Richardson, F. Wang, R.  
+Kostecki, Nano Lett. 2010, 10, 3386. 
+[60] A. L. M. Reddy, A. Srivastava, R. S. Gowda, H. Gullapalli, M. Dubey, 
+M. P. Ajayan, ACS Nano 2010, 4, 6337. 
+[61] S. Chen, L. Brown, M. Levendorf, W. W. Cai, S.-Y. Ju, J. Edgeworth,  
+X. Li, C. Magnuson, A. Velamakanni, D. R. Piner, J. Kang, J. Park, S. R. 
+Ruoff, ACS Nano 2011, 5, 1321. 
+[62] D. Prasai, J. C. Tuberquia, R. R. Harl, G. K. Jennings, K. I. Bolotin, ACS 
+Nano 2012, 6 (2), 1102. 
+[63] G. H. Han, F. Güneş, J. J. Bae, E. S. Kim, S. J. Chae, H.-J. Shin, J.-Y. Choi, D. 
+Pribat, Y. H. Lee, Nano Lett. 2011, 11, 4144. 
+[64] S. J. Chae, F. Güneş, K. K. Kim, E. S. Kim, G. H. Han, S. M. Kim, H.-J.  
+Shin, S.- M. Yoon, J.-Y. Choi, M. H. Park, C. W. Yang, D. Pribat, Y. H. 
+Lee, Adv. Mater. 2009, 19(16), 2553. 
+[65] F. Güneş, G. H. Han, H.-J. Shin, S. Y. Lee, M. Jin, D. L. Duong, S. J. 
+Chae, E. S. Kim, F. Yao, A. Benayad, J.-Y. Choi, Y. H. Lee, Nano 2011, 
+6, 409. 
+[66] C. Casiraghi, S. Pisana, K. S. Novoselov, A. K. Geim, A. C. Ferrari, 
+Appl. Phys. Lett. 2007, 91, 233108. 
+145 
+ 
+[67] R. R. Nair, P. Blake, A. N. Grigorenko, K. S. Novoselov, T. J. Booth, T. 
+Stauber, N. M. R. Peres, A. K. Geim, Science 2008, 320, 1308. 
+[68] E.J. Yoo, J. Kim, E. Hosono, H. S. Zhou, T. Kudo, I. Hunma, Nano  
+Lett. 2008, 8, 2277. 
+[69] J. P. Perdew, K. Burke, M. Ernzerhof, Phys. Rev. Lett. 1996, 77, 3865. 
+[70] Li, X.; Geng, D.; Zhang, Y.; Meng, X.; Li, R.; Su, X. Electrochem. 
+Commun. 2011, 13, 822. 
+[71] P.G. Bruce, B. Scrosati, J.-M. Tarascon, Angew. Chem. Int. Ed. 
+2008, 47, 2930. 
+[72] J. Yan, J. Zhang, Y.C. Su, X. G. Zhang, B. Xia, J. Electrochim. Acta.  
+2010, 55, 1785. 
+[74] K. N. Kudin, B. Ozbas, H. C. Schniepp, R. K. Prud’homme, I. A.  
+Aksay, R. Car, Nano Lett. 2008, 8, 36. 
+[75] T. M. G. Mohiuddin, A. Lombardo, R. R. Nair, A. Bonetti, G. Savini, R. 
+Jalil, N. Bonini, D. M. Basko, C. Galiotis, N. Marzari, K. S. Novoselov, 
+A. K. Geim, A. C. Ferrari, Phys. Rev. B 2009, 79, 205433. 
+ 
+146 
+ 
+SUMMARY 
+ 
+Carbon-Based Nanomaterials as an Anode for Lithium Ion 
+Battery 
+The improvement of the capacity of raw CNF mat has been realized in the 
+current research through electrochemical deposition of Si. The Si/CNF mat 
+prevents the use of metal substrate, binder, and conducting polymers. However, 
+several drawbacks of the current free-standing Si/CNF mat structure need to be 
+mentioned: (i) The as-fabricated CNF mat exhibited a rather low conductivity 
+compared to that of CNTs, which could be the reason for the original low capacity 
+(< 300 mAh/g) of the raw CNF mat. (ii) The flexibility of the as-fabricated CNF mat 
+decreases after high temperature annealing, which hinders further investigation 
+for flexible anode applications. These two factors can be further improved by the 
+incorporation of CNTs, graphene flakes or other more advanced materials. (iii) 
+Although the interfacial binding strength of Si and CNF was improved by the 
+formation of Si-C bond through annealing as discussed in the context, structural 
+pulverization of deposited Si film induced by the large volume expansion during 
+charge/discharge was still observed in the current structure. Therefore, increasing 
+the Si anchoring sites on the CNF mat by the surface functionalization and 
+enhancing the degree of entanglement through the introduction of CNTs could 
+provide better structure stability. The optimization to improve composite 
+147 
+ 
+structures for capacity, charge transfer, and cycle life is further required for 
+industry applications. 
+ 
+On the other hand, in order to clarify the Li diffusion pathways through the 
+graphene plane and the role of defects in Li diffusion, and so to unravel the Li-
+C system, graphene was used as a medium for the study of this fundamental 
+science of diffusion in this work. We found that the electrochemical performance 
+of few-layer graphenes which are overlapped up to three layers of single layer 
+graphene is strongly affected by the substrate reaction. Experimental results 
+showed that 6 layers of basal plane-enriched large area graphene were needed to 
+provide sufficient substrate protection from severe electrolyte attack. Li diffusion 
+across the pure basal plane of graphene is strongly limited and nevertheless non-
+negligible diffusion is still allowed, suggesting possible diffusion through defects 
+that might be formed on the graphene plane. Combining the experimental results 
+and density functional theory calculations, we found that divacancies and higher 
+order defects can be shortcuts for lithium ion diffusion with respect to the 
+graphene basal plane. Further exploration of high energy density and long 
+lifetime anode by fabricating high capacity materials on graphene could be an 
+interesting research direction in the future. 
+ 
+Key Words:  nanocarbon materials, lithium ion battery, carbon nanofiber, silicon,  
+            Graphene 
+148 
+ 
+CURRICULUM VITAE 
+ 
+FEI YAO 
+ 
+LPICM-École Polytechnique, CNRS (UMR 7647)  
+Laboratoire de Physique des Interfaces et Couches Minces 
+Route de Saclay; 91128 PALAISEAU Cedex, France 
+ 
+IBS Center for Integrated Nanostructure Physics, Institute for Basic Science, Department of 
+Energy Science, Sungkyunkwan University 
+Room 85689, Corporate Collaboration Center, 300 Cheoncheon-dong, Jangan-gu, Suwon, 
+Gyeonggi-do 440-746, Korea · 82-31-299-6509 ·  
+Mobile: +82-10-2757-1299  
+E-mail: apaperyao@gmail.com, yaofei@skku.edu 
+ 
+ 
+Education 
+______________________________________________________ 
+ 
+  
+2010.08 ~           Ph.D. candidate 
+LPICM-École Polytechnique 
+Laboratoire de Physique des Interfaces et Couches Minces, 
+Route de Saclay; 91128 PALAISEAU Cedex , France; 
+ 
+ 
+IBS Center for Integrated Nanostructure Physics, Institute for 
+Basic Science, Department of Energy Science, 
+Sungkyunkwan University, 
+Korea. 
+Advisor:  Professor Young Hee Lee 
+ 
+         Dr. Costel-Sorin Cojocaru 
+  
+2008.03 ~ 2010.08    M.S.   
+Sungkyunkwan Advanced Institute of Nanotechnology 
+ Sungkyunkwan University 
+Korea. 
+ Advisor:  Professor Young Hee Lee 
+149 
+ 
+2003.09~2007.09     B.S.   
+Department of Electronic Information Engineering 
+ Shandong Normal University 
+China. 
+ 
+ 
+ 
+RESEARCH EXPERIENCE 
+_____________________________________________________________________ 
+ 
+1. CNT gas sensor fabrication 
+- Enhancement of sensitivity to NO2, SO2, NH3 gases etc. 
+- Selectivity among NO2, SO2, NH3 gases etc. 
+2. Dispersion of SWCNTs / MWCNTs  
+- In water with surfactant (SDS, NaDDBS etc) 
+- In organic solution (NMP, DCE etc) 
+3. Synthesis of graphene and carbon nanotubes by chemical vapor deposition 
+- Large-area few-layer graphene synthesis on metal substrates (Ni, Cu), etching & 
+transfer onto desired substrates (SiO2, PET etc.) 
+- Large-area monolayer graphene growth on Cu foil, etching & transfer processes 
+- Synthesis of SWCNTs network and MWCNTs by chemical vapor deposition 
+4. Doping of graphene for electrode applications 
+    - P-type doping by metal-salts and acid solutions for enhancement of conductivity 
+for flexible transparent conducting film applications  
+  - Multiple-layered graphene film preparation and investigation of conductivity 
+enhancement by Layer-by-Layer (LBL) doping 
+5. Carbon nanofiber fabrication using electrospinning method for energy application 
+- Carbon nanofibers with CNT composite  
+- Carbon nanofiber with Si composite 
+6. Si-based material synthesis and energy storage applications 
+- Si thin film deposition by PECVD for energy application (lithium ion battery, 
+solar cell) 
+- Si nanoparticle deposition by electrochemical method for battery application. 
+7. Fuel cell application with carbon-based materials 
+ 
+ 
+ 
+ 
+150 
+ 
+EQUIPMENT 
+_____________________________________________________________________ 
+ 
+- Plasma enhanced CVD, Thermal CVD, Atmospheric pressure CVD 
+- E-beam and thermal evaporator 
+- Magnetron sputter 
+- Micro Raman and confocal Raman spectroscopy 
+- High resolution scanning electron microscope (HR-SEM) 
+- Atomic force microscope (AFM) 
+- UV-NIR absorption spectroscopy 
+- Potentiostat /Galvanostat equipment 
+- Spray equipment 
+- Electrospinning equipment 
+ 
+ 
+ 
+PUBLICATIONS (SCI journal) 
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 
+ 
+12. Fethullah Gunes ,⃰  Fei Yao ,⃰  Hongyan Yue, Hung T. Nguyen, Bing Li, and Young 
+Hee Lee, 'A direct synthesis of Si-nanowires on a 3D porous graphene as high 
+performance anode material for Li-ion batteries', 2013, submitted. 
+ 
+11. M. Jin, Fei Yao, J. Chang, and Y. H. Lee, 'Graphene sheets as anode materials with 
+super high rate and large capacity for Lithium ion batteries' 2013, in preparation. 
+ 
+10. Jian Chang, Meihua Jin, Fei Yao, and Young Hee Lee, 'Asymmetric Supercapacitors 
+Based on Graphene/MnO2 Nanospheres and Graphene/MoO3 Nanosheets with High 
+Energy Density ' 2013, Adv. Func. Mater., accepted. 
+ 
+9. Seung Mi Lee, Fei Yao, and Young Hee Lee, 'Lithium ion diffusion through basal 
+plane of graphene: A density functional theory study' 2013, J. Nanoscience and 
+nanotechnology, submitted. 
+ 
+8. Fei Yao, Bing Li, Fethullah Gunes, Costel Sorin Cojocaru, and Young Hee Lee, 'Silicon 
+and carbon nanofiber composite as an anode material for lithium ion battery' 2013, 
+Nanoscale, submitted. 
+ 
+151 
+ 
+    
+7. Thuc Hue Ly, Dinh Loc Duong, Quang Huy Ta, Fei Yao, Quoc An Vu, Hye Yun Jeong,
+Sang Hoon Chae, and Young Hee Lee, 'Nondestructive Characterization of Graphene 
+Defects' 2013, Adv. Func. Mater, accepted. 
+ 
+6. Fei Yao, Fethullah Gunes, Huy Quang Ta, Seung Mi Lee, Seung Jin Chae, Kyeu 
+Yoon Sheem, Costel Sorin Cojocaru, Si Shen Xie, and Young Hee Lee, 'Diffusion 
+Mechanism of Lithium Ion through Basal Plane of Layered Graphene', J. Am. Chem. 
+Soc., 134(20), 8646-8654, (May 23, 2012). 
+ 
+5. Hung T. Nguyen, Fei Yao, Mihai R. Zamfir, Chandan Biswas, Kang Pyo So, Young 
+Hee Lee, Seong Min Kim, Seung Nam Cha, Jong Min Kim, Didier Pribat, 'Highly 
+Interconnected Si Nanowires for Improved Stability Li-Ion Battery Anodes', Advanced 
+Energy Materials ,1(6), 1154–1161, (Nov, 2011). 
+ 
+4. Fethullah Güneş, Gang Hee Han, Hyeon-Jin Shin, Si Young Lee, Meihua Jin, Dinh 
+Loc Duong, Seung Jin Chae, Eun Sung Kim, Fei Yao, Anass Benayad, Jae-Young Choi 
+and Young Hee Lee, ‘UV Light-Assisted Oxidative Sp3-Hybridization of Graphene’, 
+NANO, 6 (5),409–418, (May 26, 2011). 
+ 
+3. Fei Yao, Dinh Loc Duong, Seong Chu Lim, Seung Bum Yang, Ha Ryong Hwang, 
+Woo Jong Yu, Il Ha Lee, Fethullah Gunes, and Young Hee Lee, 'Humidity-assisted 
+selective reactivity between NO2 and SO2 gas on carbon nanotubes', J. Mat. Chem., 
+21(12), 4502-4508, (Mar. 28, 2011).  
+ 
+2. Il Ha Lee, Un Jeong Kim, Hyung Bin Son, Seon-Mi Yoon, Fei Yao, Woo Jong Yu, 
+Dinh Loc Duong, Jae-Young Choi, Jong Min Kim, Eun Hong Lee and Young Hee Lee, 
+'Hygroscopic Effects on AuCl3-Doped Carbon Nanotubes', Journal of Physical 
+Chemistry C, 114(26), 11618-11622 ,(Jun. 10. 2010). 
+ 
+1. Fei Yao, Seong Chu Lim, Woo Jong Yu, Il Ha Lee, Fethullah Gunes, Ha Ryong 
+Hwang, Seung Bum Yang, Kang Pyo So, Gang Hee Han, and Young Hee Lee, 'AC 
+Response to Gas Exposure in Vertically Aligned Multiwalled Carbon Nanotube 
+Electrode', J. Phys. Chem. C, 114(8), 3659-3663, (Feb. 5, 2010). 
+ 
+ 
+PATENTS (Korea) 
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 
+ 
+152 
+ 
+Large Area Graphene as a Protecting Layer for Metal Corrosion, submitted. 
+Presentations  
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 
+6. Fei Yao, Bing Li, Kangpyo So, Jian Chang, Vu Quoc An, Didier Pribat, Costel Sorin 
+Cojocaru, Hongyan Yue, Sishen Xie, Young Hee Lee1, 'Silicon-Coated Carbon 
+Nanofiber Mat for Anode of Lithium Ion Battery', Imaginenano 2013, Bilbao, Spain, 
+April 23~26, 2013, oral. 
+ 
+5. Fei Yao, Fethullah Gunes, Ta Quang Huy, Seung Mi Lee, Seung Jin Chae, Kyeu Yoon 
+Sheem, Costel Sorin Cojocaru, Si Shen Xie, Young Hee Lee, 'Lithium Ion Diffusion 
+Through Basal Plane of Layered Graphene Synthesized by Chemical Vapor Deposition', 
+16th International Meeting on Lithium Batteries (New Era for Smart Energy Storage) 
+(IMLB 2012), ICC Jeju, Korea, June 17~22, 2012, p.104. 
+ 
+4. Fei Yao, Hung Tran Nguyen, Kang Pyo So, Chandan Biswas, Giduk Kwon, Si Thanh 
+Pham, Zamfir Mihai Robert, Young Hee Lee and Didier Pribat, 'Carbon Nanofiber/Si 
+Nanowire As an Anode Material for Li-Ion Battery', 1st Korean-French Seminar On 
+Nanomaterials for Energy, Sungkyunkwan University, Mar. 6-8,2011, p.50 
+ 
+3. Fei Yao, Hung Tran Nguyen, Kang Pyo So, Chandan Biswas, Giduk Kwon, Si Thanh 
+Pham, Zamfir Mihai Robert, Young Hee Lee, Didier Pribat, 'Carbon Nanofiber/Si 
+Nanowire as An Anode Material for Li-Ion Battery', A3 Symposium on Emerging 
+Materials: Nanocarbons and Nanowires for Energy, Core-Riviera Hotel, Jeonju, Nov. 7-
+11. 2010, p.61 
+ 
+2. Fei Yao, Duong Dinh Loc, Seong Chu Lim, Seung Bum Yang, Ha Ryong Hwang, 
+Woo Jong Yu, Fethullah Gunes, Young Hee Lee, 'Humidity-assisted selective reactivity 
+between NO2 and SO2 gas on carbon nanotubes', NT10(11th International Conference 
+on the Science and Application of Nanotubes 2010), Hilton Bonaventure Montreal, 
+Quebec, Canada, Jun 27-Jul 2. 2010, p.96 
+ 
+1. Fei Yao, Seong Chu Lim, Woo Jong Yu, Fethullah Gunes and Young Hee Lee 
+'Capacitive Gas Sensor of Vertically Aligned Carbon Nanotubes', International Green 
+Energy Nanocarbon Conference 2009,Jeollabuk-do provincial office, Jeonju, Korea, 
+Nov. 3~6. 2009, p.155 
+ 
+ 
+153 
+ 
+ 154 
+ 
diff --git a/examples/theses/HalThesis1.pdf b/examples/theses/HalThesis1.pdf
new file mode 100644
index 00000000..d8672ac7
Binary files /dev/null and b/examples/theses/HalThesis1.pdf differ
diff --git a/examples/theses/HalThesis1/fulltext.pdf b/examples/theses/HalThesis1/fulltext.pdf
new file mode 100644
index 00000000..d8672ac7
Binary files /dev/null and b/examples/theses/HalThesis1/fulltext.pdf differ
diff --git a/examples/theses/HalThesis2.pdf b/examples/theses/HalThesis2.pdf
new file mode 100644
index 00000000..a052067a
Binary files /dev/null and b/examples/theses/HalThesis2.pdf differ
diff --git a/examples/theses/HalThesis2/fulltext.pdf b/examples/theses/HalThesis2/fulltext.pdf
new file mode 100644
index 00000000..a052067a
Binary files /dev/null and b/examples/theses/HalThesis2/fulltext.pdf differ
diff --git a/examples/theses/HalThesis2/fulltext.pdf.txt b/examples/theses/HalThesis2/fulltext.pdf.txt
new file mode 100644
index 00000000..cad8e6ab
--- /dev/null
+++ b/examples/theses/HalThesis2/fulltext.pdf.txt
@@ -0,0 +1,3548 @@
+Development of higher efficiency photocathodes for gas
+filled detectors
+Guillaume Potdevin
+To cite this version:
+Guillaume Potdevin. Development of higher efficiency photocathodes for gas filled detectors.
+Physics. Université Joseph-Fourier - Grenoble I, 2008. English. <tel-00275299>
+HAL Id: tel-00275299
+https://tel.archives-ouvertes.fr/tel-00275299
+Submitted on 23 Apr 2008
+HAL is a multi-disciplinary open access archive for the deposit and dissemination of
+scientific research documents, whether they are published or not. The documents may come
+from teaching and research institutions in France or abroad, or from public or private research centers.
+L’archive ouverte pluridisciplinaire HAL, est destinée au dépôt et à la diffusion de documents
+scientifiques de niveau recherche, publiés ou non, émanant des établissements d’enseignement et de
+recherche français ou étrangers, des laboratoires publics ou privés.
+THÈSE
+pour obtenir le titre de
+Docteur de l’Université Joseph Fourier
+Discipline :
+Physique
+présentée et soutenue publiquement par
+Guillaume POTDEVIN
+Sujet de thèse :
+Development of higher efficiency photocathodes for gas filled
+detectors
+Soutenance le 29 Janvier 2008 devant le jury composé de :
+François Montanet LPSC, CNRS, Grenoble Représentant de l’université
+Imad Laktineh IPNL, CNRS, Lyon Rapporteur
+Ralf Menk Elettra, Trieste Rapporteur
+Johann Collot LPSC, CNRS, Grenoble Directeur Académique
+Menhard Kocsis ESRF, Grenoble Superviseur à l’ESRF
+2
+Contents
+1 Introduction 1
+1.1 Why Detectors ? . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 1
+1.1.1 A small history of X-ray sources . . . . . . . . . . . . . . . . . . . . . . . . . . 2
+1.1.2 A new Science is born: Photon Science . . . . . . . . . . . . . . . . . . . . . . . 4
+1.1.3 A typical experimental setup . . . . . . . . . . . . . . . . . . . . . . . . . . . . 6
+1.1.4 The place of the detector in the chain . . . . . . . . . . . . . . . . . . . . . . . 9
+1.2 Detectors in the hard X-ray energy range . . . . . . . . . . . . . . . . . . . . . . . . . 10
+1.2.1 What are the detector main characteristics? . . . . . . . . . . . . . . . . . . . . 10
+1.2.2 The Detective Quantum Efficiency . . . . . . . . . . . . . . . . . . . . . . . . . 11
+1.2.2.1 The DQE dependence on the Quantum Efficiency. . . . . . . . . . . . 12
+1.2.2.2 The dependence of the DQE on the spatial resolution . . . . . . . . . 13
+1.2.3 The mode of operation, speed and behavior of one detector at large intensities 15
+1.3 Spectroscopy detectors . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 18
+1.4 Imaging detectors . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 21
+1.4.1 current mature technologies . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 21
+1.4.2 technologies under developments . . . . . . . . . . . . . . . . . . . . . . . . . . 23
+1.4.2.1 Spectroscopy Detectors under development . . . . . . . . . . . . . . . 23
+1.4.2.2 Imaging Detectors under development . . . . . . . . . . . . . . . . . . 23
+2 The basics of gas-filled detectors 29
+2.1 historical background . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 29
+2.2 Principle of gas-filled detectors . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 30
+2.2.1 The X-ray absorption in the gas . . . . . . . . . . . . . . . . . . . . . . . . . . 30
+2.2.2 The amplification and the modes of operation of gas-filled detectors . . . . . . 31
+2.2.3 The benefits of gas-filled detectors . . . . . . . . . . . . . . . . . . . . . . . . . 33
+2.2.4 The limitations of gas-filled detectors . . . . . . . . . . . . . . . . . . . . . . . . 33
+2.3 Recent Evolutions of gas-filled detectors . . . . . . . . . . . . . . . . . . . . . . . . . . 35
+ii CONTENTS
+2.4 Gas amplification compared to Microchannel plates . . . . . . . . . . . . . . . . . . . . 37
+2.5 A promising approach to overcome Gas-filled detectors limitations . . . . . . . . . . . 38
+3 Photocathode for gas-filled detectors 41
+3.1 Basics of Photocathodes . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 41
+3.2 Improved Models of Photocathodes . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 45
+3.3 Major technologies of photocathodes currently available . . . . . . . . . . . . . . . . . 45
+3.3.1 Metallic Photocathode . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 46
+3.3.2 Semiconducting Photocathode . . . . . . . . . . . . . . . . . . . . . . . . . . . 46
+3.3.3 Organic Photocathode . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 47
+3.3.4 CsI . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 47
+3.3.5 Conclusions on available technologies of Photocathodes and the issues related
+to their use . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 48
+4 The Simulations by Monte Carlo Method 55
+4.1 A first approach to Monte Carlo . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 55
+4.1.1 History . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 55
+4.1.2 Description of the Monte Carlo Method . . . . . . . . . . . . . . . . . . . . . . 56
+4.1.3 The Monte Carlo Method in Particle Transport . . . . . . . . . . . . . . . . . . 57
+4.2 The Geant4 toolkit for particle transport into matter . . . . . . . . . . . . . . . . . . . 57
+4.2.1 The way Geant4 computes particle propagation . . . . . . . . . . . . . . . . . . 58
+4.2.1.1 The tracking of the particles . . . . . . . . . . . . . . . . . . . . . . . 58
+4.2.1.2 The physical interactions in Geant4 . . . . . . . . . . . . . . . . . . . 61
+4.2.1.3 Analysis and Representation tools . . . . . . . . . . . . . . . . . . . . 62
+4.2.2 The simulation tool developed . . . . . . . . . . . . . . . . . . . . . . . . . . . 62
+4.2.2.1 Description and Functionalities . . . . . . . . . . . . . . . . . . . . . . 62
+4.2.2.2 The test of the code, comparison with experimental values . . . . . . 64
+4.2.2.3 The limits of the Monte Carlo Method . . . . . . . . . . . . . . . . . 66
+4.3 The simulation performed . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 67
+4.3.1 The simulations performed . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 67
+4.3.2 Use of the simulations for thickness optimization . . . . . . . . . . . . . . . . . 70
+4.3.3 Simulation of the impact of structures on the photocathode . . . . . . . . . . . 71
+4.4 Conclusion on this part of the work . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 71
+5 Experimental Setup and Sample Preparation 77
+5.1 Design of the measurement setup . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 77
+5.1.1 A few general considerations . . . . . . . . . . . . . . . . . . . . . . . . . . . . 77
+5.1.2 The chamber and the ammeter . . . . . . . . . . . . . . . . . . . . . . . . . . . 78
+5.1.2.1 The Photocathode holder, the electrical shielding . . . . . . . . . . . 78
+5.1.2.2 The Chamber . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 80
+5.1.2.3 The Keithley 6430 ammeter . . . . . . . . . . . . . . . . . . . . . . . 81
+CONTENTS iii
+5.1.3 Results of calibration and test of the chamber . . . . . . . . . . . . . . . . . . . 81
+5.1.4 Conclusion concerning the setup . . . . . . . . . . . . . . . . . . . . . . . . . . 83
+6 The different concepts to make a photocathode 87
+6.1 Indirect conversion . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 87
+6.1.1 Photocathodes in visible and UV . . . . . . . . . . . . . . . . . . . . . . . . . . 88
+6.1.2 Scintillation materials . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 89
+6.1.3 Possible combinations . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 90
+6.1.4 Conclusion . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 91
+6.2 Direct conversion . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 92
+6.2.1 Modify the geometry to increase the yield of one material . . . . . . . . . . . . 92
+6.2.1.1 Porous Photocathodes . . . . . . . . . . . . . . . . . . . . . . . . . . . 93
+6.2.1.2 Regular Structures . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 93
+6.2.2 Field emission . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 97
+6.2.3 A new material: CsI3 . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 98
+7 Experimental tests and discussion of the results 101
+7.1 Modify the geometry to increase the yield of a material . . . . . . . . . . . . . . . . . 101
+7.1.1 Analysis of the microstructures characteristics . . . . . . . . . . . . . . . . . . . 102
+7.1.2 Efficiency measurements . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 103
+7.2 Field Emission . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 103
+7.2.1 Analysis of the microstructure characteristics . . . . . . . . . . . . . . . . . . . 103
+7.2.2 Efficiency Measurements . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 104
+7.3 CsI3 as a new photocathodes material . . . . . . . . . . . . . . . . . . . . . . . . . . . 104
+7.3.0.1 Physical and chemical characteristics . . . . . . . . . . . . . . . . . . 104
+7.3.1 The CsI3 samples . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 105
+7.3.1.1 Preparation of the different samples . . . . . . . . . . . . . . . . . . . 106
+7.3.1.2 Analysis of the microstructures of the samples and their evolution . . 107
+7.3.2 CsI3 quantum efficiency and comparison with CsI. . . . . . . . . . . . . . . . . 110
+7.3.2.1 The quantum efficiency of CsI and its evolution in air . . . . . . . . . 110
+7.3.2.2 The quantum efficiency of CsI3, its evolution in air and comparison
+with CsI. . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 112
+7.3.3 Analysis of the results obtained with CsI3 . . . . . . . . . . . . . . . . . . . . . 118
+7.3.4 Conclusion on the use of CsI3 as a photocathode . . . . . . . . . . . . . . . . . 120
+8 Conclusion 123
+A Detector characteristics 125
+A.1 Position resolution in the case of gas-filled detectors . . . . . . . . . . . . . . . . . . . 125
+A.2 Energy Resolution . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 125
+A.3 Space Charging in gas-filled detectors . . . . . . . . . . . . . . . . . . . . . . . . . . . 126
+iv CONTENTS
+Annexes 125
+B Monte Carlo Application Examples 129
+B.1 Simple Examples of statistical sampling methods . . . . . . . . . . . . . . . . . . . . . 129
+B.1.1 Calculus of an integral . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 129
+B.1.2 An historical example: Buffon’s needles . . . . . . . . . . . . . . . . . . . . . . 130
+Chapter 1
+Introduction
+1.1 Why Detectors ?
+Probably the first human being already was driven by a strong sense of curiosity, as it is one of the
+deepest laws of human nature. This force has pushed mankind to develop more and more powerful
+investigation tools to help it understand its environment. Outstanding examples in the past are the
+telescope used by Galileo to make the first observation of Jupiter’s satellites, or Van Leeuwenhoek’s
+microscope, which enabled the discovery of microscopic animals... In this frame, X-rays are nothing
+but an extension to humans’ capabilities to explore the world, and X-ray detectors are their eyes,
+adapted for such investigations.
+This work is intended to contribute to the development of modern tools for matter studies. It is part
+of a more global program to provide modern light sources with reliable and efficient detectors, able
+to answer the growing needs of the scientific community in this domain.
+2 Introduction
+1.1.1 A small history of X-ray sources
+Figure 1.1 : Conrad Wilhelm RÖNTGEN (March
+27, 1845 - February 10, 1923), German physicist. Figure 1.2 : Brilliance of various light sources.
+The brilliance is a measure of the quality of a
+light source.
+Since their first identification by Wilhelm Röntgen in the late 19th century (for which he was awarded
+the first Nobel Prize for Physics in 1901), X-rays have been at the origin of several revolutions in
+numerous fields of research.
+This broadening of the usefulness of X-rays is mainly due to the fantastic development of X-ray
+sources. The following lines give a short history of those sources.
+Discharge tubes or Crookes tube
+William Crookes, an English physicist, is the inventor of the first artificial source of X-rays: while he
+was studying the effects of electric currents in gas at low pressure, he used glass vacuum cylinders,
+containing electrodes for discharges of a high voltage electric current1. He noticed that unexposed
+photographic plates were shadowed when brought close to those tubes, even though he did not
+identify this to be caused by a particular sort of radiation.
+Fernando Sanford later bettered this principle of emissions and published in 1893 in the Journal
+Physical Review an article entitled Observed tubes with energy rays extending from a negative electrode.
+It is interesting to note that even after deeper studies by Heinrich Hertz of those specific radiations,
+they were not identified as a new sort of radiation. Only the work of Wilhelm Röntgen with vacuum
+tubes made it possible to actually identify X-rays as a new kind of ray.
+Those tubes are actually the ancestors of modern X-ray tubes, which are the result of a technological
+1this sort of tube had already been used by the physicist Johann Hittorf who observed tubes with energy rays
+extending from a negative electrode.
+1.1 Why Detectors ? 3
+improvement of the original Crookes tube.
+Synchrotron radiation sources
+Figure 1.3 : The General electric particle accelerator, at the origin of the discovery of synchrotron radiations.
+The arrow indicates the trace of the synchrotron radiation beam on the picture. It is the first observation of
+synchrotron radiations.
+The history of synchrotron radiations is closely related to that of particle physics. First considered
+as a nuisance sapping the energy of the particles, it was later recognized as a powerful tool to study
+matter. One usually distinguishes three major steps on the way to modern light sources:
+First Generation Sources were mainly synchrotrons built for the study of particle physics (High
+Energy Physics HEP), which were refurbished as light sources, as the frontiers of HEP were
+pushed forward. This way, it is often said that the use of those synchrotrons as light sources
+was a sort of parasitic operation of the synchrotrons. A big step occurred in the 50’s as
+the first electron storage rings were built, providing a much more stable, fixed energy, and
+continuous beam of particles (and thus photon beam). Those machines have been the models
+for all synchrotron light sources until now.
+Second Generation Sources were the first machines dedicated for light emission. They were the
+first machines able to operate a large number of beamlines, with optimized emittance parameters
+(quality of the beam), stable energy and beam position. The development of those machines
+4 Introduction
+was associated to important developments in optics and gave birth to new types of experiments
+such as EXAFS or large protein crystallography.
+Third Generation Sources are storage rings optimized to have numerous long straight sections,
+in which undulators and wigglers can be placed, thus providing a much higher brightness and
+flux of photon beams. This is the birth of large facilities (800 to 1400m) offering several tens
+of beamlines, typically welcoming several thousands of users every year.
+The future of light sources will probably see a parallel development of the third generation light
+sources, which keep bettering in terms of performance, and the birth of the fourth generation sources,
+also called Free electron lasers (FEL). FEL will be able to offer peak of brightness of several
+order of magnitude higher than third generation sources, as well as pulses as short as 100 fs and
+highly coherent. FELs will be constituted of very long undulators in high-energy linear accelerators.
+Those devices will offer a new range of possibility of investigation of matter, but will not directly
+compete with third generation sources as they will not be able to offer the many beamlines that
+storage rings have.
+Indeed, several projects of third and fourth generation sources have been launched recently or are
+even in their commissioning phase (the synchrotrons Diamond and Soleil in Oxford and Paris, the
+European X-FEL in Hamburg...). Yet it is unlikely that all those sources will be able to answer the
+growing demand for high brightness sources.
+1.1.2 A new Science is born: Photon Science
+Figure 1.4 : The ESRF seen from top. The ESRF is one of the modern lightsources able to provide high
+brightness photon beams.©P.Ginter/ESRF.
+Photon Sciences encompass all the techniques using high brilliance photon beams, such as those pro-
+duced in Synchrotron Radiation Facilities, and Free Electron Lasers. Those sophisticated and perma-
+nently evolving machines enable the production of highly intense beams of photons. The brilliance
+(which measures the quality of the beam) is now more than 10 orders of magnitudes higher than that
+of conventional sources (see Figure 1.2).
+1.1 Why Detectors ? 5
+Among those new generation sources, a majority of them are dedicated to the production of X-rays,
+and to the development of techniques making use of them.
+Since their first direct application (photography of Wilhelm Röntgen’s wife’s hand), X-rays have
+become the base of applications as various as:
+Medical imaging and treatment: radiography techniques, scanners, cancer treatments, computer to-
+mography, are just some of the numerous applications of X-rays in medicine.
+Now modern sources have pushed the development of new techniques, like: high-resolution
+3D tomography imaging techniques, therapeutic treatments, drugs research,
+Physics: Numerous physical characterization techniques are based on X-rays. If historically X-rays
+first enabled the study of crystals by mean of the crystallography, they are now routinely
+used to study soft matter (diffuse scattering), the chemical composition of elements (spec-
+troscopy), magnetic structures (magnetic scattering-magnetic dichroism), the surface and
+interface properties of various materials (small angle scattering) etc...
+Biology. Biology has always benefited from the development of physics techniques for its development
+(the structure of DNA was discovered thanks to the X-ray diffraction technique). Now a
+wide range of techniques is specifically devoted to biological applications: macromolecular
+crystallography has become a science on its own, and more and more techniques benefit
+from developments specific to biological applications.
+Archeology and art. Archeological and artistic pieces are by definition unique and fragile. Since most
+X-ray based techniques are non destructive, they are of prime interest to learn more on
+those precious ”samples”.
+Figure 1.5 : Toumai’s skull, as obtained thanks to a tomographic technique.
+Figure 1.6 : Example of a protein structure resolved by diffraction technique.
+For example it is now possible to know with a precision better than one Angstrom, the position of
+each atoms in biological macromolecules (typically several thousands of amino acids). One can find
+in all kind of samples the rarest traces of impurities, and get extremely useful information on the
+history of the sample, or on its composition. It is possible to reconstruct in 3 dimensions the structure
+of various samples with a precision of the order of a few microns, to determine the inner structure of
+micro-objects, and directly study the properties of nanometer size objects...
+6 Introduction
+Another big advantage is the fact that those analysis are mostly non destructive.
+→ It is possible to study unique samples, like archeological objects or space objects (brought
+back by various space missions or even by the fall of asteroids)
+→ It is possible to follow in situ complex process like chemical or biological reactions with a time
+resolution of the picosecond or even less.
+→ It enables eventually to repeat the experiment, which is not always easy to do when the sample
+itself is hard to make.
+→ It is possible to combine different techniques on the same sample.
+As a result, there are more and more ”photon factories” in the world to answer the growing need
+of scientists for those techniques of analysis. Experiments, which were just impossible to do even
+20 years ago are now routinely achieved in synchrotrons and have become the standard in a lot
+of fields. The area of interest for synchrotrons and the future X-FELs also keeps growing as new
+applications (such as medical applications, nano-analysis) arise and revolutionize the possibilities in
+their respective fields.
+In the future, it is likely that the demand for high quality sources will keep growing, especially with
+the arrival of more and more hybrid techniques, combining various apparatus like electron imaging
+combined with magnetic dichroism imaging or atomic force microscopes combined with nano-focused
+photon beams, LEED analysis and photoemission spectroscopy...
+1.1.3 A typical experimental setup
+An experiment using high quality sources involves a lot of elements, each being highly optimized.
+A typical beamline (where the photon beams is shaped and positioned, and where experiments are
+carried out ) is almost always composed of four main parts (see fig. 1.7):
+• A source
+• An optics hutch,
+• An experimental hutch,
+• A control hutch.
+The source is composed of the particles circulating in the storage ring. Charged particles like
+electrons or positrons used in synchrotrons emit light when subjected to acceleration. Because those
+particles have a very high energy (several GeV), the emitted light is tangential to their direction of
+motion. This results in a very concentrated beam with a low divergence, and high flux.
+1.1 Why Detectors ? 7
+Figure 1.7 : Schematic of a typical beamline. After the beam was produced in the storage ring, it
+enters the optic cabin and then the experimental cabin where it hits the sample. All elements are
+remotely controlled from the control cabin.
+Figure 1.8 : Picture of a (blue) bending magnet. The bending magnets are one type of source
+of photon beam in synchrotron radiation facilities. ©P.Ginter/ESRF
+The storage ring in reality is a large polygon. At each of its angles one can find bending magnets,
+which produce an intense magnetic field, where the particles trajectory is bent. This is also the place
+where light is produced. Beamlines find their origins in those bending magnets.
+In addition, elements called insertion devices are specifically made to produce a very large flux (see
+picture 1.10 for the example of an undulator). Those elements consist of straight sections in which an
+alternative magnetic field is applied on the pathway of particles (with a small period and permanent
+magnet they are called undulators, and with long period electromagnets, they are called wigglers).
+In those elements the particles follow a zigzag trajectory. The quantity of light obtained is largely
+increased, as each turn adds light to that of the previous one, and because the emitted light is all
+emitted in the direction of the straight section and not spread all along a large curve, like in bending
+magnets.
+In the case of undulators (small period) the light emitted by the device is coherent enough (spatially
+and temporally) to create a phenomenon of interference. This results in the concentration of the
+emitted energies at a fundamental frequency and a few harmonics. The Figure 1.9 gives the respective
+spectrums of a bending magnet, a wiggler and an undulator. One can clearly see the gain in terms
+of flux and monochromaticity (in particular when comparing undulators to bending magnets).
+8 Introduction
+Figure 1.9 : Emission Spectrum of a bending magnet, a wiggler, and an undulator
+Figure 1.10 : Photo of an Undulator. Undulators are the brightest sources of photon beams in
+synchrotron radiation facilities. ©P.Ginter/ESRF
+The optics hutch contains the elements, which shape the beam: it usually contains several elements
+such as:
+→ a shutter, which controls the entrance of the beam in the hutch (this is a crucial element for
+the safety of persons).
+→ slits. They give its shape to the spot, by removing the non-focused part of the beam (especially
+in the case of the bending magnets),
+→ monochromator. It selects very precisely the energy (selects the good wavelengths from the
+white beam),
+→ focusing mirrors and/or lenses. They concentrate the beam to a spot, which can be as small
+as a few microns or even less. Alternatively, they can be used to make a very wide and
+homogeneous beam (ex. case of medical tomography).
+The experimental hutch provides all the sample environment and detection systems needed to
+carry out the experiments.
+• The sample Environment is made of elements, which control the conditions of the experiment:
+vacuum chambers and high pressure gaskets, sample heaters and cryogenic coolers, gas flows
+and electrochemistry cells are some examples of systems mandatory to make several sorts of
+experiments.
+• The detector. The detector is in charge of collecting the information provided by the interaction
+of the beam with the sample. It will be further detailed in the next section.
+1.1 Why Detectors ? 9
+Figure 1.11 : An example of experimental setup, illustrating the complexity of experimental
+setup to provide the right sample environment. ©P.Ginter/ESRF
+Figure 1.12 : A beamline seen from the top. The storage beam is hidden behind the concrete blocks on
+the left side of the picture. Photons enter the beamline at the top of the photo. ©P.Ginter/ESRF
+1.1.4 The place of the detector in the chain
+The detector occupies a central place in the experimental setup, in that it collects the photons
+scattered after the beam/sample interaction. So the detector is a main source of information in any
+photon science experiment.
+So far, lots of efforts have been put in the production of high quality beams in terms of stability,
+monochromaticity... The fantastic progress in this field is highlighted by the exponential rise of the
+brilliance of the light sources during the last few decades (see Figure 1.2).
+After those great achievements in brilliance, now comes the time to harvest this huge amount of
+scattered photons with detectors. Indeed, in a lot of experiments, the main limiting factor is
+the detector itself. The ESRF long-term strategy, which defines the future developments at ESRF,
+states that ”detectors are generally recognized as the weak link in the modern use of SR”[1].
+Detectors used in the experiments usually suffer from:
+• Low efficiency (only a very small fraction of the monitored particle are actually detected, so the
+radiation dose received by the sample has to be increased)
+• limited speed (fast reactions cannot be recorded. This also increases the dose received by the
+sample)
+• limited size (lowers the speed of the experiments forcing to make several acquisition.)
+• limited dynamic range (a problem for techniques giving a high contrast, like small angle diffusion
+scattering analysis).
+Now more emphasis is put on instrumentation in the beamlines. Most large facilities have specific
+programs for the development of new generation detectors. To answer the high cost associated to
+these developments, collaborations among several institutes are created.
+Already, various development projects have started to provide the beamlines with detectors, which
+would suit the current requirements of experiments carried out in modern lightsources.
+10 Introduction
+In particular, this thesis is part of a project to develop a new generation of gas-filled
+detectors with a high dynamic, large area, good efficiency and good robustness.
+This thesis explores the possibility to use a photocathode as a first step photons → electrons
+converter to ensure a good efficiency and spatial resolution of the detector.
+1.2 Detectors in the hard X-ray energy range
+A short introduction to the most common technologies of detectors used in the synchrotron radiation
+community can be found in the well-known orange X-ray data booklet [2]. For each technology an
+extensive description can be found in G. F. Knoll’s Radiation Detection and Measurement [3].
+It should be noted that in what follows only detectors technologies designed for X-rays are described.
+Yet, most of those detectors can also be used with other sort of particles/radiations.
+1.2.1 What are the detector main characteristics?
+Basically, a detector provides information about the:
+• position
+• time
+• eventually energy and direction
+• intensity
+of an incoming particle/photon beam.
+The measurement of one physical quantity is never perfect, but suffers from several imprecision and
+uncertainties. Those uncertainties have several origins:
+• The measured signal itself suffers from statistical fluctuations. Those intrinsic fluctuations
+cannot be avoided, but several measurements of the same quantity enable to determine the
+distribution function of the physical quantity. Statistical models then enable to determine more
+accurately the physical quantity, and also to calculate the statistical error of the measurement.
+• In addition to the intrinsic fluctuations of the measured physical quantity, the detector suffers
+from a limited precision in measuring it. The characteristics of one detector give information
+on the accuracy of one measurement, and on the error of measurement.
+• The signal is never recorded alone, but several fake events appear with the measurement and
+tend to blur/hide the physical quantity measured. This contribution is often called background,
+and finds its origin both in the detector imperfectness, and in the environment of the detector,
+which can be source of such unwanted contributions to the signal.
+The last two contributions (fluctuation and background) are usually referred to as Noise. The noise
+can be analyzed in terms of power, spectrum, as well as uniformity. The quality of one measurement
+is then evaluated thanks to the
+$$\text{Signal to Noise ratio} = \frac{\mathrm{Power}_{signal}}{\mathrm{Power}_{noise}} = \left(\frac{A_{signal}}{A_{noise}}\right)^{2}, \qquad (1.1)$$
+1.2 Detectors in the hard X-ray energy range 11
+where A is the RMS2 amplitude of the signal.
+The detector characteristics give information about:
+• The quality of the measurement performed by the detector. This comprises among other aspects:
+the resolutions in energy and position, the contrast the detector offers, and the noise it adds to
+the signal.
+• The speed of the detector: the minimum amount of time between successive measurement (dead
+time) and the maximum intensity it can measure.
+• The geometrical information about the detector: mainly its active surface. Also the volume of
+the detector can be of importance in crowded spaces.
+1.2.2 The Detective Quantum Efficiency
+Figure 1.13 : Illustration of the effect of the noise and contrast on the quality of one image.
+The detective quantum efficiency (DQE) characterizes the measurement uncertainty introduced by a
+detector.
+It is now recognized as the best figure of merit of a detector. It provides extensive information about
+the capabilities of a 1D or 2D detector to return sharp and noiseless images. So it
+expresses the ability of one detector to sense a signal against a background of radiation, and without
+deteriorating the intrinsic noise of the incident beam.
+The Detective Quantum Efficiency (sometimes spelled Detection Quantum Efficiency), is defined as
+$$\mathrm{DQE} = \frac{\mathrm{SNR}_{out}^{2}}{\mathrm{SNR}_{in}^{2}}, \qquad (1.2)$$
+with SNRout and SNRin being the signal-to-noise ratios at output and input of the detector, respectively.
+2 Root of mean square: the quadratic mean of the signal, $\sqrt{\langle x^{2} \rangle}$.
+12 Introduction
+It differs from the quantum efficiency QE in the sense that it takes into account, not only the fraction
+of the photons, which are actually recorded, but also all the system losses due to the limited resolution,
+noise performance... of one real detector.
+SNRin can be seen as the best achievable detector performance, and in this sense, 0 < DQE < 1.
+The DQE is function of several parameters[4, 5, 6]:
+• The Quantum Efficiency,
+• The spatial frequency,
+• The particle energy,
+• The signal intensity.
+It is often used as a Figure of Merit of the detector, but it strongly varies with the conditions of
+acquisition of the data, and as the available data are often incomplete, its utility is still limited. A
+lot of discussions are still ongoing to define standard conditions of measurement of the DQE of one
+detector.
+Yet some methods are now recognized as standard for the evaluation of detectors DQE. Practical
+methods of evaluation of the DQE and associated parameters, and more globally of the performance
+of one detector can be found in references [6, 7, 8].
+In the following section, some of the most important characteristics of imaging detectors are shown,
+through their impact on the DQE. Yet, the DQE is rarely fully measured and in most cases, only
+those characteristics of the detectors which have been measured are available.
+1.2.2.1 The DQE dependence on the Quantum Efficiency.
+The Quantum Efficiency QE, in its most fundamental definition is the fraction of the incident quanta,
+which participate in the signal formation. So it is evident that the QE is a limiting factor to the DQE
+of one detector.
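+Indeed, if we go back to the definition of the DQE, $\mathrm{DQE} = \mathrm{SNR}_{out}^{2}/\mathrm{SNR}_{in}^{2}$ (eq. 1.2), by writing $\mathrm{SNR}_x = S_x/\sigma_x$ we
+obtain $\frac{S_{out}}{\sigma_{out}} = \sqrt{\mathrm{DQE}}\,\frac{S_{in}}{\sigma_{in}}$ and $\frac{S_{out}}{S_{in}} = \sqrt{\mathrm{DQE}}\,\frac{\sigma_{out}}{\sigma_{in}}$. For $\sigma_{out} \geq \sigma_{in}$, and $\frac{S_{out}}{S_{in}} = \mathrm{QE}$ the Quantum
+Efficiency, we have
+$$\mathrm{DQE} \leq \mathrm{QE}. \qquad (1.3)$$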
+The quantum efficiency QE acts as an absolute limit to the detective quantum efficiency DQE of the
+detector. In particular, a perfect detector (with no intrinsic noise: σout = σin, infinite resolution...)
+has a DQE = QE. For a real system, the DQE is equal to the QE of a perfect detector, which
+would give the same image statistics for the same input flux [7].
+In conclusion, for an imaging detector, the DQE is best with:
+• small detector noise σdno,
+• high quantum efficiency QE,
+• high input signal Si,
+as expected.
+1.2 Detectors in the hard X-ray energy range 13
+1.2.2.2 The dependence of the DQE on the spatial resolution
+Figure 1.14 : 0.1 mm thick engraved lead line pattern used to test the spatial resolution of detectors
+The properties given in the previous section do not show the influence on the detection efficiency
+of the spatial resolution of the detector. Indeed, it is well known that detectors have a ”limited
+resolution”, meaning they cannot resolve objects smaller than a certain size. This characteristic of
+the detector is also known as the Position Resolution.
+Several mechanisms can decrease the spatial resolution of one detector
+The Position Resolution of one detector
+In a position sensitive detector, there is a shift between the incoming position and the detected one
+of a particle. This is due to pixel size, as well as by charge spread and parallax errors. The spatial
+resolution gives information on the accuracy of the position given by the detector.
+It is best measured with the Modulation Transfer Function (M), which gives the system response to
+a sine-wave spatial-frequency amplitude. In other words, the modulation transfer function gives the
+spatial frequency response of an imaging system or a component.
+the modulation, Mi, of the image divided by the modulation of the stimulus Mo
+M at a certain spatial frequency ν is defined as the ratio of the modulation of the image at output
+and input:
+$$M(\nu) = \frac{\mathrm{Modulation}_{out}}{\mathrm{Modulation}_{in}}$$
+with $\mathrm{Modulation} = \frac{I_{max} - I_{min}}{I_{max} + I_{min}}$, in analogy with Michelson’s definition of visibility of interference
+fringes.
+It enables to evaluate easily the response of a complex system as simple product of the individual
+MTF’s of the components of the system. For example for a classical Fluorescent screen + Optic +
+14 Introduction
+CCD camera, the MTF would be given by:
+M =MFluo.Screen ·MOptic ·MCCD.
+The MTF allows to calculate the output signal, which is basically the input signal multiplied
+by the MTF.
+Contrast Transfer Function
+In practice yet, it is much easier to measure the Contrast Transfer Function (C) defined as the square
+wave spatial frequency response. It is related to M by:
+$$M(N) = \frac{\pi}{4}\left[C(N) + \frac{C(3N)}{3} - \frac{C(5N)}{5} + \frac{C(7N)}{7} - \dots\right] \qquad (1.4)$$
+where N is the signal spatial modulation frequency in ’line pairs’ per unit distance.
+In practice, one uses masks with several patterns of lines (see Figure 1.14) of various spacings and thicknesses to
+evaluate the detector response. The resolution is given by the smallest pattern distinguishable by the
+detector.
+Line spread function
+NB. In the same way one can define the Point spread function.
+This is the response of the system illuminated by a narrow slit (or small point). It is related to M by
+the ’simple’ Fourier Transform:
+$$M(\nu) = \frac{\sum_{k=-\infty}^{+\infty} LSF(k\Delta x)\, e^{-i 2\pi \nu k \Delta x}}{\sum_{k=-\infty}^{+\infty} LSF(k\Delta x)} \qquad (1.5)$$
+So the LSF basically gives the detector response as function of the spatial frequency of the image.
+Here again it is easy to measure experimentally for it is enough to measure the response of a detector
+to a mask.
+In most cases, the LSF (or PSF) can be very well described by a Gaussian. It is then fully described
+by the standard deviation σdet (considering that the gaussian is centered at the point/line entry).
+σdet is often called (a bit abusively) position resolution.
+One can also notice that from the PSF one can determine the output intensity:
+Iout(x, y) = PSF (x, y) ∗ Iin(x, y) (1.6)
+where ∗ is a convolution.
+The dependence of the DQE on the MTF
+The dependency of the output intensity from the spatial frequency (cf. the relation between the
+MTF M and the contrast transfer function) is taken into account in the DQE. This corresponds to
+a dependency of the DQE on the MTF, which fully describes the response of the detector as function
+of the spatial frequency.
+1.2 Detectors in the hard X-ray energy range 15
+To take into account the impact of the noise in the frequency domain, one has to consider the power
+spectrum of this noise, also named Wiener Spectrum3. This notion enables to write, in analogy with
+the definition of the DQE, its dependence on the frequency:
+The dependence of the SNRo from the MTF can be written as [9]:
+$$\mathrm{DQE} = \frac{S_o^{2}\,\mathrm{MTF}^{2} / N_o^{2}}{\mathrm{SNR}_i^{2}} \qquad (1.7)$$
+with N2o being the noise power spectrum, and SNRi the signal to noise ratio at the input ; SNRi
+corresponds to the inherent fluctuation of the signal at the input, and is often considered to follow a
+poisson statistics (like was done in section 1.2.2.1). MTF as well as No are functions of the spatial
+frequency.
+Details on the dependence of the DQE from the MTF and noise are given in [10].
+1.2.3 The mode of operation, speed and behavior of one detector at large inten-
+sities
+Integrating vs. Counting detectors
+There are two modes of operation of detectors, which differ on two approaches to evaluate the intensity
+of the measured signal:
+• Counting detectors, which count the deposited quantas of energy one by one ;
+• Integrating detectors, which accumulate the deposited energy before it is evaluated.
+While counting detectors have been around for a while (for example, the Geiger Muller Counter),
+most of the detectors used nowadays are based on the principle of integration of the signal.
+In an integrating detector, the charge deposited by the particle(s) is accumulated (integrated) over a
+period τ . The measurement of the intensity is obtained from the height of the signal obtained.
+The maximum amount of energy the detector can accumulate before the signal is measured cor-
+responds to the maximum intensity the detector can measure (saturation level). This maximum
+intensity is often limited by physical processes in the detector.
+The frequency at which the image is read gives the frame rate of the detector. In the case of area
+detectors, the frame rate is typically of a few 10 of hertz / cm2.
+In a counting detector, each electrical pulse (corresponding to each particle) will be counted if it
+is above a predefined threshold. The intensity is given by the number of single events, which were
+counted during the period τ .
+The maximum intensity the detector can record is limited by the detector’s maximum count rate,
+which is the maximum number of pulses, which can be recorded. Modern electronics allow count
+rates as high as several megahertz.
+3The power spectrum is the average power of the spectrum of the signal/noise in a unitary bandwidth centered at
+the frequency f.
+16 Introduction
+Figure 1.15 :
+Signal as analyzed by an integrating detector and a counting detector.
+Counting detectors are considered as superior (especially for flat field detectors) because of their very
+low noise (the threshold enables to discriminate real events from noise) and ability to count single
+events. Theoretically those detectors are almost noiseless...
+It is their higher cost (both for development and manufacturing) as well as the limitation of the
+electronics, which have limited their use so far: counting detectors could not answer the needs in
+terms of speed. Recently, the fantastic developments in terms of integration and speed of electronics
+has made it possible to develop fast detectors with high dynamics and low noise. Now counting
+detectors can compete in terms of speed (count rate) with integrating detectors.
+In practice yet, counting detectors are not always better. So, as a compromise, some systems try to
+adapt their modes of operation according to the incident flux, in order to offer the best efficiency
+(DQE -detective quantum efficiency- see 1.2.2) [11].
+Dynamic range
+The dynamic range is the range of intensity the detector can measure: [min Nb Quanta; Max Nb Quanta]. So
+it is the signal to noise ratio, computed from the greatest signal acceptable by the detector:
+$$\mathrm{Dynamic} = \frac{\text{Max Intensity}}{\text{Noise}} \qquad (1.8)$$
+In the case of integrating detectors: the max intensity corresponds to the maximum signal measurable
+1.2 Detectors in the hard X-ray energy range 17
+in each picture, while Noise correspond to the detected intensity in the case of no intensity coming
+on the detector.
+In the case of counting detectors, the dynamic is the maximum count rate over the dark count rate,
+which is the mean frequency of appearance of fake events (count rate recorded at zero intensity).
+Associated to those definitions, there are a few notions of importance to evaluate the performances
+of one detector:
+Differential/Integral Non Linearity
+The differential and integral non linearities (DNL and INL) measure the dependence of the detector
+response as function of the signal intensity. The perfect detector has a constant DNL: $\frac{\partial\,\mathrm{Response}}{\partial\,\mathrm{Intensity}} = \mathrm{const}$
+(and a linear INL: Response ∝ Intensity).
+Deviations are always present but can be corrected (eventually pixel by pixel in the case of position
+sensitive detectors) afterwards.
+The maximum intensity a detector can accept is limited by the so called dead time τ of this detector.
+The dead time measures the minimum time during which a detector cannot record another
+event. Theoretically, the maximum frequency of events the detector can accept is $1/\tau$.
+But there are two behaviors when successive events occur in a time inferior to τ (see Figure 1.16).
+Dead Time Behavior
+The dead time of one detector is the gap of time after one event was recorded when the detector
+is unable to record another event. This minimum time between consecutive events can come from
+limitations in the electronic of the detector, or from by physical processes in the detector itself.
+For the income of photons on the detector is a random process, the probability that real events can
+be lost is non zero. This limitation can be severe in the case of high flux, as a large number of events
+are separated by a gap of time inferior to the dead time of the detector. There are two important
+models for dead time behavior of the detector:
+In the case of a non paralyzable behavior, the detector is able to count a new event immedi-
+ately after the dead time of the first event is finished. In this case at high intensity, the detector
+records events every τ , and a asymptotic saturation of the recorded signal occurs.
+In the case of a paralyzable behavior, if two events occur successively in a time inferior to τ ,
+then the dead time is prolonged of a value τ from the second event. In the case of high intensities,
+the average time between events becomes shorter than τ , and no event can be recorded until
+two successive events have a time separation superior to τ . The saturation appears then as a
+decrease of the recorded signal.
+18 Introduction
+Figure 1.16 : The paralyzable and non paralyzable behaviors of detectors.
+1.3 Spectroscopy detectors
+Spectroscopy detectors focus on high energy resolution. Most often they are position non sensitive
+detectors, even if some of the technologies used for imaging detectors can offer energy resolution. For
+the most important characteristics of spectroscopy detectors are their energy resolution and noise,
+they often come with a complex cooling system, which guarantees a minimum noise.
+There are various types of technologies for spectroscopic detectors, corresponding to various energy
+ranges. In X-ray photon science, the most typical detectors are based on technologies such as:
+• Solid state detectors such as Silicon Drift Detectors, silicon crystals doped with lithium (Si(Li)
+detectors) or high purity germanium (HPGe)
+• Scintillation based detectors with various scintillation materials depending on the energy range.
+Photodiode type detectors
+In general, they consist of a p-n depleted region where electron-hole pairs are created by the incident
+photons. Then a reverse electric field separates the charges, and a fast current pulse is recorded in
+the built-in electronics. They offer a very high speed, and a good energy resolution (only 3.5 eV are
+required for the creation of an electron-hole pair in Si). Unfortunately, the small size of the depletion area
+and the easy recombination of the charge pairs lower the quantum efficiency of the photodiode to a
+very small value.
+PIN photodiodes are an evolution of the photodiodes. They are based on the same principle, except
+1.3 Spectroscopy detectors 19
+that the depletion zone is made much larger with the use of an undoped layer between the N and P
+zones. Still the lack of internal multiplication of the charges makes them unsuitable for low photon
+flux experiments even if they offer a good quantum efficiency at low energies. Several suppliers of
+PIN diodes are now available4.
+Avalanche Photodiodes (APD) are other cousins of the photodiodes: they combine a thick (130 µm)
+low field zone combined on both sides with a thin strong electric field p-n-junction. A precise control
+of the doping levels makes it possible to have a rather large central depletion zone to ensure a good
+quantum efficiency, and side electric fields strong enough to enable an internal multiplication of the
+charges with gain up to $10^4$. Arrays of APDs making relatively basic 2D detectors are now commer-
+cially available (sizes up to 1 or 2 cm$^2$) 5.
+APDs find more and more domains of applications. Unfortunately they cannot be produced in large
+areas (Si based technology).
+Germanium detectors
+Germanium detectors are based on the same principle
+as photodiodes, except that they use germanium instead
+of silicon as semiconductor. This enables the creation
+of very large depletion zones (cm vs.mm) and so bet-
+ters dramatically the efficiency for high energy particles.
+Their higher intrinsic noise makes the use of liquid nitro-
+gen cooling system almost mandatory6.
+Si(Li) detectors
+The introduction of lithium as a dopant is a way to
+create an intrinsic like zone (donors and acceptors ex-
+actly compensate) in the semiconductor. This enables
+the creation of a much larger zone for pair creation,
+thus increasing the quantum efficiency for high energy
+rays7.
+Figure 1.17 : A Photodiode used to monitor
+the beam intensity in its protecting case.
+4Among them, Hamamatsu, Canberra, Eurisys, Centronic, Sintef, Ontrak...
+5again several suppliers: Perkin-Elmer Corporation, Hamamatsu Photonics, Judson technologies. Arrays by Pacific
+Sensor, Perkin-Elmer...
+6Provider of Ge detectors component: Canberra, XIA electronics...
+7company supplying: e2v scientific instruments...
+20 Introduction
+Scintillator detectors
+Figure 1.18 : A Cyberstar scintillator based spectroscopy detector, and its electronics.
+Scintillation materials convert high energy photons (or the energy deposited by other particles) into
+visible, UV or infrared light. The intensity of the light produced is proportional to the energy
+deposited over a wide range of energy (the usual unit is [photons/MeV]), thus enabling a simple
+intensity measurement to determine the energy of the incoming photon. Yet this approach suffers
+some limitations, which limit its use for spectroscopy applications:
+• For the intensity is proportional to the deposited
+energy, it is hard to use a scintillator in the case of
+large numbers of incoming photons.
+• Scintillators providing a good yield, also suffer
+from a long response time, which is another limitation
+to the dynamic range of those detectors.
+Yet, photomultiplier tubes, which provide an excellent efficiency to collect the weak light emitted
+from scintillators, and convert it into an electrical signal, have made this approach a prime choice for
+spectroscopy applications for a number of decades.
+Conclusion
+Current spectroscopic detectors mostly suit the current needs of the scientific community. New
+developments now go in the direction of area detectors, and speed in order to enable new types of
+experiments.
+1.4 Imaging detectors 21
+1.4 Imaging detectors
+Imaging detectors include all line or area detectors. They are used both for imaging applications,
+and to speed up the collection of data (with respect to a dimensionless detector, which would move
+to cover the same area). This goes beyond a simple speed up of the whole experiment, for a lot of
+samples, and in particular biological samples, suffer from long exposure into the beam. So imaging
+detectors can be an absolute necessity in certain fields in order to guarantee a good quality of data.
+Imaging Detectors are the kind of detectors which need most of the developments in order to satisfy
+the requirements of the experiments that scientists want to carry out nowadays.
+1.4.1 current mature technologies
+CCD based detectors
+CCD detectors typically consist of a 2-dimensional array of silicon wells of a few tens of µm, which
+store the charges created by light absorption. After this charge was accumulated, it is read out
+sequentially with use of an integrated amplifier. They exhibit a very wide spectral sensitivity with
+attractive quantum efficiency characteristics, but also present a large noise background. They are
+typically used in photo-cameras, video-cameras, scanners, and other massively produced devices. As
+such they are rather inexpensive, except in the case of very fast and large area components.
+When used with hard X-rays, they are usually coupled with a fluorescent screen, which converts
+X-rays into visible light. An optical system (based on common optics elements or on optical fibers)
+is often used to reduce the fluorescent screen size to that of the actual CCD system.
+CCD systems8 are nowadays one of the best ways to achieve both large areas (possibly by coupling
+several systems) and a high speed readout9. Unfortunately the optical system, and especially the
+fluorescent screen largely degrade the resolution of those systems. In addition those systems present
+an intrinsic high noise as compared to other technologies of detectors, which reduces their domains of
+application.
+Ongoing developments focus on new scintillator materials used to convert X-rays into visible light.
+Thinner layers would increase the resolution especially with high energy photons, and faster scintil-
+lators would enable higher frame rates. Also faster electronics are being developed, as it is also a
+limitation to the frame rate of cameras.
+8various systems used in the synchrotron world. Some examples: Dalsa-Medoptics CCD, Hamamatsu Photonics,
+Philips, GE Medical Systems, The FRELON system developed at ESRF[12]...
+9Typical systems offer readout speed of a few seconds (up to 15), but new highspeed systems are able to have frame
+rates as high as 20Hz.
+22 Introduction
+Figure 1.19 : A CCD camera from the MAR Com-
+pany with its optical coupling system visible. Figure 1.20 : The image plate MAR 345 detector.
+Image plates
+Image plates10 (sometimes called memory phosphors, storage phosphors or photo stimulated phos-
+phors) are based on thermoluminescent materials, also referred to as thermoluminescent dosimeters
+(TLD). In this type of materials, the absorption of the incoming ionizing particle leads to the cre-
+ation of electron-holes pairs, which are trapped in purposely introduced defects in the crystal. So
+the material acts as an integrating detector, in which the number of "stored" electrons and holes in
+the defects of the crystal reflects the intensity of the incoming beam. To obtain the image, energy
+has to be provided so that electrons and holes can escape from the traps and recombine, giving a
+luminescent signal. So classical systems consist of a laser scanning the plate after the acquisition, an
+optics (usually an array of optic fibers), which collects the luminescent signal and a photomultiplier
+or an avalanche photodiode to collect the signal.
+Image plates are available in very large areas (the mar345 is as large as 300 mm in diameter), and offer
+a large dynamics. Their drawbacks lie mainly in the presence of noise, and in their very limited speed
+(the plate has to be scanned to readout the image and typically several minutes are needed per image).
+Gas-filled detectors
+Gas-filled detectors use a gas both for the absorption of the ionizing radiations, and for the ampli-
+fication stage of the signal (electron multiplication). This is now a mature technology, which is still
+interesting because of the major advantages it offers. Unfortunately, gas-filled detectors also suffer
+from certain drawbacks, which prevent their generalized use nowadays.
+A more extensive description of gas-filled detectors is given in Chapter 2, as well as the description
+of this project, which aims at overcoming their limitations.
+10Mar produces the most common image plates used in the synchrotron world, especially in Macromolecular crystal-
+lography.
+1.4 Imaging detectors 23
+1.4.2 technologies under developments
+1.4.2.1 Spectroscopy Detectors under development
+Developments focus on new technologies such as Silicon Drift Detectors in which the created charges
+drift in a high resistivity, fully depleted silicon wafer. Electrons are collected on the edge of the
+detector. Those detectors enable the measurement of simultaneous events occurring at different
+places of the detectors, by being able to distinguish several rise times of the collected charge.
+Already used techniques explained in the previous section are also under permanent development.
+Also multielement detectors are being developed to offer higher count rates capabilities and larger
+surfaces.
+1.4.2.2 Imaging Detectors under development
+CCD detectors and image plates are currently the most common imaging detectors. CCDs are used
+when high speed is mandatory, while image plates offer large areas as well as a very good dynamic.
+To answer the growing needs of the imaging community, strong progress has to be achieved in the
+domains of dynamics, noise, and readout speed.
+So the next step for imaging lies in the use of detectors operated in counting mode with a massively
+parallel electronics (meaning each pixel is connected to a built in electronics where the first stage of
+amplification and signal processing is performed, before the image is read out). This new approach is
+possible thanks to the recent developments in the semiconductor industry, which offers components
+small enough for this level of integration.
+This approach will force the use of other technologies, for current CCD based systems as well as image
+plates cannot be used in counting mode: the physical processes involved in the detection are too slow
+to enable this approach (fluorescent materials as well as thermoluminescent materials have decay time
+constants which are incompatible with single photon counting). So systems using a direct conversion
+of the photon into the electric signal must be used (instead of a several steps conversion system like
+in fluorescent+CCD or trapping+luminescence+photomultiplier). The 2 major possibilities are the
+use of solid materials (Pixel and amorphous selenium detectors) or gas amplification based systems
+(using the photoelectric effect to produce the initial charge).
+24 Introduction
+Pixel detectors
+Figure 1.22 : A large area Gas Filled
+Figure 1.21 : Schematic of pixel detectors. detector.
+Photon-counting pixel detectors arrays are hybrid devices made of a semiconductor sensor connected
+to a parallel CMOS readout circuit. The sensor is a Silicon (or another semiconductor) die with a
+pixel electrode structure connected to the CMOS circuit by bump-bonding flip-chip technology (see
+Figure 1.21). The sensor is fully depleted by applying a sufficient voltage bias. The photoelectric charge
+created after X-ray absorption in the sensor is collected to the closest pixel of the CMOS circuit
+along the bias field. Each pixel acts as an independent particle detector, including a complete pulse
+processing chain as well as an event counter.
+This kind of detectors currently achieves the best performance in terms of speed, and resolution.
+Unfortunately, only small sizes can be manufactured yet11, and for large areas, arrays of detectors
+have to be assembled. This results in inhomogeneities, which have to be compensated and dead zones.
+The leading projects in this field are Pilatus (developed at the Paul Scherrer Institute (SLS detector
+Group) in Switzerland) [13, 14] and the MaxiPix project developed by the Medipix consortium [15].
+Here again, the integration of the readout electronics is a challenge!
+Amorphous selenium/silicon detectors
+Amorphous semiconductor detectors are based on the liquid crystal display technology. Essentially,
+they are a matrix of capacitances charged (or discharged) by the current generated in the X-ray
+irradiated amorphous semiconductor (often selenium). The charge is read by the TFT transistor
+switches present at each pixel capacity. The main difficulty lies in the availability of a good quality
+material, to permit the drift of the created charges to the transistors.
+They are integrating detectors.
+Gas-filled detectors
+Very few technologies currently offer perspectives for large areas, especially in the case of fast detectors
+(used in counting mode, with low noise...).
+11typically $14 \times 14$ mm$^2$
+1.4 Imaging detectors 25
+Gas-filled detectors can offer a solution. More details on gas detectors, and on the link of this project
+with gas detectors are given in the next section.
+
+Bibliography
+[1] ESRF, “European synchrotron radiation facility long-term strategy,” tech. rep., ESRF, 2006.
+http://www.esrf.eu/AboutUs/Upgrade/.
+[2] Albert Thompson et al., X-Ray data booklet. Lawrence Berkeley National Laboratory, available
+at http://xdb.lbl.gov/ ed., 2001.
+[3] G.F.Knoll, Radiation Detection and Measurement. Wiley, 2000.
+[4] G.Zanella et al., “The detective quantum efficiency of an imaging detector,” Nucl. Inst. and
+Meth. A, vol. 359, pp. 474–477, 1995.
+[5] G.Zanella et al., “The role of the quantum efficiency on the dqe of an imaging detector,” Nucl.
+Inst. and Meth. A, vol. 381, pp. 157–160, 1996.
+[6] S.M.Gruner et al, “Charge-coupled device area x-ray detectors,” Review of Scientific Instru-
+ments, vol. 73,8, pp. 2815–2842, 2002.
+[7] C.Ponchut, “Characterization of x-ray area detector for synchrotron beamlines,” Journal of
+Synchrotron Radiation, vol. 13, pp. 195–203, 2006.
+[8] C.Ponchut et al., “Experimental comparison of pixel detector arrays and ccd-based systems for x-
+ray area detection on synchrotron beamlines,” IEEE Trans. Nucl. Sci., vol. 52,5, pp. 1760–1765,
+2005.
+[9] W.Hillen et al., “Imaging performances of a digital phosphor system,” Med.Phys., vol. 14,5,
+pp. 744–751, 1987.
+[10] J.P.Moy, “Signal-to-noise ratio and spatial resolution in x-ray electronic imagers: Is the mtf a
+relevant parameter?,” Med. Phys., vol. 27,1, pp. 86–93, 2000.
+[11] R.H.Menk et al, “Novel detector systems for time resolved saxs experiments,” J. Appl. Cryst.,
+vol. 33, pp. 778–781, 2000.
+28 BIBLIOGRAPHY
+[12] J.C.Labiche et al., “Frelon camera: Fast readout low noise,” ESRF Newsletter, vol. 8, no. 25,
+pp. 41–43, 1996.
+[13] C.Broennimann et al., “The pilatus 1m detector,” Journal of Synchrotron Radiation, vol. 13,
+pp. 120–130, 2006.
+[14] “Pilatus website.” http://pilatus.web.psi.ch/.
+[15] “Medipix website.” http://medipix.web.cern.ch/MEDIPIX/.
+Chapter 2
+The basics of gas-filled detectors
+2.1 historical background
+The history of gas-filled detectors starts around 100 years ago when Rutherford and Geiger (working
+at the Manchester University) discovered electron multiplication in a gas-filled tube with a thin wire at
+the axis position.
+In 1928, Geiger and Mueller introduced the well known (and still used!) Geiger Tube, one of the
+oldest type of ionizing particle detector. The Geiger Counter was the first electronic ionizing particle
+detector.
+Later, in the Manhattan Project [1], the gas-filled detector technology was largely improved. The
+multiple wire proportional counter (MWPC) was invented. It was later implemented in high energy
+physics by Georges Charpak, and revolutionized this field of physics.
+Figure 2.2 : Schematic of the Geiger Mueller
+Figure 2.1 : A modern Geiger Mueller Counter.
+Counter.
+Nowadays, gas-filled detectors are used in a large variety of research fields as well as for various
+30 The basics of gas-filled detectors
+industrial applications. They are routinely used for the detection of fast and heavy particles (high
+energy physics), for the monitoring of nuclear facilities and other radioactive environment, for photon
+detection and imaging (medical applications, non destructive analysis), etc...
+2.2 Principle of gas-filled detectors
+A detailed description of modern gas-filled detectors can be found in G. C. Smith’s article [2]. A
+deeper analysis of the principles of gas filled detectors (with delay lines) is in A.-M. Petrascu’s article
+[3]. Status of development of gas-filled detectors at the ESRF (giving more details on the specificity
+of gas-filled detectors used in the synchrotron radiation world) is found in M.Kocsis article [4].
+In a gas-filled detector, the gas is used for two purposes:
+• First it absorbs a fraction of the energy of the incoming photon/ionizing particle. In result of
+this interaction, one or several electron-ion pairs are created (ionization of one particle of the
+gas).
+• Secondly, it provides an internal multiplication of the electrons. This internal multiplication (typically
+a gain factor of $10^4$ to $10^5$) is sufficient to enable each photon to be directly and separately
+counted by some electronics.
+2.2.1 The X-ray absorption in the gas
+Figure 2.3 : The cross sections of various interaction processes in the case of Lead.
+In a gas-filled detector, the first function of the gas is to absorb part of the energy of the incoming photon
+to create an electron, as a base of the electric signal.
+2.2 Principle of gas-filled detectors 31
+In the case of the travel of one X-ray photon through matter, several sorts of interactions can occur
+between this photon, and the atoms (in our case those of the gas), but mainly three are of importance
+for photon measurements (see Figure 2.3): the photoelectric absorption ($\tau$ in Figure 2.3), the Compton
+scattering ($\sigma_{incoh}$ in Figure 2.3), and the pair production ($\kappa_n$ and $\kappa_e$ in Figure 2.3). The latter one
+can occur only in the case of highly energetic photons (more than 1.02 MeV $= 2\,m_{\mathrm{electron}} c^2$, more
+often called gamma rays), so it will not play any role in the case of low energy X-rays.
+The two others govern the law of absorption of the photon in the gas. Their respective probability
+is measured by their respective cross sections, which in general depend on the element, the density
+and the energy of the photon.
+The photoelectric effect is dominant for energies up to a few 100s of keV depending on the element
+atomic number. Then Compton scattering becomes increasingly important, until it is dominated by
+pair-creation.
+Compton Scattering
+The interaction process of Compton Scattering takes place between the incident X-ray, and an elec-
+tron in the gas. It is an elastic scattering process. The photon is deflected through a certain angle
+θ with respect to its original direction, while leaving part of its energy to the electron, then called
+recoil electron. The energy deposited depends on the angle of deflection, and is increasing with θ.
+Photoelectric absorption
+The photoelectric process is the very process at the source of the electron production in the gas. When
+a photon is absorbed by an atom in such a way, its energy is fully transferred to an electron,
+ejected by the atom from one of its bound shells. The result is the creation of an electron-ion pair,
+with the electron energy being $E_{e^-} = h\nu - E_b$, where $E_b$ is the binding energy of the photoelectron
+in the original shell.
+In the case of X-rays, the most probable absorption occurs with electrons from the inner shells.
+Shortly after the photoemission process, there is a rearrangement of the electrons inside the atom, or
+the absorption of a free electron from the medium. Either one (or more) characteristic X-ray photons
+may be emitted, or an Auger electron will be created to enable the excited ion to reach a more stable
+state. In the case of an X-ray photon re-emission, this photon often is reabsorbed via photoelectric
+effect, thus creating another electron-ion pair, but with less energy.
+2.2.2 The amplification and the modes of operation of gas-filled detectors
+The internal amplification of the signal
+After the first ionization of a gas particle occurred (by the incoming detected particle), the created
+electron is thermalized and under moderate fields, the gained energy is lost in collisions with the
+gas molecules. In the regions where the gained energy between two collisions is exceeding a certain
+level (typically $\sim 35$ eV), it becomes an ionizing particle, which will later ionize another gas particle,
+creating a second electron, and finally leading to a cascade of ionizations (as secondary electrons are
+32 The basics of gas-filled detectors
+produced).
+The amplification of the signal will then depend on several factors such as
+• The type of gas,
+• its density,
+• the accelerating electric field and its shape.
+This leads to various Modes of operation, which are classified for a certain gas, as function of the
+applied electric field.
+Modes of operation of gas-filled detectors
+Depending on the applied accelerating potential, various modes of operations of gas amplification are
+distinguished. The Figure 2.4 (extracted from [5]) gives the amplitude of the signal collected after the
+absorption of a particle and the corresponding amplification modes. The two curves correspond to
+two different amounts of energy deposited in the gas. The result with two X-rays of different energies
+would be alike.
+The different modes of operation of gas amplification are:
+Recombination region When the electric field is very low, the field is insufficient to prevent re-
+combination of the ions pairs. The current collected on the electrodes is very low, as only the
+fraction of the created ions pairs, which did not recombine is collected.
+Ion Saturation From a certain value of applied voltage, the electric field is strong enough to effec-
+tively separate the charges created after absorption of the energy of the ionizing particle. Then
+almost all pairs are collected and the intensity corresponds to the rate of creation of charges in
+the volume of the detector.
+Proportional region When the applied tension is further increased, the mean energy gained by
+electrons between collisions is higher than the ionization energy. From this moment an ampli-
+fication of the signal occurs. For a certain tension, the intensity collected is proportional to the
+original number of ions pairs created. This is the region of true proportionality.
+Limited proportional region and Geiger mode Higher electric fields result in the appearance of
+non linearities: when the electric field becomes very strong, the amount of charges present in the
+gas becomes high enough to severely alter the electric field resulting from the applied tension.
+Eventually, this Space Charge can become completely dominant and fully determine the pulse
+shape. This last mode is the Geiger mode of operation of the detector.
+In order to avoid a dependence of the amplification on the localization of the deposited charge in the
+detector chamber, and to improve the stability of the system, the strong electric field is applied only
+in a thin region of the chamber. In the rest of the chamber, where electrons are created, only a drift
+field is applied. This also limits the spread of the electron cloud (going exponentially with distance),
+which occurs during the multiplication and limits the loss of resolution while preserving an absorbing
+area sufficiently large.
+2.2 Principle of gas-filled detectors 33
+Figure 2.4 : Regions of operation of gas-filled detectors for two deposited energies.
+Usually the collection of the electrons is performed with a 2D array of wires, which enables propor-
+tional amplification mode (the so called multiwire proportional counters introduced by Charpak and
+coworkers in 1968 [6]).
+Classical gas mixtures are composed of Xenon, Krypton, Argon, Methane, CF4 etc... (see [2]).
+2.2.3 The benefits of gas-filled detectors
+The main advantages of gas-filled detectors as compared to the previously described types of detectors
+are:
+• their intrinsic speed mainly limited by the electronics
+• their dynamic range, also limited by the memory depth
+• their available size (among the largest detectors)
+• their cost of development and manufacturing
+• their easiness of operation, and robustness.
+Gas detectors find domains of applications in most fields of photon science. They are some of the very
+few types of detectors, which can be built in very large areas. In the high energy physics experiments,
+it is common to find detectors of several square meters, and covering solid angles of almost $4\pi$.
+2.2.4 The limitations of gas-filled detectors
+Main limitation
+As compared to other technologies of detectors, gas-filled detectors suffer mainly from one disad-
+vantage, which made them almost abandoned in whole fields of photon science: They have an
+34 The basics of gas-filled detectors
+intrinsic low quantum efficiency, they leave a great number of incoming particles undetected
+(said another way, they are photon hungry).
+This is simply due to the very low density of gases, and so very low stopping power. To overcome
+this, it is possible to increase the pressure of the gas, but this is at the expense of amplification
+characteristics, which are best at low pressures...
+They also suffer from severe parallax errors leading to a loss of resolution as soon as the incoming
+particles do not have a direction perpendicular to the detector (see Figure 2.5).
+Figure 2.5 : Parallax error is the loss of resolution due to the absorption of non perpendicular photons all
+along the depth of the ionizing chamber, thus broadening the position response of the detector.
+So when considering their application in photon research, other technologies less photon hungry are
+usually used, even if they offer poorer performances in most other characteristics.
+other limitations Another weakness is linked to the use of wires to collect the charges after
+multiplication (MWPC). The small radius of those wires makes them very sensitive to discharges in
+the detectors (more likely with increasing acceleration voltages/gains). It is indeed very difficult to
+repair broken wires in the detector. In addition the broken wires are likely to create short circuits
+and create further damage.
+Modern gas-filled detectors overcome this by using microstructures in place of the traditional wires.
+2.3 Recent Evolutions of gas-filled detectors 35
+2.3 Recent Evolutions of gas-filled detectors
+There have been various recent evolutions of the classical gas-filled detectors to overcome their weak-
+nesses and keep their advantages.
+The main attempts of improvements of gas-filled detectors over the last few years have been stripped
+detectors, as well as hybrid gaseous multipliers. Interesting Parallax Reduction Techniques were also
+introduced.
+Parallax reduction techniques
+The simplest technique to reduce parallax errors, is to build a curved detector. This technique has
+been successfully used at ESRF ([7]) and later at the Rutherford Appleton Laboratory ([8]). In
+addition it largely suppresses the charge spread problem.
+Figure 2.6 : Curved gas-filled detectors do not suffer from parallax errors.
+Other methods of correction such as off line correction by determination of the X-ray absorption
+depth were also demonstrated ([9]) but never used in the synchrotron world.
+For area detectors, solutions to reduce parallax were offered very early after the idea of MWPC was
+published. Charpak’s group at CERN proposed to add a spherical drift chamber to the front of the
+MWPC [10]. This idea was successfully applied to a working device, which became the workhorse of
+the synchrotron LURE in the 80’s ([11]). The idea was then bettered in the late 90’s [12].
+Micro-Pattern
+Strip detectors are an answer to the fragility of MWPC’s wires and limited amplifications character-
+istics (limited by space between wires). They also permit to avoid the difficult manufacturing of the
+chambers (to place the wires of the chamber).
+A large number of structures have been proposed over the last 20 years such as micro-strip gas
+36 The basics of gas-filled detectors
+chambers [13], the microgap chamber [14], the compteur à trous [15], the gas electron multiplier [16],
+the micro-mesh gaseous structure [17], or the micro-pin array [12].
+Figure 2.7 : GEMs are thin metal-clad polymer foils pierced by a high density of holes. On application of a
+difference of potential, between the two electrodes (sides) electrons drift and multiply in the holes.
+Among those detectors, GEMs (Gas Electron Multiplier) created the largest interest. Introduced
+in 1996 by F. Sauli and his colleagues from CERN [16], GEM’s key feature is a three-layer (metal-
+insulator-metal) grid which is used both for the amplification of the signal, and for ion feedbacks
+prevention (to protect the photocathode, used to convert electrons). Several of such grids can be as-
+sociated to increase the amplification of the system. Working devices were reported in various groups
+in the world and developments are ongoing to improve this technology. GEMs foils are routinely pro-
+duced at CERN, and are now commercially available thanks to the company Tech-Etch Inc.[18, 19].
+Resolution and speed improvements
+The limiting factor of spatial resolution of the detector is the photoelectron range.
+The center of mass of the produced electrons during multiplication reflects the position of the original
+ionization process, and so of the detected particle. Delay-line encoding or charge division methods
+are naturally determining the center of gravity of the electron cloud below the anode spacing. The
+speed of the above system is limited to Mega counts per seconds (Mcps) range. For example, the
+RAPID (Refined ADC Per Input Detector) system [20] developed at the Daresbury synchrotron in
+the UK, is able to determine the position of this center of mass by comparing the amount of charges
+on the different anodes reached by the cloud of electrons. As a result, the detector is able to position
+the original impact with a speed of $10^7$ counts per second.
+2.4 Gas amplification compared to Microchannel plates 37
+2.4 Gas amplification compared to Microchannel plates
+Microchannel plates (MCP) are devices able to amplify signal with a very large gain in vacuum.
+Figure 2.8 : A two slab Micro Channel Plate (Chevron configuration)
+They consist of a thick slab of highly resistive material (glass, silicates) riddled with small tubes
+(diameter ∅ ∼ 10 µm, and interspace ↔∼ 15 µm) leading one face to the other: the microchannels.
+The face of the tubes is covered by a continuous-dynode electron multiplier. The application of a
+strong potential between each face (∼ 500 V ) enables the acceleration of electrons in the tubes, which
+hit the surface of the tube, leading to an amplification of the signal as they create secondary electrons
+at each impact.
+Modern MCPs usually consist of several slabs of MCPs with an angle between the successive tubes
+(chevron or V-like geometry). This geometry leads to a greater amplification for the same applied
+voltage, and to an excellent compactness.
+Unfortunately, MCPs suffer from major problems:
+• Especially for single events, the gain of MCPs is very dispersed. If used in saturation mode, the
+pulse height is stable and the time jitter small, but the pulse decay is long and not constant.
+If used in linear mode and associated with a constant fraction discriminator, the pulse from a single
+particle is assumed to be an impulse response with variable height but fixed shape.
+• They suffer from a limited speed, meaning they cannot reach high count rates (∼ 150 kHz).
+• They can only amplify a fixed total charge during their lifetime, so they need to be replaced frequently.
+• They are not available in very large surfaces (diameter area ∼ 10 cm).
+38 The basics of gas-filled detectors
+Compared to gas amplification system, they offer for the same stability in operation, a better gain
+and a very good compactness. Unfortunately, this is a much slower system, which degrades over time
+and is less easy to maintain. In addition they cannot be built in very large areas (several 10s of
+centimeter).
+Those reasons, especially their limited count rate capabilities make them a difficult choice for high
+count rates detectors.
+2.5 A promising approach to overcome Gas-filled detectors limita-
+tions
+A promising approach to overcome the parallax of gas filled detectors (see 2.2.4) is the use of a solid
+converter called Photocathode. The solid state materials density is roughly 1000 times that of a gas.
+As a result, a few microns are enough to absorb the incoming photons and convert them into an electric
+signal. This presents several advantages, including the absence of parallax errors (see Figure 2.5), a
+better efficiency, and a higher compactness of the detector.
+Bibliography
+[1] M. P. T. S. National nuclear Series, Ionization Chambers and Counters. Experimental Techniques.
+McGraw-Hill Book Company, Inc, 1949. p97.
+[2] G.C.Smith, “Gas-based detectors for synchrotron radiation,” Journal of Synchrotron Radiation,
+vol. 13, pp. 172–179, March 2006.
+[3] A.-M. P. et al., “A beginners’ guide to gas-filled proportional detectors with delay line readout,”
+Journal of Macromolecular Science, vol. B37:4, pp. 463–483, 1998.
+[4] M.Kocsis, “The status of gas-filled detector developments at a third generation synchrotron
+source (esrf),” Nucl. Inst. and Meth. A, vol. 471, pp. 103–108, September 2001.
+[5] G.F.Knoll, Radiation Detection and Measurement. Wiley, 2000.
+[6] G.Charpak et al., “The use of multiwire proportional counters to select and localize charged
+particles,” Nucl. Inst. and Meth., vol. 62, pp. 262–+, 1968.
+[7] V.Zhukov et al., “A curved micro-strip gas counter for synchrotron radiation time resolved
+saxs/waxs experiments,” Nucl. Inst. and Meth. A, vol. 392, pp. 83–88, 1997.
+[8] J.E.Bateman et al., “A gas microstrip wide angle x-ray detector for application in synchrotron
+radiation experiments,” Nucl. Inst. and Meth. A, vol. 477, pp. 340–346, 2002.
+[9] J.E.Bateman et al., “Improving the performance of the mwpc x-ray imaging detector by means
+of the multi-step avalanche technique,” Nucl. Inst. and Meth. A, vol. 239, pp. 251–259, 1985.
+[10] G.Charpak et al., “The spherical drift chamber for x-ray imaging applications,” Nucl. Inst. and
+Meth., vol. 122, pp. 307–312, 1974.
+[11] R.Kahn et al., “An area-detector diffractometer for the collection of high resolution and mul-
+tiwavelength anomalous diffraction data in macromolecular crystallography,” Nucl. Inst. and
+Meth. A, vol. 246, pp. 596–603, 1986.
+40 BIBLIOGRAPHY
+[12] P.Rehak et al., “Mipa: A new micro-pattern detector,” IEEE. Trans. on Nucl. Sci., vol. ns-44,
+pp. 651–655, 1997.
+[13] A.Oed et al., “Position-sensitive detector with microstrip anode for electron multiplication with
+gases,” Nucl. Inst. and Meth. A, vol. 263, pp. 351–359, 1988.
+[14] R.Bellazzini et al., “The microgap chamber: a new detector for the next generation of high
+energy, high rate experiments,” Nucl. Inst. and Meth. A, vol. 368, pp. 259–264, 1995.
+[15] F.Bartol et al., “The c.a.t. pixel proportional gas counter detector,” Journal de Physique III,
+vol. 6, pp. 337–347, 1996.
+[16] F.Sauli et al., “Gem: A new concept for electron amplification in gas detectors,” Nucl. Inst. and
+Meth. A, vol. 386, pp. 531–534, 1996.
+[17] Y.Giomataris et al., “Micromegas: a high-granularity position-sensitive gaseous detector for high
+particle-flux environments,” Nucl. Inst. and Meth. A, vol. 376, pp. 29–35, 1996.
+[18] “Tech-etch inc..” http://www.tech-etch.com/.
+[19] B.Surrow et al., “Development of tracking detectors with industrially produced gem foils,” Nucl.
+Inst. and Meth. A, vol. 572, pp. 201–202, 2007.
+[20] R.A.Lewis et al., “The ”rapid” high rate large area x-ray detector system,” Nucl. Inst. and Meth.
+A, vol. 392, pp. 32–41, 1997.
+Chapter 3
+Photocathode for gas-filled detectors
+What is a photocathode?
+A photocathode is a solid converter: it converts photons into electrons. The energy deposited by the
+incident particle enables the creation of hot electrons (more energetic than free electrons), which exit
+the photocathode at a position very close to the entry of the incoming particle.
+Photocathodes have to suit the following requirements:
+• Good conversion efficiency
+• Chemical stability : as the photocathode has to operate in a gas, it must be reasonably chemically
+stable
+3.1 Basics of Photocathodes
+There is currently no theory to describe precisely and predict numerically the characteristics of pho-
+tocathodes. Only phenomenological models can be made to help predicting the characteristics of
+materials as good photocathodes.
+This comes from the extreme complexity of the physics of electron transport into matter, as the
+cascade of events varies not only with the type of material (chemical nature and related physical
+properties), but also with the microscopic structure of the material (most defects, grain boundaries,
+or impurities act like traps for electrons).
+42 Photocathode for gas-filled detectors
+Figure 3.1 : After its creation, the hot electron rapidly loses its energy because of several interactions
+with the lattice or other electrons. Few electrons actually reach the surface.
+Figure 3.2 : The region of the photocathode contributing to yield. L is the scattering length, la is the
+absorption length.
+As a result only the physics of the absorption of the incoming photon into the matter is well described.
+To go further, one has to use approximate models, which cannot lead to numerical predictions of the
+efficiency and speed of the photocathode.
+The best (phenomenological) model to describe photocathodes is called the Spicer Three Step Model.
+It was developed approximately forty years ago by William E. Spicer, when he was working for SLAC
+(The Stanford Linear Accelerator Center)[1].
+This model basically separates the process in three major steps:
+• Absorption
+• Electron transport to the surface
+• Extraction from the surface.
+More precisely, the model consists in examining the contribution of a slab dx at a distance x from
+the surface to the emitted electrons.
+This contribution, di(x), depends on:
+• the amount of photons which arrive at this depth,
+• the probability for an electron photoemitted in this slab to reach the surface.
+The total yield of the photocathode is then obtained by integrating di(x) over the whole volume.
+To help comparing materials, the model defines two lengths:
+• la is the absorption length in which most of the photons are absorbed. It is the 1/e length where
+the intensity of the incident beam has dropped to 1/e.
+3.1 Basics of Photocathodes 43
+• L is the scattering length: the distance electrons can go over before they are thermalized.
+The quality of a material can then be examined with the ratio $l_a/L$, which should be as small as possible,
+and ideally smaller than unity.
+The model also enables to define the active volume as the portion of the photocathode next to the
+surface, which is at a distance smaller than both la and L (see Figure 3.2 on page 42). This is the region
+of the photocathode, which is close enough to the surface to enable electrons to escape, and at the
+same time in the region of absorption of the photons, so contributing to the yield.
+Absorption
+From the presented model, it is evident that a material with a high stopping power (small la) will
+produce more electrons close to the surface, so more electrons with a high probability to escape the
+material. In practice, these are materials with a high Z (superior to 50, or ideally to 70), which
+present the best stopping powers.
+Figure 3.3 : Electrons with energy EC < E < EC + EG have higher mean free path.
+Electron Transport
+The capacity of the Photocathode to transport hot electrons to the surface depends strongly on the
+type and quality of the material it is made of. This is measured in the Spicer model by the value of
+the ”scattering length” L. This value is closely related to the value of the mean free path and that of
+the average loss of energy of electrons in the material.
+To maximize the value of L, it is best to have a semiconductor. First because in metals, hot electrons
+get thermalized very easily by the many free electrons. Secondly, in semiconductors, there is the
+44 Photocathode for gas-filled detectors
+appearance of the so called Magic window. The magic window is a region in the conduction band
+(Ec < E < Ec + EG) where electrons have a much higher mean free path. Indeed, electrons having
+such an energy cannot excite another electron in the conduction band, for this would result in two
+electrons in the forbidden gap of energy. The electron ion pair creation being a dominant process at
+those energies, this results in a much higher mean free path of electrons in the window.
+It is also of strong importance to have defect free materials: each defect in the material (vacancy, dis-
+location, grain boundaries...) acts like a trap for hot electrons, for they often result in dangling bonds.
+To have further details, one can look at Henke’s papers [2, 3], in which a more precise model for
+electron transport is given (especially concerning electron-electron and electron-plasmon interactions).
+Those references also highlight how the efficiency of the photocathodes is closely related to the prod-
+uct Eµ(E), where E is the energy of the incoming photons, and µ(E) the mass absorption coefficient
+of the photocathode material.
+Extraction
+Electrons close to the surface do not necessarily go in the vacuum: they have to overcome a poten-
+tial barrier called work function φm in metals or electronic affinity χsc in semiconductors (Figure 3.4).
+Figure 3.4 : To exit the solid, e− have to overcome the work function φm or electronic affinity χsc
+Figure 3.5 : The band structure of an NEA semiconductor close to the surface
+This barrier is often several eV high, so very few electrons can overcome it, leading to a poor yield.
+To maximize the photocathode efficiency, one must select materials with a very low electronic affinity.
+There are materials such as CsI, or hydrogenated diamond, which offer a Negative Electron Affinity
+(NEA). Those materials are of course of special interest for they act like a kind of hot electron
+fountain: hot electrons close to the surface see an attracting potential, which tends to eject them
+from the material. The quantum efficiency of this sort of material is of course much better than that
+3.2 Improved Models of Photocathodes 45
+of classical materials.
+Their main disadvantage comes from their very high chemical sensitivity. For the potential tends
+also to attract anions, the negative affinity rapidly disappears as the surface gets polluted. So they
+require special cleanness of the environment, which is hard to achieve when the photocathode is in a
+gas chamber. It was also found that the coating of the surface with materials like caesium or TMAE
+can improve this efficiency (see additional details in the following section, or see [4], published in 1936!).
+This effect is usually explained by the appearance of dipoles at the surface of the materials, which
+lower the electronic affinity.
+The Contradictions
+Already several contradictory requirements appear for the photocathode :
+• The photocathode must be thick to absorb the incoming particles, but thin to let electrons
+escape.
+• It should be made of high Z materials, but should be defect free. In terms of availability, there
+are very few high Z materials (especially in the case of semiconductors), which can be processed
+with a good purity and few defects.
+• It would better be NEA but has to be chemically very stable.
+So one has to choose the best compromise to finally achieve an optimal quantum efficiency in a certain
+energy range.
+3.2 Improved Models of Photocathodes
+Obviously the model presented in the previous section is very simple, and it cannot be used for
+quantitative analysis. It is yet the only general model.
+Yet more accurate models were developed to predict quantitative secondary emission yield, as well
+as the energy distribution of both photoemitted electrons, and secondary emitted electrons.
+Unfortunately all those models are material specific (they usually study CsI, considered as the most
+interesting material for photocathode application [5, 19, 7]), for they use extensively fitted parameters.
+Most of them were developed for Monte Carlo based analysis. So it is difficult to use this sort of
+models for prediction of efficiencies of new materials.
+More details will be given in the section dedicated to the Monte Carlo Analysis.
+3.3 Major technologies of photocathodes currently available
+Most materials now used as photocathodes have been known for a long time. A compilation by
+P. Miné then at Ecole Polytechnique in 1993 [8] is still valid (this publication deals with photoemissive
+materials in the UV, but the state of knowledge in the X-ray energy range is not really different).
+Jochen Teichert, Rong Xiang, Guy Suberlucq and Jeroen W.J Verschuur also made a Report on
+46 Photocathode for gas-filled detectors
+Photocathodes in 2004 but again, mainly focused on photocathodes in UV and Visible range for
+electron injection system applications [9]. Focus was given on a better control of the fabrication
+process to ensure the best quality of cathodes.
+3.3.1 Metallic Photocathode
+Metallic photocathodes are the oldest type of photocathodes.
+Classical materials include gold, copper, and silver. Gold is of all those materials the best, for it offers
+the best efficiency (highest atomic number so excellent stopping power), an excellent speed, as well
+as the best chemical stability (noble metal) .
+Gold is used for photocathodes in a wide range of application where high chemical stability, high
+conductivity and speed are mandatory. This is especially the case for photo-injectors in synchrotrons
+and X-fels (injectors made of photocathode excited with pulsed UV-laser to create the packets of
+electrons) where high quality pulses of electrons (in terms of intensity and shortness) are mandatory.
+The photocathode is often used in RF cavities coupled with the pulsed laser to enable the creation
+of extra short/very high intensity electron packets.
+NB. RF cavities cannot be used to improve the efficiency of gas-filled photodetectors, because they
+work exclusively under ultra high vacuum (discharge problem) so are incompatible with gas amplifi-
+cation.
+Past studies of metallic photocathodes
+Metallic photocathodes were mostly studied during the 70’s and early 80’s (though, some older
+references can be found). Classical references include:
+• for Gold, Copper and Silver: [10, 11, 3, 12, 13].
+• for Aluminum and Al2O3: again [3, 13, 12].
+• other materials such as Tungsten, Molybdenum, Silver, and Palladium are presented in
+[10]
+For the X-ray energy range as well as for the UV energy range, gold is the most suitable metallic
+photocathode. Recent measurement using synchrotron radiation facilities [14, 15] report all with good
+agreement efficiencies of a few tenths of a percent in the 1-10 keV energy range. [16, 17] also provide
+interesting results even if the quantum efficiency is not directly measured. Lastly H.Henneken et al.
+reported measurements of the efficiency of gold in the case of the specific Au(111) surface [15].
+3.3.2 Semiconducting Photocathode
+As previously discussed, semiconductors are theoretically much better materials in terms of quantum
+efficiency. Their availability in excellent purities and almost defect free bulk materials make them a
+very attractive choice.
+In practice several compounds offer excellent efficiencies in the visible or infrared ranges (Alkali
+antimonides such as Cs3Sb, K3Sb, Na2KSb, K2CsSb). Unfortunately they all present a high
+3.3 Major technologies of photocathodes currently available 47
+reactivity to moisture and oxygen, which makes their manipulation difficult, and also completely
+unsuitable for gas amplification based systems.
+Other systems were studied because of their insensitivity to visible photons, and high efficiency in
+the UV range (solar blind photocathodes for spatial application). Those photocathodes reacting
+to wavelength smaller than 380nm, often exhibit a negative electron affinity (eventually after an
+activation with Cs or another material).
+Theoretical analysis of secondary emission by semiconductors can be found in [3, 2].
+Materials, which created interest include
+• boron nitrides BN reported to present NEA characteristics [18]
+• Gallium Arsenide GaAs also reported to present NEA when Cs activated (see [19], which
+compares GaAs with other semiconductors, as well as [20, 21])
+• Gallium nitride, Indium Gallium Nitrides and Aluminum Gallium Nitrides GaN,
+InGaN and AlxGa1−xN were extensively studied because of their potential for solar blind
+detectors ([22, 23, 24, 25]).
+Unfortunately when it comes to X-rays, common semiconductors such as gallium arsenide, silicon or
+germanium are completely inefficient. Indeed those materials do not have the stopping power suitable
+for energetic photons, for electrons cannot reach the surface before they are thermalized. In addition,
+those materials are available only in small dimensions.
+Heavier materials being much harder to process in good quality, there are very few materials, which
+are actually used as photocathodes. CsI is the exception, and it will be later described.
+3.3.3 Organic Photocathode
+Organic photocathodes such as TMAE (tetrakis(dimethylamino)ethylene), or C6H5, have created
+great interest in the 80’s for they exhibit a negative electron affinity. They were also used as activator
+(like Cs). Unfortunately, they are of no interest in the X-ray energy range, because of their very low
+stopping power. The interested reader can find information in P. Miné’s review [8].
+3.3.4 CsI
+Since its first discovery by Taft and Philipp in 1957 [26] and its further studies by J. Edgecumbe
+and E. L. Garwin in 1965 [27, 28], CsI has probably been the material, which was the most widely
+studied. This comes from several advantages it offers:
+• Excellent quantum efficiency: the material exhibits NEA properties, and an excellent stopping
+power (high Z).
+• A rather good chemical stability, at least if compared to most other materials with similar
+characteristics. Still the material is hygroscopic and suffers from degradation with time.
+• Easiness of synthesis and deposition.
+48 Photocathode for gas-filled detectors
+From the beginning, a lot of efforts were put in attempts to reduce its sensitivity to moisture and
+need for cleanness (UHV conditions) [29, 8, 13, 32, 11, 34, 35]¹.
+Efficiencies measured vary among authors. This is probably due to the high reactivity of the material,
+and the importance of the deposition/synthesis conditions.
+• [32] report a quantum efficiency of 2 to 4% in the 5 to 10 keV energy range.
+• [13] report a quantum efficiency of 1 to 5% in the same range of energies.
+The ALICE collaboration made a systematic study of the effect of water and oxygen on the quantum
+efficiency of CsI [36]. [32] provides information on the effect of heating to resorb the loss of efficiency
+after exposure to moisture.
+Effects of electric field [12], Gas amplification with various mixtures [38, 39], polarization of X-rays
+[40], as well as various Monte Carlo dedicated codes [38, 5] were also studied. This shows the wide
+interest and hopes that this material created.
+Now, CsI is still considered as a reference, and a lot of projects are still based on the use of this
+material. Unfortunately, the sensitivity of CsI as a photocathode is still an issue, and few successes
+were recorded.
+Lastly, a sensitivity of CsI to radiation was recorded [8, 41]. This is of course an issue regarding the
+stability in time of a detector using CsI. Fortunately, this sensitivity seems to be limited in the X-ray
+energy range [41].
+The key feature of CsI is its negative electron affinity. This NEA is explained by the appearance
+of dipole charges at the surface of the material, leading to a bending of the band structure, and the
+presence of an attractive potential to electrons at the surface.
+Those dipoles are of course very attractive to all sorts of impurities, which easily form chemical
+bonds with the surface charges, so destroying the NEA of the surface.
+As a result, CsI photocathodes usually lose their high quantum efficiency after a few hours of
+exposure to moisture, and even much faster in an unclean environment.
+There were a lot of attempts to protect the CsI from degradation in unclean environment. Another
+approach was to try developing online cleaning processes (like [32] already cited). But none of these
+approaches were able to provide a solution acceptable in terms of robustness and efficiency.
+It remains that CsI offers an attractive efficiency, and in addition it is widely available (it was also
+successfully used as a scintillator material by addition of dopants like Tb or Na).
+3.3.5 Conclusions on available technologies of Photocathodes and the issues re-
+lated to their use
+A wide variety of photocathodes is available on the market. But most of them are suitable only for
+low energy applications (visible, ultra-violet and infrared applications).
+There are mainly two families of photocathodes suitable for the hard X-ray energy range:
+• Metallic photocathodes, mainly gold, which offers a poor efficiency but an excellent robustness
+¹ It should be noted that a number of those publications come from A.Breskin’s group from the Weizmann Institute
+of Science in Israel, which has been very active in developing this technology.
+3.3 Major technologies of photocathodes currently available 49
+| | Gold | CsI |
+| Efficiency | a few tenths of a percent [16, 17] | a few percent [32, 13] |
+| Sensitivity | none | to moisture, impurities in gas |
+Table 3.1 : Technologies of photocathode
+• CsI photocathodes, which offer the best efficiency, but a sensitivity to moisture and contami-
+nation leading to huge technological problems, especially in the case of gas-filled detectors.
+Recapitulation tabular (Table 3.1):
+Other classical photocathodes such as tetraminoethylene (TMAE), the organometallics ((C2H5)Cr,
+(C2H5)Fe...), are not suitable for X-rays for their stopping power is not good enough and so do not
+achieve a good efficiency (this is mainly due to their low Z).
+The same restrictions apply to GaAs and parents (InGaAs, InGaAsP) usually used after activation
+with Cs. In addition, those materials can be used only with gases of very high purities.
+TMAE was successfully used to increase the quantum efficiency of CsI and other photocathodes, but
+no good stability could be achieved.
+
+Bibliography
+[1] W.E.Spicer, “Photoemissive, photoconductive, and optical absorption studies of alkali-antimony
+compounds,” Phys. Rev., vol. 112, no. 1, pp. 114–122, 1958.
+[2] B.L.Henke et al., “Soft x-ray induced secondary-electron emission from semiconductors and
+insulators: Models and measurements,” Phys.Rev.B, vol. 19, pp. 3004–3021, 1979.
+[3] B.L.Henke et al., “0.1-10kev x-ray induced electron emissions from solids-models and secondary
+electron measurements,” J.Appl.Phys., vol. 48, pp. 1852–1866, 1977.
+[4] L.Malter, “Thin film field emission,” Phys.Rev., vol. 50, pp. 48–58, 1936.
+[5] A.Akkerman et al., “Monte carlo simulations of secondary electron emission from csi, induced
+by 1–10 kev x rays and electrons,” J.Appl.Phys., vol. 72(11), pp. 5429–5436, 1992.
+[6] A.Gibrekhterman et al., “Characteristics of secondary electron emission from csi induced by x
+rays with energies up to 100 kev,” J.Appl.Phys, vol. 74, pp. 7506–7509, 1993.
+[7] A.Gibrekhterman et al., “Spatial characteristics of electron- and photon- induced secondary
+electron cascades in csi,” J.Appl.Phys, vol. 76, pp. 1676–1680, 1994.
+[8] P.Miné, “Photoemissive materials and their application to gaseous detectors,” Nucl. Inst. and
+Meth. A, vol. 343, pp. 99–108, 1994.
+[9] J.Teichert et al., “Report on photocathodes,” tech. rep., CARE/JRA-PHIN, 2004.
+http://www.fzd.de/projects/CARE/index.files/reports/report.pdf.
+[10] W.C.Walker et al., “Photoelectric yield in the ultraviolet,” J.Appl.Phys., vol. 26(11), pp. 1366–
+1371, 1955.
+[11] W.F.Krolikowski et al., “Photoemission studies of the noble metals. ii. gold,” Phys.Rev.B,
+vol. 1(2), pp. 478–487, 1970.
+52 BIBLIOGRAPHY
+[12] R.H.Day et al., “Photoelectric quantum efficiencies and filter window absorption coefficients from
+20ev to 10kev,” J.Appl.Phys., vol. 52(11), pp. 6965–6973, 1981.
+[13] B.L.Henke et al., “The characterization of x-ray photocathodes in the 0.1-10kev photon energy
+range,” J.Appl.Phys., vol. 52(3), pp. 1509–1520, 1981.
+[14] G.W.Fraser et al., “The characterization of gold x-ray photocathodes,” Nucl. Inst. and Meth. A,
+vol. 321, pp. 376–380, 1992.
+[15] H.Henneken et al., “Absolute total yield of au(111) and cu(111) surfaces,” Journal of Electron
+Spectroscopy and Related Phenomena, vol. 101-103, pp. 1019–1024, 1999.
+[16] M.Hirata et al., “X-ray detection characterization of gold photocathodes and microchannel plates
+using synchrotron radiation (10ev-82.5 kev),” Nucl. Inst. and Meth. B, vol. B66, pp. 479–484,
+1991.
+[17] S.Gosavi et al., “Stability improvement at high emission densities for gold thin film photocathodes
+used in advanced electron beam lithography,” J. Vac Sci. Technol. B, vol. B19(6), pp. 2591–2597,
+2001.
+[18] M.J.Powers et al., “Observation of a negative electron affinity for boron nitride,” Appl.Phys.Lett,
+vol. 26, pp. 3912–3914, 1995.
+[19] G.A.Allen, “The performance of negative electron affinity photocathodes,” J. Phys. D, vol. 4,
+pp. 308–317, 1971.
+[20] S.H.Kong et al., “Photocathodes for free electron lasers,” Nucl. Inst. and Meth. A, vol. A358,
+pp. 272–275, 1995.
+[21] K.A.Elamrawi et al., “Preparation and operation of hydrogen cleaned gaas(100) negative electron
+affinity photocathodes,” J. Vac Sci. Technol. A, vol. A17(3), pp. 823–831, 1999.
+[22] F.S.Shahedipour et al., “Efficient gan photocathodes for low-level ultraviolet signal detection,”
+IEEE Journal of Quantum Electronics, vol. 38(4), pp. 333–335, 2002.
+[23] M.P.Ulmer et al., “Progress in the fabrication of gan photocathodes,” Proc. SPIE, vol. 4288,
+pp. 246–253, 2001.
+[24] P.Sandvik et al., “alxga1−xn for solar blind uv detectors,” J. Cryst. Grow., vol. 231, pp. 366–370,
+2001.
+[25] D.J.Leopold et al., “High quantum efficiency ultraviolet/blue algan/ingan photocathodes grown
+by molecular epitaxy,” J.Appl.Phys., vol. 98, pp. 043525–1,5, 2005.
+[26] E.A.Taft et al., “Photoelectric emission from the valence band of some alkali halides,” J. Phys.
+Chem. Solids, vol. 3, p. 1, 1957.
+BIBLIOGRAPHY 53
+[27] J.Edgecumbe et al., “Attenuation length for secondary electrons in bulk-density kcl and csi,”
+J.Appl.Phys., vol. 37, pp. 2916–2917, 1965.
+[28] J.Edgecumbe et al., “Csi as a high-gain secondary emission material,” J.Appl.Phys., vol. 37,
+pp. 3321–3322, 1966.
+[29] V.Dandendorf et al., “Progress in ultrafast csi-photocathode gaseous imaging photomultipliers,”
+Nucl. Inst. and Meth. A, vol. A308, pp. 519–532, 1991.
+[30] E.Shefer et al., “Photoelectron transport in csi and csbr coating films of alkali antimonide and
+csi photocathodes,” J.Appl.Phys., vol. 92(8), pp. 4758–4771, 1993.
+[31] A.Breskin et al., “New ideas in csi-based photon detectors: Wire multiplication and protection
+of the photocathode,” IEEE Trans.Nucl.Sci, vol. 42(4), pp. 298–305, 1995.
+[32] J.E.Lees et al., “Thermally annealed soft x-ray photocathodes,” Nucl. Inst. and Meth. A, vol. 381,
+pp. 453–461, 1996.
+[33] H.S.Cho et al., “A columnar cesium iodide (csi) drift plane layer for gas avalanche microdetec-
+tors,” IEEE transaction on Nuclear Science, vol. 45(3), pp. 275–279, 1998.
+[34] L.Periale et al., “Evaluation of planar gaseous detectors with csi photocathodes for the
+detection of primary scintillation light from noble gases,” conference paper Presented at
+the 1st Topical Symposium on Functional Breast Imaging with Advanced Detectors, 2001.
+http://arxiv.org/pdf/physics/0106070.
+[35] E.Schyns et al., “Status of large area csi photocathodes developments,” Nucl. Inst. and Meth.
+A, vol. 494, pp. 441–446, 2002.
+[36] A.Di.Mauro et al., “Study of the quantum efficiency of csi photo-cathodes exposed to oxygen
+and water vapour,” Nucl. Inst. and Meth. A, vol. 461, pp. 584–586, 2001.
+[37] A.Breskin et al., “Electric field effects on the quantum efficiency of csi photocathodes in gas
+media,” Nucl. Inst. and Meth. A, vol. 344, pp. 537–546, 1994.
+[38] T.H.V.T.Dias et al., “The transmission of photoelectrons emitted from csi into xe, ar, ne, and
+their mixtures: a monte carlo study of the dependence on e/n and incident vuv photon energy,”
+J.Appl.Phys., vol. 37, pp. 540–549, 2002.
+[39] R.Aleksan et al., “Measurement of csi photocathode quantum efficiency in methane,” Nucl. Inst.
+and Meth. A, vol. 343, pp. 173–191, 1994.
+[40] S.Hanany et al., “Measurement of the electron yield of csi with polarized x rays,” Phys.Rev.B,
+vol. 48(2), pp. 701–709, 1993.
+[41] A.S.Tremsin et al., “X-ray induced radiation damage in csi, gadox, y2o2s, and y2o3 thin films,”
+Nucl. Inst. and Meth. A, vol. 459, pp. 543–551, 2001.
+
+Chapter 4
+The Simulations by Monte Carlo Method
+This chapter presents the study by Monte Carlo of the photocathodes performed in this work.
+The chapter is divided into four parts :
+1. A general introduction to the Monte Carlo Method,
+2. a description of the Monte Carlo code developed in this work is given,
+3. a detailed analysis of the limits of Monte Carlo methods in the case of particle tracking into
+matter is given, and the reason why these limitations forbid the use of this method in the case
+of photocathode analysis
+4. Conclusions on this part of the work.
+4.1 A first approach to Monte Carlo
+4.1.1 History
+The Monte Carlo Method is called after the city of the Princi-
+pality of Monaco, because of the roulette (and similar games),
+seen as a random number generator. This name and the sys-
+tematic development of the Monte Carlo Method date from
+about 1944.
+Before, there had been several isolated instances of this method,
+some of them on much earlier occasions (see the examples given
+in B.1). Those methods were only rarely actually used for sci-
+entific purposes. A reason for this is the necessity to make a
+large number of repetitive operations to achieve ”a good pre-
+cision”. It was the arrival of computers that created a greater interest in this sort of simulation.
+Figure 4.1 : Monaco’s Casino
+56 The Simulations by Monte Carlo Method
+The principles of the Monte Carlo Method are due to the Polish mathematician Stanislaw Ulam,
+when he was working in Los Alamos for the Manhattan Project[1].
+Those developments were implied by the work on the atomic bomb, which needed a direct simula-
+tion of the probabilistic problems of neutron diffusion in fissile materials. But even at an early stage
+of the project, Stanislaw Ulam and John von Neumann refined the method to a more general theory[2].
+Finally, the systematic development of the method occurred only in 1948 with the work of Harris
+and Herman Kahn. From this moment, the method had a fast development, and already in 1948,
+Fermi, Metropolis, and Ulam obtained estimations for the eigenvalues of Schrödinger’s equation. The
+Method became intensively used in extremely various fields from 1970, thanks to the new generation
+of computers.
+4.1.2 Description of the Monte Carlo Method
+A possible definition: The Monte Carlo Method, as it is understood now, encompasses any tech-
+nique of statistical sampling employed to approximate solutions to quantitative problems.
+Said another way, the Monte Carlo Method gives an approximate solution to a problem using a sta-
+tistical approach. The method consists in performing statistical sampling experiments, and applying
+the central limit theorem1 to determine the general behavior of the studied system. It applies to
+problems with no probabilistic content, as well as to those with inherent probabilistic structure.
+The progress in terms of performance of modern computers has enabled the use of the Monte Carlo
+Method in an increasing number of problems, and it now has several fields of application: the most
+common problems treated via a Monte Carlo approach are:
+• Particle Transport through matter (detailed in 4.1.3),
+• Astrophysics models,
+• Molecular studies (”classical”, ”quantum”, ”path-integral”, ”volumetric”, molecular dynamic,
+etc...),
+• Evaluation of multi dimensional integrals (see example in annex B.1.1),
+• solving the integro-differential equations defining the radiance field.
+All those applications have led to new developments in various areas, for example the last application
+has been used in global illumination computations, which is a way to produce photo-realistic images.
+As a Result, Monte Carlo Methods have been usefully employed in industries as various as that of
+Graphics industry (in the case of ray tracing softwares, see the case of the Radiance software [3]),
+Finance [4], or Search And Rescue and Counter-Pollution, where models are used to predict the drift
+of a life raft or of an oil slick on the sea.
+1The Central Limit Theorem states that if the sum of independent random variables has a finite variance, then it
+will be approximately normally distributed.
+Said another way: given a population with a mean of µ and a standard deviation σ, the sampling distribution of the mean
+has a mean of µ and a standard deviation of $\sigma/\sqrt{N}$ (N being the sample size).
+4.2 The Geant4 toolkit for particle transport into matter 57
+4.1.3 The Monte Carlo Method in Particle Transport
+There are mainly two different approaches to study the transport of particles through matter:
+• The deterministic methods, in which the transport equation is solved.
+• The Monte Carlo approach, in which single particle transports are computed.
+It is said sometimes that, while the deterministic approach consists in solving the integral transport
+equation, the Monte Carlo approach consists in solving the integro-differential transport equation.
+This statement (which is incorrect, for the integral and integro-differential equations, are
+actually a single one put in two different forms) illustrates the difference between the two approaches:
+The deterministic methods return a general law of behavior of the particles, and a complete set of
+information (flux, penetration, etc...).
+In contrast, the Monte Carlo Method does not solve an explicit equation, but obtains the solution
+by simulating individual particle transports and interactions with matter and by recording all the
+information along the trajectories of the particle. Then the central limit theorem makes it possible to determine
+the general behavior of the particles by making a statistical analysis of the recorded information.
+The particle transport simulation consists in tracking the particles one by one, by evaluating at each
+step the probability of interaction with matter. The probability densities of interaction (calculated
+according to various parameters such as the particles energy, type, bias... and the material type,
+density...) are used in addition to a random number generator to determine the step length, and the
+interaction type, which will happen. Thus, the particle behavior is not deterministic but governed by
+probabilistic laws, following the quantum nature of fundamental interactions.
+The interaction laws used in the simulation are obtained from the quantum mechanics theory (for
+their analytical form), and from experimental measurements (the cross sections, which describe ”the
+probability of interaction”).
+The major problem of the Monte Carlo Methods for particle tracking is the need of computer power
+to achieve simulations with an acceptable precision (i.e. enough particles tracked to achieve a good
+statistics). Only modern powerful computers are able to perform the simulations in an acceptable
+time (a few hours).
+4.2 The Geant4 toolkit for particle transport into matter
+The development of a Monte Carlo code is a very ambitious project, especially if it is meant to study
+many materials. So it was preferred to use a general toolkit with proven capacities at low energies.
+Several codes were considered (Penelope, MCNPX, EGSnrc, Geant4). Geant4 was chosen because
+of various reasons, including:
+• It has become a standard among Monte Carlo codes.
+• It is well documented and open source, thus it gives straighter access to code and physics
+verification.
+58 The Simulations by Monte Carlo Method
+• It is provided with numerous tools, which simplify data analysis.
+• It has a series of libraries dedicated to low energies.
+Among the disadvantages of Geant4 when compared to other codes:
+• It is harder to program, as the user has to make the program himself (no script language to
+command Geant4). It is written in C++. So the user needs basic notions of object-oriented
+programming.
+• Complex setup of the program (compilation, configuration settings...)
+Those difficulties are also the strength of Geant4, for they find their origin in the very high versatility
+of the toolkit, and in its cross-platform nature.
+Geant -for GEometry ANd Tracking- is a simulation toolkit developed for the tracking of particles
+through matter. It has been developed by more than 100 scientists from 10 institutions and has now
+become a worldwide reference.
+The first version was developed at CERN and dates from 1974. Up to version 3.21, Geant was made
+in Fortran, and was mainly dedicated to high energy physics. From 1994, a new version completely
+written in C++ and with modern object oriented structure was developed.
+The toolkit includes facilities for handling complex geometries, tracking particles, simulating detector
+response, handling run management and the user interface.
+Its possibilities were also expanded, and Geant4 is now routinely used in fields as various as:
+• High energy and nuclear physics,
+• Medical applications,
+• Space industry development,
+• Accelerator physics,
+• Lower energy physics ...
+The reference article for Geant42 was published in Nuclear Instrument and Methods in Physics Re-
+search A: [5].
+4.2.1 The way Geant4 computes particle propagation
+4.2.1.1 The tracking of the particles
+The core of the method consists in tracking the particles one by one, letting them undergo all possible
+physical interactions with matter3. It takes into account:
+• the particle intrinsic properties, its direction, energy...
+2The reference webpage of Geant is currently : http://cern.ch/geant4/
+3Geant uses a combination of the composition and rejection Monte Carlo Method . The exact description of those
+two methods will not be done here, but those who have interest can have a look at the book from H.Messel et al. [6],
+at the article from J.C.Butcher et al. [7], and at the EGS4 Code System Manual [8].
+4.2 The Geant4 toolkit for particle transport into matter 59
+• all physical processes applicable to the current particle (ex. for a photon the photoelectric
+effect, for an electron the bremsstrahlung ...).
+• the volume boundaries, the material characteristics (geometrical information),
+• the electromagnetic fields.
+One usually makes the difference between the primary particles, which are generated by the program-
+mer with defined type, momentum, position, etc... and the secondary particles, which are generated
+by previous interactions of other particles with the matter or their disintegration (unstable particles).
+Of course the secondaries can generate other secondaries. In Geant4 any created particle is tracked
+until it has a zero energy (absorption).
+In Geant4, the basic element of the tracking is the Step. It consists of two points (start and end
+point) and the ”delta” information of the particle:
+• step length,
+• energy loss during step,
+• change in elapsed time,
+• change of direction, etc.
+A step can be summarized the following way (see table 4.2):
+→ The particle velocity is calculated,
+→ A step length is associated to each physical process:
+The probability of interaction weighed by a random number is computed, and converted into
+a distance.
+The minimum of all computed distances (ie. the limiting physical process) defines the physical
+step length.
+→ The navigator finds ”safety”: the distance to nearest boundary in the direction of the particle.
+→ the minimum of physical step length and safety is kept as the step length
+→ If the physics process has limited the step, the interaction is done (interaction before the
+boundary of the volume). Otherwise the particle is transported to the next volume.
+→ If the particle was not killed during the track, it is ready for the next step. Eventually,
+secondary particles are stored for later tracking.
+Before the following step is performed, Along step physical processes are applied (for example
+scattering).
+→ Last, the track properties are updated (momentum, position, time, etc...).
+60 The Simulations by Monte Carlo Method
+Figure 4.2 : Tracking procedure of particles in Geant4
+At the end of the tracking process of one particle, one can optionally store the trajectory, which is
+the compilation of the steps that happened when tracking the particle.
+To have a better description of the tracking processes4, the interested reader should refer to chapter
+5.1 of the Geant4 Users Guide [9]. Alternatively, the reference publication of Geant4 published by
+the Geant4 community in Nuclear Instrument and Methods in Physics Research A: [5] gives a rapid
+overview of the way particles are tracked.
+4Especially to have a proper description of the way discrete and continuous processes are taken into account, and
+the way boundaries are treated.
+4.2 The Geant4 toolkit for particle transport into matter 61
+4.2.1.2 The physical interactions in Geant4
+The sets of physical processes
+Geant4 offers two sets of processes describing particle interactions with matter:
+• The historical one, dedicated to the high energy physics.
+• The low energy extension of electromagnetic process, which has been developed since 1997,
+intends to extend the validity of Geant4 down to low energy. It can now simulate physical
+process down to 250 eV (and up to 100 GeV) with atomic numbers between 1 and 99.
+This extension is described both in the User Guide [9] and in the Physics Reference Manual
+[10] 5
+In addition, Geant4 also enables the user to use the set of processes from the Penelope Monte Carlo
+toolkit [11]. This way the users are offered two flavors of Low Energy physical processes, and rapid
+comparison can be obtained.
+Cross Sections
+The physical processes involved in particle transport through matter have a quantum nature, meaning
+that they do not follow a deterministic behavior.
+On the other hand, their behavior is very well described by a probabilistic approach: the probability
+of interaction of a particle with a material is fixed. It is measured by the cross section σ and expressed
+in units of area (usually in barn ≡ $10^{-28}\,\mathrm{m}^2$). The cross section can be understood as the apparent
+surface as seen from an incoming particle of an atom. In the case of a thin foil, the probability of
+interaction of the incoming particle is n σ/S with S the surface of the foil and n the number of atoms
+contained in the foil.
+In practice σ varies greatly with the nature of the particle, and its energy.
+The various sorts of interactions of the particle with matter have corresponding cross sections.
+The differential cross section $d\sigma/d\Omega$ describes the probability to observe a scattered particle per unit of
+solid angle Ω.
+Cross sections used in Geant4 result from measurements as often as possible. When those data are
+unavailable, then only an analytic formula is used to build the cross section data. Since the data are
+provided as series of discrete values, an interpolation formula is used to have access to any value of
+the energy:
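+$$\log(\sigma(E)) = \frac{\log(\sigma_1)\,\log(E_2/E) - \log(\sigma_2)\,\log(E_1/E)}{\log(E_2/E_1)} \qquad (4.1)$$
+where $E_1$ and $E_2$ are the tabulated energies immediately below and above $E$, and $\sigma_1$, $\sigma_2$ are the corresponding cross sections.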
+The set of data used in Geant4 for the determination of the cross sections and for sampling of the
+final states are extracted from a set of publicly distributed evaluated data libraries (for the low energy
+extension):
+5The low energy extension has its website here http://www.ge.infn.it/geant4/lowE/index.html
+62 The Simulations by Monte Carlo Method
+• EPDL97 (Evaluated Photon Data Library) : [12]
+• EEDL (Evaluated Electron Data Libraries) : [13]
+• EADL (Evaluated Atomic Data Libraries) : [14]
+• stopping power data : [15, 16, 17, 18]
+Those sets of data are well described in their reference manual which can be obtained from Lawrence
+Livermore National Laboratory’s website6.
+4.2.1.3 Analysis and Representation tools
+The Geant4 toolkit offers numerous interfaces to access all physical parameters while the simulation
+is running. It has also dedicated libraries for trajectories and other data storing. So the user can
+record the information of interest for later analysis.
+But Geant4 is also AIDA compliant, meaning it has access to all the functionalities AIDA offers for
+online data analysis and histogramming/ntupling.
+AIDA is a set of abstract interfaces and formats for data representation. There are various imple-
+mentations of AIDA, offering all sorts of tools for data analysis (filtering, combination, etc...), and
+representation (histograms, ntuples/data trees...).
+Since Geant4 possesses a direct interface with AIDA compliant tools, it is possible to make the analysis
+of the simulations performed online and to store the results of those simulations. This is of particular
+importance, as Monte Carlo simulations produce enormous amounts of data, which can be very long
+to analyze.
+Of course the data recorded can be further studied and exported thanks to dedicated softwares, which
+are also AIDA compliant.
+In addition, Geant4 possesses interfaces for 3D representation of the geometry and particles trajec-
+tories in the volume. This is of strong help for complex geometries definitions.
+4.2.2 The simulation tool developed
+4.2.2.1 Description and Functionalities
+The code developed was expected to
+• help understanding the physics of the photocathodes in the X-ray energy range,
+• compare various geometries of photocathodes,
+• help predicting the efficiencies of unstudied materials.
+Since the description of the physical processes is rather straightforward in the Geant4 toolkit, the
+hardest part was the implementation of the tools to perform detailed analysis of the simulations.
+The following libraries of Geant4 or common associated tools were chosen for the implementation:
+6http://www.llnl.gov/cullen1/photon.htm
+4.2 The Geant4 toolkit for particle transport into matter 63
+Concerning the Physics
+The Low Energy Extension was used to perform all the simulations.
+All processes involving photons were activated except the pair creation, which makes no sense for sim-
+ulations of photons having energies lower than 100 keV.
+So the following processes were activated:
+• The Photoelectric effect (G4LowEnergyPhotoElectric library).
+Both Fluorescence and Auger de-excitations of photoionized atoms were activated.
+By default, the photoemitted electron has the same direction as the incident photon. Instead,
+the use of the standard electron angular emission generator was forced. Unfortunately, this an-
+gular distribution corresponds only to electrons emitted from the K-shell. Since most interactions
+of X-rays in the targeted energy range occur with electrons from the K-shell, this limitation is
+not a real problem.
+• The Compton Scattering process (G4LowEnergyCompton Library).
+• The Rayleigh Scattering process (G4LowEnergyRayleigh).
+Concerning electrons, all the processes were also activated:
+• Electron Ionization (Library G4LowEnergyIonisation).
+Here again Auger and Fluorescence de-excitations of the ionized atom were activated.
+• The Bremsstrahlung continuous loss of energy of electrons (Library G4LowEnergyBremsstrahlung).
+• Electron scattering, which corrects path lengths and lateral displacements after each step for
+charged particles (Library G4MultipleScattering). Identically Auger as well as Fluorescent
+de-excitations were activated, for accurate simulations.
+Cut Lengths (corresponding in Geant4 to energies under which no secondary particles are created),
+were always set to their minimum values (≡ 250 eV).
+Concerning the data analysis tools
+To calculate the overall efficiency of the photocathode (calculated as $Q_{\mathrm{eff}} = \frac{N_{\text{emitted } e^-}}{N_{\text{incoming photons}}}$), a
+direct implementation was used. A csv (comma separated value file format) file was appended after
+each simulation with the Quantum Efficiency, and the photocathode parameters (Material, geometrical
+information...).
+All other information extracted from the simulations were recorded thanks to the AIDA interface.
+A global Tupple Manager was created and linked to the various manager of the code (RunManager,
+EventActionManager...), in order to enable information to be grabbed in the proper instances of the
+code7.
+More than 20 histograms, 2D clouds... were created to enable a proper track of the simulations.
+7For example, Information regarding physical processes in the StepManager,
+Information regarding the deposition of the photons/electrons in the EventActionManager...
+64 The Simulations by Monte Carlo Method
+4.2.2.2 The test of the code, comparison with experimental values
+Various tests were made to confront the code with experimental data. Unfortunately, it turned out
+that the code is not able to simulate properly the photocathodes.
+In this part, success and failures of the code are exposed, and an explanation is given to those limi-
+tations.
+The aim of the simulations
+Various authors were able historically to create codes based on the Monte Carlo Method calculating
+successfully the efficiencies of photocathodes (especially for CsI, [19, 20] already cited in section 3.2).
+So it was natural to try to develop a code based on the latest technologies to help studying new
+materials for photocathode applications.
+The code was expected to provide reasonable predictions of the efficiency of one material, the influence
+of the geometry, and the influence of an electric field.
+It was planned to use it to study novel sorts of photocathodes, with materials and geometries untested
+so far.
+In none of those expectations, an exact value was considered as mandatory, but an error of less
+than 10 % can be considered as a minimum requirement to be able to use the code for predictions
+on the efficiency of new materials.
+Unfortunately, it turned out rapidly that this precision could not be reached with the code developed:
+the calculated values were always largely underestimated and with an error for some materials of more
+than one order of magnitude !
+It is likely that this error can be bettered by a refinement of the code for each material studied. But
+this process is long and uncertain, and it involves several experimental tests to adjust the physical
+model used for each material.
+This study was beyond the scope of this work, which aims at testing several materials.
+Examples of results returned by the code and discussion
+Gold and CsI were taken as reference materials to test the code. As both materials were intensively
+studied, it was easy to find reliable measurements of their absolute efficiencies.
+For Gold, the measurements made by B. L. Henke et al. at the BESSY-I and II light sources [21]
+were taken as a reference (Figure 4.4), and for CsI, the measurements by G.W.Fraser were taken (Figure
+4.3).
+In the simulation, the photocathode thickness is 1 µm, and the efficiency is calculated from the
+electrons escaping the photocathode on the side of the incident photons (following the corresponding
+measurements in the cited publications).
+4.2 The Geant4 toolkit for particle transport into matter 65
+Figure 4.3 : Quantum Efficiency of CsI as computed by the code, and measured
+Figure 4.4 : Quantum Efficiency of Gold as computed by the code, and measured
+66 The Simulations by Monte Carlo Method
+4.2.2.3 The limits of the Monte Carlo Method
+A deep investigation of the code and of the Monte Carlo Method was performed to understand why
+the simulations were providing such bad results.
+First the Geant4 toolkit was compared with another well known code: Penelope, developed mainly
+at the University of Barcelona (PENetration and Energy Loss Of Electrons and Positrons in matter,
+[22, 23]). This toolkit did not give better results. The same toolkit was also tested through its
+implementation into Geant4.
+After some investigation it became clear that several problems could explain why the code would
+return wrong results:
+• A problem of Approach: The Monte Carlo Method is based on a particle/nucleus interaction
+approach. The models do not include, a priori, differences between the various chemical states
+and physical structures, which coexist in one material (chemical bonding, crystalline structure,
+grain boundaries, etc...). Yet those states can have a large impact on the dynamics of electrons in the
+material, for any defect in the crystallinity of the material corresponds to a trap. In particular,
+semiconductors and metals are treated mainly the same way.
+In the case of X-rays and energetic electrons, this approximation can be considered as not too
+rough, for at high energies most interactions occur with electrons of the core shells of the atoms.
+Those inner shells being practically unperturbed, the corresponding cross sections do not vary
+appreciably.
+But when it comes to lower energy electrons, most interactions occur with the outer shell
+electrons or with free electrons, so the result becomes largely affected by the precise form of
+the material (chemical state, bonding to neighboring atoms, etc...), as well as by its purity and
+its structure (change of band structure, traps, etc...). This is the main limiting factor for
+simulations at low energies[24] .
+Unfortunately, concerning photocathodes, the key phenomena occur at this energy, for most escap-
+ing electrons have an energy of only a few eV.
+In addition, a number of other difficulties appear at small energy:
+• The quality of experimental data at low energies. Experimental cross sections at low
+energies are extremely hard to obtain with a good precision. Actually, only some indirect data
+can be used, like the stopping power for electrons through a thin slab, characteristic energy losses
+(plasmon excitations), and the total mean free path for inelastic scattering.
+On the other hand it is not possible to theoretically determine the values of the cross sections,
+as this implies solving the many-body interaction problem in solids.
+In practice, while cross sections are provided down to very low energies, their precision is
+considered as extremely poor.
+• The infrared divergence. As explained previously, at low energies, particles tend to create
+large numbers of secondaries, which in turn create an even greater number of daughter particles.
+4.3 The simulation performed 67
+To avoid this, the Monte Carlo codes block the creation of secondary particles under a certain
+cut off energy. This is extremely bad for the simulation of photocathodes, as it turns out that
+secondary electrons are the main contributors to the total yield (from 80 % for materials like
+gold to more than 99.5 % in the case of CsI[21]).
+• The specific problem of electron extraction from the material. As emphasized by the
+Spicer model, the extraction of the hot electrons from the surface is a key problem, for the
+electrons have to overcome a potential barrier to reach vacuum. Those potentials are of the
+order of a few eV high, so they are far too small to be properly simulated by Monte Carlo codes.
+Moreover, according to B.L.Henke et al.[21], most secondary electrons have an energy lower
+than 10 eV. The interested reader can also read the publication by A.Gibrekhterman et al., which
+details the proportions of primary to secondary electrons contributing to the emitted current
+in [19] in the case of CsI. Also B.L.Henke et al.[25] detail how the conditions of cleanness of the
+surface can have a major impact on the emission efficiency.
+So the major difficulties arise from the strong dependence of the photocathode quantum efficiency on
+physical effects, which occur at energies unreachable by conventional general purpose Monte Carlo
+codes.
+The few codes that succeeded in overcoming this difficulty are based on analytical formulae with free
+parameters such as the probability of loss of an energy $\hbar\omega$ per unit energy, momentum, and path.
+This method makes it possible to obtain codes in very good agreement with experimental data, but they are
+material specific and cannot be extended to other materials in general (see the very interesting work
+by T. Boutboul et al.[20] in the specific case of CsI).
+In conclusion, while the transport of the X-rays is well simulated by the Monte Carlo codes, the simulation
+of the dynamics of very low energy electrons in solid state materials is far from being refined enough to enable
+a proper simulation of the photocathodes.
+4.3 The simulation performed
+Despite the poor performance of the code in reproducing quantitatively the efficiency of the pho-
+tocathodes, simulations were performed to study the possibility of a qualitative description of the
+enhancement of the efficiency by varying the geometrical structure of the photocathode.
+The result of those simulations is presented in this section.
+4.3.1 The simulations performed
+The simulation of flat photocathodes was performed to check the validity of the code. The results were
+presented in the section 4.2.2.2. They serve as the basis to compare with the efficiency of structured
+photocathodes.
+Different types of structures were simulated:
+• Structures with ”pillars”
+68 The Simulations by Monte Carlo Method
+• Structures with ”pyramids”
+• Chevron like structures
+• Structures randomly or periodically placed...
+Those studies made it possible to optimize the thickness of the photocathodes as a function of the energy of
+the incoming photons. Indeed, the most energetic electrons are those which exit the photocathode
+from the deepest places, and they are also those which are correctly simulated by the code, for their
+energy is high.
+For example Figure 4.5 shows the position of photoemission of the electrons, which reached the vac-
+uum in the simulation for two different energies. It clearly appears that, from the point of view of the
+escape length of the electrons, a photocathode of thickness 0.5 µm is too thick for low energies (here
+10 keV) but well adapted for higher energies (50 keV). Both the pillar structures and the underlying
+layer are made of the photoemissive material (gold).
+Figure 4.6 shows the simulation of a pyramidal structure with only the outer layer being photoemis-
+sive. This corresponds to the case of structures, which are covered with the photoemissive material
+(gold). The underlying structure would be made of a low absorbing material (like Kapton), which is
+not simulated.
+4.3 The simulation performed 69
+Figure 4.5 : Simulation of Pillars structures on a photocathode of sizes 0.8 µm height and 0.4 × 0.4 µm²
+size. Each dot corresponds to the creation of one electron, which exited the bulk. Top Picture corresponds to
+a photon energy of 10 keV, and Bottom picture to photon energy 50 keV.
+70 The Simulations by Monte Carlo Method
+Position of escaping electrons (transmited and reflected) X vs Z (in mum)
+0,0020
+0,0019
+0,0018
+0,0017
+0,0016
+0,0015
+0,0014
+0,0013
+0,0012
+0,0011
+0,0010
+0,0009
+0,0008
+0,0007
+0,0006
+0,0005
+0,0004
+0,0003
+0,0002
+0,0001
+0,0000
+-0,0001
+-0,0002
+-0,0003
+-0,0004
+-0,0005
+-0,0006
+-0,0007
+-0,0008
+-0,0009
+-0,0010
+-0,0011
+-0,0012
+-0,0013
+-0,0014
+-0,0015
+-0,0016
+-0,0017
+-0,0018
+-0,0019
+-0,0020
+-0,00020 -0,00015 -0,00010 -0,00005 0,00000 0,00005 0,00010 0,00015 0,00020 0,00025 0,00030 0,00035 0,00040 0,00045 0,00050
+Position of escaping electrons (transmited and reflected) X vs Z (in mum)
+  Entries : 11293 
+0,0021   XMean : 1.3861E-4 
+0,0020   XRms : 1.4593E-4 
+0,0019   YMean : 1.3237E-4 
+  YRms : 5.7028E-3 
+0,0018
+0,0017
+0,0016
+0,0015
+0,0014
+0,0013
+0,0012
+0,0011
+0,0010
+0,0009
+0,0008
+0,0007
+0,0006
+0,0005
+0,0004
+0,0003
+0,0002
+0,0001
+0,0000
+-0,0001
+-0,0002
+-0,0003
+-0,0004
+-0,0005
+-0,0006
+-0,0007
+-0,0008
+-0,0009
+-0,0010
+-0,0011
+-0,0012
+-0,0013
+-0,0014
+-0,0015
+-0,0016
+-0,0017
+-0,0018
+-0,0019
+-0,0020
+-0,00020 -0,00015 -0,00010 -0,00005 0,00000 0,00005 0,00010 0,00015 0,00020 0,00025 0,00030 0,00035 0,00040 0,00045 0,00050
+Figure 4.6 : Simulation of periodically placed pyramidal structures with a photon energy of 5 keV. The top
+picture is a photocathode of thickness 0.1 µm and height 3 µm. The bottom picture is a photocathode with the
+same parameters except the thickness: 2.5 µm.
+4.3.2 Use of the simulations for thickness optimization
+The simulations performed made it possible to confirm that the photoemitted electrons have a very short mean
+free path in the photocathode. No quantitative differences in terms of efficiency could be extracted
+for the different thicknesses. Only a qualitative analysis thanks to diagrams like on figures 4.5 or 4.6
+4.4 Conclusion on this part of the work 71
+enabled to define optimized thickness.
+According to this analysis, for energies in the order of a few keV (as the main target of energy range
+in this application), thicknesses of the order of a fraction of a micron seem to be the most suitable, for
+all tested materials. Larger thicknesses indeed result in a dead zone in the middle of the photocathode,
+and imply larger structures, which corresponds to a smaller surface of the photocathode, and so to a
+lower efficiency.
+This result was predictable from the known mean free paths of electrons in photoemissive materials.
+4.3.3 Simulation of the impact of structures on the photocathode
+Even if the code cannot simulate properly the quantum efficiencies of photocathodes for X-ray de-
+tectors, it is a priori not out of hope that it can help to evaluate the effect of structures on the
+photocathodes.
+To test the validity of the code for this, after the first experimental test of structures had been done,
+the simulations were compared to the experimental results.
+The measurements to perform this verification are detailed in section 7.1.2. The sample Trizact 143
+is constituted of periodic square pyramids of sizes 500 µm length and height ∼ 160 µm (see Figure
+7.4 and 7.5). The faces form an angle of 57° with respect to the base plane. The sample was
+covered with a gold layer of thickness 0.3 µm.
+The measurements indicate an increase of quantum efficiency of a factor ∼ 1.9 in good agreement with
+the theoretical value of $1/\cos(57^\circ) = 1.9$ (see section 6.2.1).
+The simulation by Monte Carlo of the flat surface calculated a quantum efficiency of 0.088 % (cf
+Figure 4.4) for an energy of 5 keV.
+With the geometry of the trizact sample, the code returns a quantum efficiency of 0.12 %. This
+corresponds to a gain of a factor: ∼ 1.4.
+So here again, the code fails to predict correctly the increase of quantum efficiency due to the struc-
+tures on the surface.
+4.4 Conclusion on this part of the work
+Use of the code for photocathode simulations
+Unfortunately, the application developed cannot be used to predict theoretically the quantum effi-
+ciencies of novel photocathodes.
+The limits of the Monte Carlo Method for Photocathodes Simulations.
+The impossibility to simulate properly the photocathodes properties, lies in the poor simulation of
+the particles interactions with matter. This is due to the incomplete cross section knowledge
+for very low energy particle-matter interaction.
+72 The Simulations by Monte Carlo Method
+More precisely, in the case of the photocathode simulations, the electrons behavior could not be
+simulated with a sufficient precision (while the simulation of the photons interaction were precise
+enough).
+So, in order to use a monte carlo approach to simulate X-ray photocathodes, one must first determine
+precisely cross sections at energies down to a few eV.
+To obtain those cross sections at such energies, it is not possible to study each material and combine
+the obtained cross sections to simulate mixtures of them like it is usually done at high energy for
+such an approach cannot take into account the chemical state of the atoms.
+So each material has to be studied one by one.
+Is it possible to use Monte Carlo codes for photocathode simulations?
+It is possible to overcome the lack of knowledge of the cross sections at low energies by introducing
+free parameters, which are then fitted on experimental data. This approach was successfully used to
+study CsI [20] and enabled a much better understanding of the material.
+Of course this sort of method is material specific and cannot be used for general purpose photocath-
+odes simulations (to study a great number of photocathode material).
+This sort of analysis being out of the scope of this thesis work, the code was not further used, except
+for trivial thickness optimization analysis.
+It should also be noted that the developed application would likely have been more successful in
+simulating the photocathode properties used with more energetic photons.
+As with increasing photon energies, the fraction of energetic electrons contributing to the yield in-
+creases [21], the code is more capable of simulating the photocathodes properties.
+The lack of experimental data at higher energies did not permit to test further the code, and here
+again it was not in the scope of this thesis work to investigate further the limits of the code.
+So it is not hopeless to use a Monte Carlo code to simulate the efficiency of photocathodes in the
+case of photocathodes used with more energetic photons.
+In particular, Geant4 offers all the needed flexibility to implement cross sections with better precision,
+and to adapt the Monte Carlo method to the specific case of very low energies particles.
+The only limitation would be the power of the computer, as the number of secondary particles would
+increase dramatically (infrared divergence).
+Possible other methods for the simulations of photocathode simulations
+with low energy photons.
+Other methods to simulate photocathodes properties are analytical methods like the three step model
+introduced by Spicer (see section 3.1) or more simply an evaluation of the efficiency by considering
+the product Eµ(E) (with E the energy, and µ the photoionization cross sections).
+Those methods do not provide quantitative evaluations of photocathodes quantum efficiencies yet.
+4.4 Conclusion on this part of the work 73
+It remains that this part of the work was of great help to understand the various processes and
+parameters, which are key for the quantum efficiency of photocathodes in the hard X-ray energy
+range. This has proven to be of great help for the following research of new materials for photocathode
+applications.
+
+Bibliography
+[1] S. U. et al., “Statistical methods in neutron diffusion,” LAMS-551, Los Alamos National Labo-
+ratory, 1947.
+[2] S. U. et al., “The monte carlo method,” Journal of American Statistical Association, vol. 44,
+p. 335, 1949.
+[3] G.Ward et al., “The holodeck ray cache: An interactive rendering system for global illumination
+in nondiffuse environments,” ACM Transactions on Graphics, vol. 18(4), pp. 361–98, 1999.
+[4] P.Jaeckel, Monte Carlo Methods in Finance. John Wiley and Sons, 2002.
+[5] Agostinelli et al., “Geant4-a simulation toolkit,” Nucl. Inst. and Meth. A, no. 506, pp. 250–303,
+2003.
+[6] H.Messel et al., Electron-Photon shower distribution. Pergamon Press, 1970.
+[7] J.C.Butcher et al., “Electron number distribution in electron-photon showers in air and aluminum
+absorbers,” Nucl. Phys., no. 20, 1960.
+[8] R.Ford et al., “The egs4 code system,” Tech. Rep. 265, Slac, Stanford, 1985.
+[9] Geant4 Community, Geant4 User Guide-for application developers.
+[10] Geant4 Community, Physics Reference Manual.
+[11] F.Salvat et al., “A code system for monte carlo simulation of electron and pho-
+ton transport,” Workshop Proceedings, Barcelona, Spain, 4-7 July 2006: OCDE NEA,
+p. http://www.nea.fr/html/dbprog/peneloperef.html, 2006.
+[12] D.Cullen et al., “Epdl97: the evaluated photon data library, 97 version.”
+[13] S.T.Perkins et al., “Tables and graphs of electron-interaction cross-sections from 10 ev to 100
+gev derived from the llnl evaluated electron data library (eedl), z=1-100.”
+76 BIBLIOGRAPHY
+[14] S.T.Perkins et al., “Tables and graphs of atomic subshell and relaxation data derived from the
+llnl evaluated atomic data library (eadl), z=1-100.”
+[15] H.H.Andersen et al., The stopping and ranges of ions in Matter, vol. 3. Pergamon Press, 1977.
+[16] J.F.Ziegler et al., The stopping and ranges of ions in Matter, vol. 4. Pergamon Press, 1977.
+[17] H.H.Andersen et al., The stopping and ranges of ions in Solid, vol. 1. Pergamon Press, 1985.
+[18] A.Allisly et al., “Stopping powers and ranges for protons and alpha particles,” tech. rep., ICRU,
+1993.
+[19] A.Gibrekhterman et al., “Characteristics of secondary electron emission from csi induced by x
+rays with energies up to 100 kev,” J.Appl.Phys, vol. 74, pp. 7506–7509, 1993.
+[20] T.Boutboul et al., “An improved model for ultraviolet- and x-ray- induced electron emission
+from csi,” J.Appl.Phys, vol. 86, pp. 5841–5849, 1999.
+[21] B.L.Henke et al., “The characterization of x-ray photocathodes in the 0.1-10kev photon energy
+range,” J.Appl.Phys., vol. 52(3), pp. 1509–1520, 1981.
+[22] J.Barba et al., “Penelope: An algorithm for monte carlo simulation of the penetration and energy
+loss of electrons and positrons in matter,” Nucl. Inst. and Meth. B, vol. 100, pp. 31–46, 1995.
+[23] F.Salvat et al., “Penelope, a code system for monte carlo simulation of electron and photon
+transport,” in Proceedings of a Workshop/Training Course, OECD/NEA 5-7 November 2001,
+vol. 19, 2001. ISBN:92-64-18475-9.
+[24] J.M.Fernández-Varea, “Private communication during hands on session of the workshop on use
+of monte carlo techniques for design and analysis,” 09 2006.
+[25] B.L.Henke et al., “0.1-10kev x-ray induced electron emissions from solids-models and secondary
+electron measurements,” J.Appl.Phys., vol. 48, pp. 1852–1866, 1977.
+Chapter 5
+Experimental Setup and Sample Preparation
+5.1 Design of the measurement setup
+5.1.1 A few general considerations
+The measurement of the quantum efficiency of a photocathode is not a trivial task. The actual effi-
+ciency varies greatly with the experimental conditions, and with the material quality and the shape
+of the photocathode material.
+The main factor is the cleanness of the photocathode surface, as it has a strong impact on the work
+function of the material, which is the main parameter determining the quantum efficiency.
+To reach the maximum quantum efficiency of one material, one has to deposit it in an ultra clean
+environment (ultra-high vacuum), and to perform the measurement in situ without any vacuum break.
+Yet, in this work a perfect environment was not targeted as this does not enable to test the photo-
+cathode in real conditions (gas-filled detectors). Indeed maintenance operations often require to open
+the detector.
+The preparation and mounting conditions of the samples are those typical for the preparation of
+gas-filled detectors (clean room environment, special care in cleaning...).
+The main requirements for the photocathode quantum efficiency measurement setup are:
+• Adaptability to all available sources (synchrotron, but also X-ray tube and radioactive sources).
+This implies the ability to work with very small X-rays flux.
+• The possibility to work with samples of various sizes and shapes.
+This requires a system to keep a constant distance between the photocathode and the polarizing
+grid.
+• The possibility to use the system both in reflection and transmission modes (electrons collected
+on the side of incident X-rays or on the opposite side).
+78 Experimental Setup and Sample Preparation
+Parameters Value
+Electrons acceleration 20 kV
+Current Intensity 20 mA
+Slits 1 aperture 7 mm
+Slits 2 aperture 7 mm
+Filter Ø
+Table 5.1 : X-ray tube source parameters
+The main difficulty arises from the necessity to work with very low currents. Indeed, a $^{55}$Fe ra-
+dioactive source of activity 30 µCi, encapsulated in the protection case typically offers a flux of
+$\sim 10^6$ photons/s/4π (an avalanche photodiode measurement gives $4 \cdot 10^6$ counts/s). If the photocath-
+ode has a quantum efficiency of 1% at the K$_\alpha$ line of $^{55}$Mn (5.9 keV), then the expected current is of
+$10^6 \times 0.01 \times 1.6 \times 10^{-19}\,\mathrm{A} \approx 10^{-15}\,\mathrm{A} = 1\,\mathrm{fA}$.
+So the setup must be able to measure currents of less than a femtoampere.
+The source used to perform the measurement was mainly an X-ray tube, mounted with a copper
+anode. Apart from measurements made for calibration purposes, the tube was used with the param-
+eters indicated in table 5.1.
+The setup was also tested on the ID15c ESRF synchrotron radiation beamline, which has a fixed
+energy of 39.5 keV. Since the signal-to-noise ratio was not actually better than the one obtained with
+the X-ray tube (flux $\sim 10^{10}$ photons/s, but at the same time much lower quantum efficiencies of the
+photocathodes), the beamline was not often used.
+5.1.2 The chamber and the ammeter
+5.1.2.1 The Photocathode holder, the electrical shielding
+The electrical scheme used to perform the measurements is given in figure 5.1.
+It was chosen to bias the photocathode at a negative potential and to place the collection grid at
+ground potential, rather than polarizing the collection grid. This presents several advantages:
+• a smaller sensitivity to the geometrical parameters,
+• no contribution to the measured current of electrons photoemitted by surrounding materials at
+ground potential,
+• a better use of the ammeter, which has a dedicated mode for such mounting (see later for a
+description of the ammeter).
+Indeed, some earlier tests with the grid being polarized showed higher leakage currents (typically
+several fA), any other parameters being identical.
+5.1 Design of the measurement setup 79
+Figure 5.1 : Schematics of the experimental setup used to make the measurements
+The holder is mainly made of PEEK, a UHV compatible, hard plastic. It also shows a high electrical
+resistivity (around $10^{14}$ Ωm at room temperature). To reduce as much as possible the surface con-
+ductivity, a cleaning with ethanol (and, if necessary, acetone to remove traces of glue due to the copper
+tape -see next) was systematically performed.
+Figure 5.2 : The photocathode peek support
+The circuit is fully shielded with guard rings. A copper tape was used to adapt the shielding to each
+photocathode. Special care was taken to hide the copper from the X-Rays (to avoid contribution
+from the copper).
+80 Experimental Setup and Sample Preparation
+The grid used to polarize the photocathode (actually it is at ground potential) is mounted on a copper
+holder, with an iron ring to put it under voltage.
+After mounting and cleaning of the photocathode, the resistance between the photocathode and the
+other parts of the circuit (guard-rings and collecting grid) was typically of a few hundred GΩ to a few
+TΩ (as measured by the Keithley 6430, see later). When applying a voltage of −100 V, typical
+measured leakage currents were below 0.4 fA.
+5.1.2.2 The Chamber
+Figure 5.3 : The chamber with some of the connectors
+The chamber has a volume of 2.5 dm$^3$. It is made of standard and custom components. It has various
+coaxial and triaxial connectors, as well as a KF-connector for pumping. The entrance window is a
+thin Beryllium window of $2 \times 1$ cm$^2$ size.
+Connections with the ammeter are performed with triaxial feedthrough connectors (by Pomona)$^1$.
+$^1$As the connectors to the ammeter are 3-slot male triaxial connectors, while the Pomona feedthroughs are 2-slot
+male triaxial connectors, 2-slot to 3-slot female triaxial adaptors made by Trompeter were used.
+5.1 Design of the measurement setup 81
+The preamplifier of the ammeter (see later) was directly connected to the chamber (via the adaptors)
+without adding any extra wire.
+The chamber was pumped thanks to a turbo-molecular pump. Yet no precaution was taken to reach
+ultra high vacuum. Only high vacuum was used to perform the measurements (to suppress any
+contribution of gas molecules to the measured quantum efficiency). This is justified by the need to
+develop photocathodes for gas-filled detectors, which have to work effectively in unclean environments.
+5.1.2.3 The Keithley 6430 ammeter
+The Keithley 6430 sub-femto ammeter is a high
+end electrometer by Keithley, whose main charac-
+teristic is the presence of a remote pre-amplifier
+with triaxial connectors, which reduces as much as
+possible the contribution of the leading cable to the
+measured signal.
+The 6430 possesses several modes of operation, includ-
+ing the possibility to measure very small currents
+while polarizing the sensor to a voltage in a range
+−210 V < U < 210 V (Source-Measure Concept).
+This mode was used to polarize the photocathode
+according to the schematic on figure 5.1. This
+Figure 5.4 : The Keithley 6430 ammeter
+mode is also the one providing the best internal
+precision of measurement [1, 2].
+The 6430 can also be used to measure electrical resistances up to 20 TΩ (the measurement is performed
+between the guard and the source). This mode was used to check the quality of the insulation
+(∼ cleanness) of the setup before each measurement.
+5.1.3 Results of calibration and test of the chamber
+To ensure that the setup provides reliable measurements of the photocathode quantum efficiency,
+tests were performed with the X-ray tube (all tests performed with a copper anode, acceleration
+parameters being 20 mA current, and 20 kV accelerating voltage).
+First the setup was tested without any photocathode. This enabled to measure the contribution
+of the grid (parasitic photoemission). For this, the schematics presented on figure 5.1 had to be
+inverted, so that the ammeter would actually measure the current emitted from the grid (as a negative
+contribution to the measured intensity). This intensity $I_0$ was $I_0 < 2$ pA. This contribution is superior
+to the typical leaking currents, but can be considered as negligible when compared to typical measured
+photo-currents (typical measured currents are of the order of 20pA to several hundred pA, see 7.1.2).
+In addition, this measurement corresponds to the absence of any electric field (no photocathode). In
+presence of electric field, the amount of grid photo-emitted electrons is reduced to its most energetic
+fraction. Other electrons cannot escape the attracting potential.
+82 Experimental Setup and Sample Preparation
+Figure 5.5 : Current-Voltage (I-U) characteristics of the experimental setup in presence of X-rays with a
+gold photocathode.
+With the same configuration (ammeter connected to the grid), tests were performed with a “non
+emitting photocathode”: a thick kapton foil with copper on the back layer to bias it. This was used
+to measure a hypothetical contribution of the surrounding materials (from the PEEK made holder).
+Again this contribution was extremely small, for no current could be recorded (contribution inferior
+to the intrinsic noise of the system ∼ 0.1 fA).
+This measurement also confirms, in agreement with the previous measurement (no bias, ammeter connected
+to the grid), that the contribution of the grid is very small.
+Last a reference system (gold deposited on a kapton foil by sputtering) was used to study the de-
+pendence of the electrons collection quantum efficiency on the bias voltage. The result is depicted in
+figure 5.5.
+A current saturation clearly appears for voltages inferior to −40 V . The non zero intensity for posi-
+tive bias can be explained by the proportion of photoemitted electrons with high kinetic energy (see
+[3]). Electrons emitted with energies superior to 100 eV (theoretically up to 20 keV for the tube was
+used with an acceleration of 20 kV ) have a sufficient energy to escape the attractive potential of the
+photocathode and so are counted. The small current value at positive voltages highlights the small
+proportion of energetic photoemitted electrons.
+Photoemitted currents as function of the electron intensity on the cathode also follows a very good
+5.1 Design of the measurement setup 83
+linearity with the X-ray tube current in the range [10 mA; 40 mA]: the photoemission is proportional
+to the flux of X-rays. This indicates that there is no saturation effect at those intensities (like charging
+of the surrounding material, which would affect the extraction electric field).
+5.1.4 Conclusion concerning the setup
+The test of the setup was a success: the setup shows very good characteristics for the measurement
+of very low currents. Its intrinsic noise is below 1 fA, and it can measure the typical currents
+emitted by the photocathodes (pA to nA). The Keithley ammeter guarantees $5\tfrac{1}{2}$ digits at those
+currents.
+Its high modularity enables the test of photocathode samples of very diverse sizes and characteris-
+tics. The setup can be used with various sources of X-rays: radioactive sources, X-ray tubes, and
+synchrotron beamlines.
+
+Bibliography
+[1] Keithley Instruments Inc., Private Communication with Keithley, 2004.
+[2] Keithley Instruments Inc., Keithley 6430 Manual, Chapter 5, 2000.
+[3] B.L.Henke et al., “The characterization of x-ray photocathodes in the 0.1-10kev photon energy
+range,” J.Appl.Phys., vol. 52(3), pp. 1509–1520, 1981.
+
+Chapter 6
+The different concepts to make a photocathode
+Different approaches were taken to try to increase the photocathode quantum efficiencies. Some ideas
+were explored only theoretically, while others -more promising- led to the fabrication of test-samples
+to compare them with reference photocathodes.
+6.1 Indirect conversion
+Figure 6.1 : A two step photons to electron conversion
+In this section, an indirect conversion of the X-rays into electrons is evaluated. The X-rays are first
+converted into lower energy photons thanks to a scintillating material, and then the photocathode
+converts those photons into electrons.
+The origin of this idea is the availability of photocathodes offering good quantum efficiencies in the
+visible or UV energy range (infra-red sensitive photocathodes were not considered as they involve
+88 The different concepts to make a photocathode
+cooling systems to suppress their intrinsic noise -due to thermal emission), while one can benefit from
+the yield of scintillators (several UV/visible photons created per incoming X-ray). In addition with
+this technique one can hope to convert 100 % of the X-rays into visible/UV photons, and so avoiding
+the presence of X-ray photons in the back-end electronic, which can be problematic (for the noise of
+the system mainly).
+If a fluorescent material can produce low energy photons with yields as high as 50, 000 photons/MeV ,
+if about one hundredth of those photons hit the photocathode (the solid angle corresponding to angle
+without total reflections is small), and if this photocathode has a quantum efficiency of 10 %, then
+for 10 keV incoming photons, the expected yield is:
+$$50{,}000 \times 0.01 \times \frac{1}{100} \times \frac{1}{10} \sim 0.5\ e^-/\text{photon}.$$
+This is of course only a theoretical value.
+Several aspects have to be considered when making such a system, including the predictable time
+response, which has to be compatible with high count rates and the resolution of the system, which
+must be compatible with the targeted pixel size.
+Some prototypes (like [1, 2, 3]) exploiting such an approach were already made for PET application
+(so with much higher photon energies), but none of them could provide good results until now. This
+study explores the principle in the case of lower energy X-rays.
+6.1.1 Photocathodes in visible and UV
+The requirement for the photocathode to work in the visible range are the same as for those working
+in the X-ray energy range. Yet, because of the difference of energy, one does not have to limit
+the research to high Z materials, so providing a much wider range of possibilities. This is very
+interesting as in general there are more materials with well controlled physical and chemical properties.
+Lastly, photocathodes working at low energies find a lot of applications in astronomy, photo-injectors
+(coupled with short-pulse lasers). At those energies they are typically found in photomultipliers and
+phototubes.
+The most common photocathodes in the visible/UV energy range (available industrially) are:
+Bialkali photocathodes such as Sb−Rb−Cs, Sb−K−Cs. They feature a spectral response in
+the optical and close UV. They are usually not very stable, and so their use cannot be envisaged.
+Multialkali photocathodes especially Na − K − Sb − Cs, which exhibit a very wide spectral
+response, from ultraviolet to wavelength as long as 930 nm.
+GaAs also with a very wide spectral response. Optionally, GaAs photocathodes are covered with Cs
+to make them NEA (negative electron affinity), but this is at the cost of a higher sensitivity to
+pollution.
+Solar Blind Photocathode especially GaN, KBr, CsBr, InGaN and Al$_x$Ga$_{1-x}$N. Most were
+developed for space applications (UV cameras, insensitive to light pollution due to the sun).
+Those photocathodes often exhibit quantum efficiencies of more than 30 %, at wavelength
+inferior to 350 nm. Among those photocathodes, GaN is the material which offers the most
+promising characteristics.
+6.1 Indirect conversion 89
+Diamond (C*) is a relatively new photocathode, which offers several advantages: it is rather stable
+[4] and NEA[5, 6] when plasma-hydrogenated. In addition in principle it suffers less than
+other materials from pollution due to organic gases such as methane (which is a good gas for
+amplification). Diamond photocathodes are obtained by CVD$^1$, or by low energy ion deposition
+of carbon. They are amorphous materials, which exhibit a mixture of sp$^2$ (graphite like) and
+sp$^3$ (diamond like) bonds (CVD deposited diamonds are usually better as they exhibit a higher
+proportion of diamond like bonds, and a better crystallinity). The surfaces are then treated by
+plasma hydrogenation in order to make the surface NEA. The problem comes from its sensitivity
+limited to wavelength inferior to 210 nm (large band gap semiconductor: 5.47 eV ).
+6.1.2 Scintillation materials
+There are various materials able to provide fluorescence photons at various energies. They are char-
+acterized by four main parameters:
+• The fluorescence yield, usually given in photons / MeV. The linearity of the yield is excellent
+for energies up to a few MeV.
+• The energy(ies) of emitted photons.
+• The time response of the scintillator, often there is a fast response corresponding to few photons
+and a slower one corresponding to a much higher yield, and to an energy slightly different.
+• The achievable resolution with the scintillator. This is strongly related to the thickness of the
+deposited layer. But on average, with a resolution of a few µm, most materials can absorb 100 %
+of the photons with energies below 30 keV.
+To obtain a competitive quantum efficiency, as shown in the calculation made in the introduction, a
+minimum yield of 10,000 photons/MeV is necessary.
+As said previously, it would be best to have a photocathode sensitive to UV light. So the fluorescent
+material needs to have a good yield at those wavelengths (typically less than 350 nm).
+Also, the aim of the project is to build a detector able to work in counting mode, and with a typical
+count rate of the order of 1 MHz. This means the decay time constant of the fluorescence must be
+at least one order of magnitude smaller, so of the order of 100 ns.
+Here is a list of the most commonly used scintillation materials with high yields, small decay times,
+and maximum of emission at wavelengths below 500 nm [7]:
+NaI(Tl) is one of the most common scintillators. Pure NaI offers a maximum yield of 76,000 photons/MeV
+at $\lambda_{max}$ = 303 nm, and with a scintillation decay time constant of 60 ns. It is more often used
+doped with thallium, and then has the following parameters: $\lambda_{max}$ = 415 nm, with yield
+38,000 photons/MeV and a decay time constant of 230 ns.
+BaF2 is interesting because it emits very energetic photons: the fast component, which is 25 % of
+the total yield is at 220 nm with a yield of 2500 photons/MeV and a decay time constant of
+0.6 ns. The main maximum is at 310 nm with a decay time constant of 630 ns.
+1CVD stands for Chemical Vapor Deposition
+90 The different concepts to make a photocathode
+CsI(Na) has a maximum emission at 420 nm, with a total yield of 38, 000 photons/MeV and a
+decay time constant of 630 ns.
+CaF2(Eu) has its maximum at 435 nm, a yield of 19, 000 photons/MeV , and a decay time constant
+of 630 ns.
+K2LaCl5(Ce) has its maximum at 380 nm, with a yield of 30, 000 photons/MeV , and a decay time
+constant of 80 ns.
+LaCl3(Ce) has its maximums at 330 − 352 nm with a yield of 49,000 photons/MeV, with several components,
+which have all a decay time constant inferior to 200 ns.
+LaBr3(Ce) has its maximums at 358− 387 nm, a total yield of 61, 000 photons/MeV , and 90 % of
+the emission occurring before 90 ns.
+Lu2Si2O7(Ce) (LPS) has a total yield of 23, 000 photons/MeV , with maximums of emission at
+380− 385 nm, and a decay time constant of 38 ns.
+LuI3(Ce) has a maximum emission at 465 nm, with a yield of 33, 000 photons/MeV , and a decay
+time constant of 34 ns.
+RbGd2Br7(Ce) has a maximum of emission at 420 nm, with a yield of 56, 000 Photons/MeV , and
+a decay time constant of 43 ns.
+BrilLanCe® 350 and 380 of formula LaCl3(10%) and LaBr3(5%) by the Company St Gobain are
+also very interesting: BrilLanCe® 350 for example offers a maximum of emission at 350 nm,
+with a yield of 49,000 photons/MeV, and a decay time constant of 28 ns.
+In conclusion, there are a lot of materials providing maximums of emissions in the close ultra-violet
+energy range, with acceptable decay time constants, and good yields. Unfortunately, all high yield
+materials are limited to wavelengths superior to 300 nm, which is a problem as shown next.
+6.1.3 Possible combinations
+To obtain a good quantum efficiency, it is of course mandatory that the maximum of emission (and
+more generally, the whole spectrum of emission) of the scintillation material be contained in the
+spectrum of sensitivity of the photocathode.
+For the same reasons as previously exposed, it is also necessary that the photocathode exhibits a good
+robustness to pollution and to irradiation damages. The robustness to pollution of the scintillator
+is less important, as, if enough care is taken, it can be well protected by the photocathode and the
+substrate.
+This leaves few choices of photocathode.
+Diamond
+In spite of its very interesting characteristics of quantum efficiency, diamond cannot be chosen, for
+its sensitivity starts at energies unreachable by scintillation processes. In addition, diamond is not
+yet well known as a material, and only a few groups can produce diamond with a sufficient quality
+(in terms of crystallinity, hydrogen activation quality, purity of the material). Yet diamond is now
+6.1 Indirect conversion 91
+a subject of great interest for applications in the field of photocathodes (solar blind, for space ap-
+plications), so it might become an interesting alternative in the future, also if suitable scintillation
+materials are discovered in the future.
+Bialkali and Multialkali
+Bialkali and Multialkali are very interesting because they offer a good sensitivity at the emission peaks
+of high yield scintillators. Unfortunately they are also extremely sensitive to pollution and moisture,
+and even protective layers do not prevent loss of yield after short exposure to polluting environments
+[8].
+GaN and relatives
+Those photocathodes have been the subject of a lot of studies for they offer a very good quantum
+efficiency below the long-wavelength cut off (typically Q.E. ∼ 0.4) while having a very low quantum
+efficiency above this cut-off. This is of special interest for solar-blind detectors in space applications.
+In our case this means that they could be coupled to high-yield scintillators to form a two step X-ray
+photocathode. In particular an association of a NaI scintillator and GaN photocathode seems to be
+a promising combination.
+Alas, those photocathodes also require a good vacuum to work effectively. So for the same reasons
+as previously, they cannot be used in detectors using gas amplification.
+Protected photocathodes
+Studies have been made to try protecting UV and visible photocathodes for the specific case of gas-
+filled detectors [8]. The possibility exists to effectively reduce the sensitivity of the photocathodes to
+moisture and oxygen (the main contributors to the degradation of the photocathodes in unclean envi-
+ronments), but at the cost of a highly-reduced quantum efficiency (at maximum 10 %, the protection
+depending on the thickness of the protecting layer).
+6.1.4 Conclusion
+It appears clearly that in spite of its promises it will be difficult to build a two-step photocathode for
+X-ray detection.
+Diamond seems to be the most promising material, for it is a robust material (yet no real studies of
+the stability of the hydrogenated surface -by plasma activation or else- could be found), but short
+wavelength scintillators have still to be found. Otherwise carbon does not offer the stopping power
+mandatory to enable a good quantum efficiency with X-rays without a first conversion stage.
+The other materials unfortunately do not offer a stability good enough to guarantee a good reliability
+when used in gas-filled detectors.
+92 The different concepts to make a photocathode
+6.2 Direct conversion
+As an indirect conversion does not seem to be a good way of designing a photocathode for gas-filled
+detectors, a direct conversion has to be used.
+There are various possibilities to better the quantum efficiency of the photocathodes presented in
+section 3.3. Three approaches were studied theoretically and experimentally in the scope of this work
+to try bettering the quantum efficiency of photocathodes in the X-ray energy range:
+• Modify the geometry of the photocathode in order to maximize the yield of a material,
+• Use of sharp tips to profit from a field emission phenomenon,
+• Investigate new materials in order to find one with better properties.
+All three approaches are detailed in the following subsections:
+6.2.1 Modify the geometry to increase the yield of one material
+As explained in section 3.1, the yield of the photocathode depends directly on the ratio $\frac{l_a}{L}$, where $l_a$
+is the absorption length and $L$ is the scattering length.
+Figure 6.2 : The impact of the incidence angle of photons on the active area (contributing to the yield).
+This formula is valid in the case of photons with a direction perpendicular to the surface. Indeed
+in the case of photons with slanted directions, the apparent thickness is increased, leading to more
+photons absorbed in the active area (distance to the surface inferior to L). With the definition of the
+angle α of Figure 6.2, the theoretical increase of quantum efficiency is a factor $\frac{1}{\cos(\alpha)}$:
+$$\text{Efficiency} \propto \frac{l_a}{L} \cdot \frac{1}{\cos(\alpha)}. \qquad (6.1)$$
+This was measured by D.P.Lowney et al. in [9] in the case of CsI, and the measurements show a
+good agreement with the formula.
+6.2 Direct conversion 93
+To use this effect, the classical way is the use of a grazing incidence. Unfortunately, this leads also
+to technological problems, and to the impossibility of making large areas detectors. So in this work
+the possibility to use microstructures was investigated.
+More generally this approach consists in increasing the surface to volume ratio of the material, as
+this increases the active area. In fact the best available photocathodes have a controlled microstruc-
+ture, which maximizes this surface to volume ratio (often a columnar structure obtained during the
+deposition of the material).
+The main requirement for the microstructures concerns their size: they should be much smaller than
+the pixel size (collecting anodes in the case of a gas amplification), which means structures with
+typical sizes of less than a micron.
+Various ways of playing with the geometry were tested during this study, as will be shown in the
+coming subsections. Only systems which can be obtained on large surfaces for a reasonable price were
+used during this study.
+6.2.1.1 Porous Photocathodes
+The most straightforward way of creating a structure is the use of a porous material. Indeed this
+enables the creation of a much larger surface (so a greater active area) actually reached by the photons
+(then the absorption length becomes $\frac{l_a}{\text{Porosity}}$, where Porosity is the fraction $\frac{V_{pores}}{V_{total}}$ in the material).
+But as explained in the previous section, with increasing porosity, the probability that emitted elec-
+trons reach the actual surface of the photocathode also decreases for the electrons have to find their
+way through the connected pores or even through thin walls between pores to then exit the pho-
+tocathode. While M.P Lorikyan [10] published interesting results using this sort of materials, the
+measurements could not be later confirmed, and doubts subsist concerning a possible amplification
+inside the pores, which would affect the measurement of the quantum efficiency (as several electrons
+would be detected per single detected photon).
+Still a similar approach was used for some of the samples prepared, and results are given in the next
+chapter.
+6.2.1.2 Regular Structures
+Modern photocathodes always have a microstructure, which maximizes the surface to volume ratio,
+in order to have a maximum active area. Yet the structure is not fully controlled as it is most often
+obtained by carefully controlling the deposition parameters so that the photocathode material adopts
+a columnar growth [11]. So there is little control on the actual structure of the deposited material.
+Another approach can be the use of a patterned substrate or a process able to imprint the desired
+structure in the material, so that the geometry of the deposited material is well controlled and opti-
+mized.
+The main problem of structured photocathodes lies in the lack of escape path for electrons reaching
+vacuum (or the gas) at a point far from the surface of the photocathode. The solid angle is indeed
+94 The different concepts to make a photocathode
+inversely proportional to the square of the aspect ratio of the structure$^2$.
+Figure 6.3 : Two examples of regular Structures.
+There are some requirements to respect to guarantee a minimum quantum efficiency of the photo-
+cathode:
+• Since the photocathode has to work in transmission, special care must be taken to guarantee an
+excellent transparency to X-rays of the substrate. Ideally the substrate is thin, made of low Z
+material, and flexible in order to guarantee a good mechanical robustness. Organic materials
+like kapton or some sorts of polymers are good candidates.
+• The process used to create the structures must be adaptable to large surfaces at an acceptable
+price. In particular, etching technologies or holographic-based technologies, which are common
+in the semiconductor industry should be avoided, for their costs increase dramatically with large
+surfaces. On the other hand, physical engraving technologies are well adapted (see the example
+of the Trizact Sample in the next Chapter).
+• The uniformity of the pattern has to be good enough to guarantee a good homogeneity of the
+conversion efficiency.
+As said before, typical sizes of the structures must be small enough to ensure that they will have no
+impact on the uniformity of the image.
+In addition, in theory it would be best to match the typical escape length3 of the emitter material.
+Indeed smaller sizes will not enable to minimize the transparency and larger sizes will result in a loss
+of flux in the active area of the photocathode.
+But in practice the typical values of L are very hard to obtain (for example L(Gold) ≈ 2 nm and
+L(CsI) ≈ 50 nm), and as the photocathode works in transmission, it is better to deposit a thin
+layer of the high yield material (thus high stopping power) on top of a low stopping power structured
+material, so that a maximum flux of photons reaches the active area of the material.
+Concerning the shape, a trade-off must be done between two different requirements:
+$^2$For example, in the case of a square well of surface $l^2$ and depth $h$, the solid angle from the bottom of the well
+is $\frac{l^2}{4\pi h^2}$ ($\propto \frac{1}{(\text{Aspect Ratio})^2}$).
+3the escape length is inferior to the scattering length because of the work-function/electron affinity of the material.
+6.2 Direct conversion 95
+1. The higher the aspect ratio, and the higher the angle with the surface of the structure, the
+larger the active area,
+2. The smaller and the more separated the structures are, the higher the electron escape solid
+angle is, and so the higher the escape probability.
+It is also better to have non rectangular like shapes, as the active area is very thin. Pyramidal, or
+conic like shapes, offer a larger surface of the photocathode with an oblique surface with respect to
+the X-rays.
+Those shapes also enable a better penetration of the electric field between the structures, and offer
+a larger solid angle for electrons allowing exit from the bulk of the material far from the top of the
+structures. Indeed, the surface of the material often exhibits an attractive potential to electrons in
+the gas (except in the case of NEA materials), so electrons are likely to return back in the material
+again before reaching the surface of the photocathode.
+To increase the escape probability of the electrons, one has to use an electric field. Unfortunately,
+also the efficiency of the electric field is limited: Figure 6.4 depicts the result of the simulations of
+the electric field in the case of metallic structures with rectangular and triangular shape by means
+of a Finite Element Method (the simulations were performed with Comsol Multiphysics). The back
+surface (flat) of the structure was at ground potential, while a ”collecting plane” above the structures
+was at a potential of 100 V .
+It appears in the simulation, that the electric field penetrates more into the triangular structures. In
+both cases yet, the values reached are very small. Fortunately, most electrons exit the bulk material
+with energies of only a few eV , so even a small electric field can have a strong impact on the collection
+of the electrons.
+In conclusion, the simulations show that the aspect ratio ($\frac{\text{Height}}{\text{Width}}$) of the structures cannot be very
+high, otherwise the electrons created far from the surface will not be extracted.
+96 The different concepts to make a photocathode
+Figure 6.4 : Simulations of the electric field in triangular and rectangular structures.
+6.2 Direct conversion 97
+6.2.2 Field emission
+Figure 6.5 : Simulation of the electric field in the case of silicon sharp tips.
+As explained in section 3.1, the most important parameter for photocathode quantum efficiencies con-
+cerns the electrons extraction of the material. Several studies [12, 13, 9] were performed to evaluate
+the effect of an electric field to diminish the potential barrier electrons have to overpass to reach vac-
+uum (the electron affinity/work function). Those studies showed that a strong electric field is needed to
+have a real impact on the quantum efficiency of the photocathodes. This can be explained by the much
+higher value of the dielectric permittivity in solid materials (ex. ε(CsI) = 6.3 and ε(Si) = 12) than
+in gas/vacuum (ε(vac.) = 1): in the case of two dielectrics superposed, the proportion of the energy
+stored in both materials is the inverse of the ratio of the electric permittivities. As a result the electric
+field has a very small value inside the material, and does not much affect the dynamics of the electrons
+in the material (see the simulations by finite elements of metal microstructures on Figure 6.4). To
+create a strong field inside the material, one has to connect electrodes to the photocathode, which is
+of course not possible in the case of electro-emitters (the electrode would take the role of the emitter).
+In order to improve the electric field, it was envisaged to use sharp tips to profit from the concentration
+of the electric field around sharp tips (Tip effect), and so create a field emission system.
+Figure 6.5 depicts the result of the simulation by the finite element method of such sharp silicon tips.
+98 The different concepts to make a photocathode
+Indeed, a strong electric field appears at the top of the tips.
+Such arrays were already successfully used in association with short pulse UV-lasers for photo-injectors
+systems [14], and could be interesting for photon-detection systems. Tests were performed with
+silicon-made tips arrays in order to test the efficiency with X-rays.
+6.2.3 A new material: CsI3
+In parallel to the work made to enhance the emission properties of known materials by changing the
+geometry of those materials, new materials were investigated. Following the example of CsI, which
+is currently the best material in terms of quantum efficiency, various iodides were studied.
+In particular, CsI3 as a derivative material of CsI was found to share some interesting physical
+properties with CsI, while solving some issues specific to CsI.
+Bibliography
+[1] G. Charpak et al., “Some studies of the application of csi photocathodes in gaseous detectors,”
+Nucl. Inst. and Meth. A, vol. 333, pp. 391–398, 1993.
+[2] J. Van der Marel et al, “A microgap photomultiplier for the read-out of a laf3 : Nd(10%)
+scintillator,” Nucl. Inst. and Meth. A, vol. 410, pp. 229–237, 1998.
+[3] F.Garibaldi et al, “A pet scanner employing csi films as photocathode,” Nucl. Inst. and Meth.
+A, vol. 525, pp. 263–267, 2004.
+[4] A.Laikhtman et al., “Absolute quantum photoyield of diamond thin films: Dependence on sur-
+face preparation and stability under ambient conditions,” Nucl. Inst. and Meth. A, vol. 73,10,
+pp. 1433–1435, 1998.
+[5] J.Robertson et al., “Band diagram of diamond and diamond-like carbon surfaces,” Diamond and
+Related Materials, vol. 7, pp. 620–625, 1998.
+[6] D.Vouagner et al., “Photoemission properties and hydrogen surface coverage of cvd diamond
+films,” Diamond and Related Materials, vol. 13, pp. 969–974, 2004.
+[7] M.Globus et al., Inorganic Scintillators For Modern And Traditional Applications. National
+Academy of Sciences of Ukraine., 2005.
+[8] E.Shefer et al., “Photoelectron transport in csi and csbr coating films of alkali antimonide and
+csi photocathodes,” J.Appl.Phys., vol. 92(8), pp. 4758–4771, 1993.
+[9] D.P.Lowney et al., “Characterization of csi photocathodes at grazing incidence for use in a unit
+quantum efficiency x-ray streak camera,” Review of scientific instruments, vol. 75,10, pp. 3131–
+3137, 2004.
+[10] M. P. Lorikyan, “Study of counting characteristics of porous dielectric detectors of radiations,”
+Nucl. Inst. and Meth. A, vol. 515, pp. 701–717, 2003.
+100 BIBLIOGRAPHY
+[11] H.S.Cho et al., “A columnar cesium iodide (csi) drift plane layer for gas avalanche microdetec-
+tors,” IEEE transaction on Nuclear Science, vol. 45(3), pp. 275–279, 1998.
+[12] A.Breskin et al., “Electric field effects on the quantum efficiency of csi photocathodes in gas
+media,” Nucl. Inst. and Meth. A, vol. 344, pp. 537–546, 1994.
+[13] A.Breskin et al., “New ideas in csi-based photon detectors: Wire multiplication and protection
+of the photocathode,” IEEE Trans.Nucl.Sci, vol. 42(4), pp. 298–305, 1995.
+[14] e. J. M. Nation, “Advances in cold cathode physics and technology,” Proceedings of the IEEE.,
+vol. 87, 5, pp. 865–889, 1999.
+Chapter 7
+Experimental tests and discussion of the
+results
+Not all the different approaches to improve the photocathodes were experimentally tested. In partic-
+ular, the indirect conversion photocathodes were not actually fabricated, for no good combinations
+of scintillators and emitters could be found. Otherwise, most ideas to improve the photocathode
+quantum efficiencies were tested. This section follows the structure of the previous one and gives the
+experimental results obtained.
+7.1 Modify the geometry to increase the yield of a material
+As previously explained, the approach of modifying the geometry of one material consists in benefiting
+from the increasing of the quantum efficiency in the case of an oblique incidence of photons on the
+surface of the photocathode material. Only samples potentially manufacturable as large surfaces were
+used.
+Mainly two types of structured photocathodes were tested:
+Random Structures were actually sand paper materials normally used for the roughening of surfaces.
+The different grades of papers made it possible to test further the impact of the structure sizes on the
+quantum efficiency.
+Periodic Pyramidal Structures were special sorts of sand paper available in a very special and
+periodic shape. They are normally used for highly demanding polishing applications (in terms
+of uniformity, and robustness of the paper).
+The reference sample was a flat Kapton foil.
+Those samples were covered with 0.2−0.4 µm of gold by argon ion sputtering (the thickness could not
+be precisely controlled, so the thickness was evaluated thanks to the given deposition characteristics
+of the machine). This thickness was sufficient to ensure a maximum yield (thickness greater than the
+escape length) while not changing radically the structure shapes.
+102 Experimental tests and discussion of the results
+7.1.1 Analysis of the microstructures characteristics
+Several samples were created and their structures were analyzed both with an optical and a scanning
+electron microscope (SEM).
+First a flat kapton foil was taken as a reference photocathode.
+For the random structures, the samples were the following (SEM images):
+Figure 7.1 : Grade 280 sample: Random structures of sizes ∼ 100 µm.
+Figure 7.2 : Grade 800 sample: Random structures of sizes ∼ 20 µm.
+Figure 7.3 : Grade 1200 sample: Random structures of sizes ∼ 10 µm.
+Those samples were made with normal sand paper, normally used for grinding of surfaces. Higher
+grades correspond to a finer smoothening, so structures are smaller and more numerous. The sizes
+indicated under each picture (7.1, 7.2, 7.3) are those of the largest structures (covering most of the
+surface), and are always surrounded with smaller structures.
+For the periodic structures, the special Trizact 143 paper by the company 3M was used. Those
+structures are obtained by positive engraving in a special polymer and are available in large areas.
+Figure 7.4 : Periodic Structures seen from top (SEM image), size of structures ∼ 500 µm.
+Figure 7.5 : Periodic Structure seen from the side (Optical Microscope).
+The side surfaces form an angle of ∼ 57° with respect to the base plane (averaged on several pyramids).
+7.2 Field Emission 103
+7.1.2 Efficiency measurements
+The different samples presented were all covered with a layer of gold of thickness ∼ 0.3 µm. This
+thickness is far bigger than the escape length of gold (a few nm), so there is no contribution to the
+yield from the substrate. The structures are much larger than the gold thickness, and there was
+no attenuation observed of the quantum efficiency due to a ”smoothening” of the surface by the
+deposited layer (different thickness of deposited gold gave the same results).
+The results are presented compared to a flat surface of gold obtained in the same conditions in table
+7.1 (X-ray tube parameters: 20kV acceleration voltage, 20mA intensity, with Cu anode):
+Substrate Gold Thickness (µm) Measured Current (pA)
+Kapton 0.3 18.5± 0.9
+Sand Paper Grade 280 0.3 22.4± 1.1
+Sand Paper Grade 800 0.3 20.8± 1.0
+Sand Paper Grade 1200 0.3 19.4± 0.9
+Trizact 143 0.3 34.65± 1.7
+Table 7.1 : Measured intensities for the gold-covered structured papers
+The best sample is the Trizact 143, which indeed offers the largest inclined surface (so a higher active
+area). It should be noted that with respect to the flat Kapton sample, there is a factor
+$$\frac{34.65}{18.5} = 1.87 \approx \frac{1}{\cos(57^\circ)} = 1.83$$
+as predicted by the formula in section 6.2.1.
+Sand papers do not give results as good as the periodic trizact samples, probably because the structure
+covered surface is much smaller than that of the trizact samples.
+7.2 Field Emission
+Silicon sharp tips were obtained and tested to evaluate their potential in the case of X-ray photo-
+cathodes.
+7.2.1 Analysis of the microstructure characteristics
+The sample is formed of a periodic array of 4.5 µm separated tips, engraved in a silicon wafer.
+104 Experimental tests and discussion of the results
+Figure 7.6 : Si Tips Array SEM images at 10 µm and 2 µm resolution. No better image could be obtained
+because of space charge effects.
+Due to the small dimension of the tips, neither the SEM images nor the optical ones enabled us to
+obtain detailed information about their shape. Yet the SEM images do show an effect of emission
+enhancement at the tips tops (Figure 7.6).
+7.2.2 Efficiency Measurements
+The measurement of the quantum efficiency of silicon tips as X-ray photocathodes showed that silicon
+tips are not a good choice for no signal could be detected. This demonstrates that the yield is very
+small.
+This can be explained by the small stopping power of silicon in the case of X-ray photons. For
+photons penetrate deeply in the material before being stopped, the electrons are created too far
+from the surface to drift and exit the bulk (in the case of moderate electric field as presented in the
+simulations detailed in section 6.2.2).
+It is likely that a strong electric field could enhance the yield, but such a field is not compatible with
+gas amplification.
+7.3 CsI3 as a new photocathodes material
+7.3.0.1 Physical and chemical characteristics
+CsI3 is a dark reddish-brown solid material, with a standard density of 4.51 g/cm$^3$, and melting
+point of 207.5 °C. Its crystal structure was first studied in 1925 by Bozorth et al.[?], and later refined
+by H.A.Tasman et al. and by J.Runsink et al.[?, ?] and belongs to space group Pmcn.
+Extensive studies (complete phase diagram) on the manufacturing of polyiodides of caesium can be
+found in [?] ; the material is also available from major chemicals companies such as Sigma-Aldrich
+or Alfa Aesar or can be easily synthesized from CsI and I2 [?].
+7.3 CsI3 as a new photocathodes material 105
+It is not stable under vacuum at room temperature but it releases I2. L.E.Topol indicates in [?] that
+the partial vapor pressure can be obtained from the formula
+$$\log(P_{CsI_3}\,[\text{Torr}]) = \frac{-4269 + 0.20\,(T - 273)}{T} - 2.013 \log T + 16.2548. \qquad (7.1)$$
+In particular, at a temperature of 25 °C, $P_{CsI_3} \approx 10^{-3}$ Torr $= 1.33 \cdot 10^{-3}$ mbar and at 40 °C:
+$P_{CsI_3} \approx 4.14 \cdot 10^{-3}$ Torr $= 5.51 \cdot 10^{-3}$ mbar.
+More detail (including (E−Eo), ∆G associated to the system CsI−CsI3) can be found in [?]. The
+differential free enthalpy is $\Delta^o_f = -358$ kJ mol$^{-1}$.
+Indeed when CsI3 was left on the photocathode holder in vacuum, a layer on surroundings metals
+appeared, which is a sign of reaction with I2 (the layer showed the same aspect as when exposed to
+vapors of I2 obtained from solid iodide). Also the color of the sample rapidly changed to a brighter
+one (yellowish, after a few hours in vacuum), which is also a sign of the appearance of CsI at the
+surface (CsI is white or transparent, depending on its crystallinity). After 1 week in vacuum at a
+pressure of ∼ 10−5 the sample had lost as much as 12 % of its weight. Unfortunately we could not
+leave it under vacuum for a longer time to test further the stability of solid blocks (to check whether
+there is only surface transformation, which acts like a passivation layer, or deeper degradation and
+if a denser block would degrade the same way). The scanning electron microscope (SEM) analysis
+confirms an evolution of the material microstructure (see figures 7.7 and 7.8):
+Kept in air at atmospheric pressure, there was no visible evolution after several months, apart from
+the plastic box, which turned into red (like it did with other compounds such as AuI, known to re-
+lease I2), which indicates that the evolution is slow, as soon as the equilibrium pressure of I2 is reached.
+7.3.1 The CsI3 samples
+Different flavors of CsI3 samples were obtained and tested. For each the analysis of the microstructure
+and the quantum efficiency measurements were performed. CsI3 is unstable under vacuum, so an
+analysis of the microstructure evolution under vacuum was performed.
+Samples of CsI3 were created following two ways:
+1. CsI3 was ordered from the company Sigma-Aldrich, and pressed into a pellet with a die-press
+set. A pressure of 3.5 GPa was enough to obtain a solid sample.
+2. CsI samples were exposed to I2 vapors (CsI with solid I2 in a closed bottle in a furnace at
+30oC). The solid state reaction is very slow. We had to wait several days to observe a reaction
+of the bulk of the material. This method has the advantage that it is possible to compare
+directly nearly identical CsI and CsI3 samples.
+CsI3 samples obtained were tested and compared with CsI and gold. CsI is an insulator, therefore
+it is hard to test due to charging effects. To overcome the space charge, conductive CsI(C) samples
+were made, and compared with CsI3(C).
+106 Experimental tests and discussion of the results
+7.3.1.1 Preparation of the different samples
+Samples obtained from CsI3 as supplied
+CsI3 was obtained from the company Sigma-Aldrich (the vendor guarantees a purity better than
+99.99x %).
+The product came as a fine powder, which was then pressed into a pellet in a hydraulic press die,
+at a pressure of 4GPa for 5 minutes.
+Samples obtained from CsI crystals, in presence of I2 vapors
+Samples of CsI(T l) crystals grown for fluorescence applications were obtained from the company
+Saint-Gobain.
+The samples come in the form of a polished crystal (transparent to light, colorless). It was then
+exposed to I2 vapors at a temperature of ∼ 40 °C for several days. Already after a few minutes, the
+color of the crystal had changed into one very close to that of CsI3. After several weeks in presence
+of I2, the sample is hard to distinguish from the one obtained from the CsI3 powder.
+CsI was also tested. To do this, it was placed rapidly after opening (less than 5 minutes in air) on the
+experimental setup in vacuum and tested. Unfortunately, this test was not relevant, as explained later.
+Samples obtained from a powder of CsI mixed with carbon in order to reduce
+the space charge
+The CsI crystals from St Gobain could not be tested directly because of charging effects. So high
+purity CsI powder (from the company Sigma-Aldrich) was mixed with graphite in order to increase
+its conductivity. Those samples enabled a direct comparison of CsI and CsI3.
+Because CsI is a hygroscopic material, all manipulations were done under protecting atmosphere, in
+a glove box. The sample was then rapidly mounted on the experimental setup (less than 5 minutes)
+and put under vacuum for testing.
+The received CsI was ground and mixed with graphite in a mortar. The sample composition was
+0.5 % of graphite-carbon and 99.5 % high purity CsI.
+It was then removed from the glove box, put in a die and pressed at 6 GPa for 2 minutes. Immediately
+after it was mounted and put under vacuum. This way, the sample stayed less than 5 minutes in
+air between its removal from the glove box, and the start of the pump.
+A second sample prepared the same way, was treated in iodine vapors in order to transform it to
+CsI3(C) (left in a furnace at a temperature of 40 °C for one week).
+Porous CsI Photocathodes
+Porous CsI photocathodes by the company Luxel were tested for comparison purpose. Those pho-
+tocathodes have a microstructure, which is optimized for a use in X-ray cameras. They give an
+indication of the maximum yield obtainable with CsI. Those photocathodes are shipped in a sealed
+flask filled with an inert gas to protect them from moisture. As for the previous samples, they were
+mounted in the clean room and evacuated in less than five minutes.
+7.3 CsI3 as a new photocathodes material 107
+7.3.1.2 Analysis of the microstructures of the samples and their evolution
+The CsI3 samples were stored in the clean room, in non hermetic plastic boxes. No visible change
+of aspect could be observed after several months, and no evolution of the microstructure was visible
+with the scanning electron microscope.
+However, under vacuum a clear evolution was observed. Details of the sample evolution under vac-
+uum are the following:
+Samples obtained from pure CsI3
+The evolution of the microstructure of the sample was observed by SEM (a Gemini Leo 1530 ):
+The surface microstructure of the pressed sample is depicted in the Figure 7.7.
+Figure 7.7 : CsI3 as pressed SEM images. Left image is a large field picture with resolution ∼ 10 µm,
+right image is a closer view with resolution ∼ 2 µm.
+This sample was left for one week under vacuum at a pressure of ∼ 10−6 mbar. The sample was then
+re-examined by SEM. The result is depicted in Figure 7.8.
+Figure 7.8 : CsI3 samples SEM images, after the sample was placed for one week in vacuum. Left image
+is a large field picture with resolution ∼ 2 µm, right image is a closer view with resolution ∼ 1 µm.
+108 Experimental tests and discussion of the results
+There is a clear evolution in the microstructure, which has become much more porous. In the mean-
+time, the color of the sample changed from dark to a white yellowish one (close to the color of CsI).
+This is further indication of the reaction
+$$\mathrm{CsI_3 \rightleftharpoons CsI + I_2}. \qquad (7.2)$$
+Samples obtained from CsI exposed to I2
+The study of the samples made from CsI3 enabled to study the microstructure evolution of the
+material in vacuum. It is also interesting to study the evolution of microstructure of samples of CsI
+after they were exposed to I2 and then placed in vacuum.
+The following pictures depict the evolution of the samples made of pure CsI mixed with 0.5 % of
+carbon: ”CsI(C)”.
+As pressed, the microstructure of this sample is depicted in Figure 7.9.
+Figure 7.9 : CsI(C) at 20 (left), 10(center), and 2 µm resolution (right).
+After exposure to I2 for two days, no visible evolution of the microstructure was observed.
+But after one night in vacuum, the structure becomes the following (Figure 7.10).
+Figure 7.10 : CsI(C) at 20 (left), 10 (center), and 2 µm resolution (right) after the sample was exposed to
+I2 and placed one night in vacuum.
+The samples obtained from the CsI(T l) crystals show the same evolution (visible on Figure 7.11).
+7.3 CsI3 as a new photocathodes material 109
+Figure 7.11 : CsI(T l) Crystal by St Gobain Before any treatment (left), and after it was exposed to
+I2, and placed one night in vacuum (right).
+Before any treatment, most of the surface is flat like on picture 7.11 left (polished sample). The
+right picture highlights the complete change of the surface after the exposure to I2 and vacuum.
+This evolution follows the same trend as for the compacted CsI3 samples. The difference of obtained
+microstructure can be explained by the difference of the CsI microstructure before exposure to I2.
+When the structures are left in vacuum for longer periods, no visible change occurs at the surface.
+Porous samples of CsI
+Those samples are obtained from the company Luxel and have a microstructure optimized for the
+detection of X-rays in streak cameras.
+Indeed they show a spongy structure as depicted in pictures 7.12.
+Figure 7.12 : CsI optimized for streak cameras from the company Luxel. The left SEM image is shot
+with a resolution of ∼ 20µm, the right one with a resolution of ∼ 1µm. Space charges on the sample prevented
+us from obtaining a better image.
+As presented in section 6.2.1.1, this sort of structure is a way to obtain a large surface of the material
+110 Experimental tests and discussion of the results
+and then, a large active area (cf. 6.2.1).
+It should be noted that this sample has a microstructure which is similar to that of the CsI samples
+exposed to I2 and then placed in vacuum.
+So the exposure to I2 appears as a way to obtain a granular microstructure of the CsI.
+This is an important result, as this method is much easier than the complex deposition
+processes normally used to obtain such materials.
+This result will be further detailed in the conclusion concerning the use of CsI3 as a photocathode
+material.
+7.3.2 CsI3 quantum efficiency and comparison with CsI.
+The quantum efficiency of CsI3 was evaluated and compared to that of CsI, both before and after
+exposure to air. See chapter 5 for details concerning the experimental setup.
+7.3.2.1 The quantum efficiency of CsI and its evolution in air
+Measurement of the quantum efficiency of clean CsI
+Those measurements were done for calibration and comparison purpose, as this subject was already
+widely studied in the past.
+Yet, few authors provide results of the quantum efficiency after exposure to air (at best short exposures
+and techniques to recover the virgin quantum efficiency [29, ?, ?, ?, 32]).
+The best quantum efficiency one can obtain is measured in our case by the quantum efficiency of
+the samples provided by the Luxel company. Those samples are optimized for a very high quantum
+efficiency: thick deposited layers, with an adapted microstructure.
+The best quantum efficiency was obtained right after introduction of the sample in the chamber.
+With our setup, a maximum current of 1144 ± 57 pA was recorded. The second sample gave
+1115± 55 pA (3% difference, can be attributed to a slight degradation of the sample during its ma-
+nipulation, or to a difference in the sample itself).
+Those results were compared with the samples obtained from the CsI mixed with 0.5 % of carbon.
+The intensity obtained was 144± 7.2 pA.
+While this lower intensity can be explained by an effect of the structure of the sample (as explained
+before, prior to exposure to I2, the surface of the CsI(C) sample was very flat), it is likely that the
+conditions of cleanliness during the preparation of the chamber cannot guarantee a maximum quantum
+efficiency of the CsI photocathode prepared this way: the quantum efficiency of CsI as a secondary
+emitter depends strongly on the state of cleanliness of the sample surface (cf. section 3.3.4). Since
+the CsI used to prepare the sample was ground and pressed during the preparation process (see sec-
+7.3 CsI3 as a new photocathodes material 111
+Time in air Intensity measured (pA)
+0 1144± 57
+1 day 736± 36
+30 days 113± 5.6
+Table 7.2 : Evolution of the current of the porous CsI sample after it was left in air.
+tion 7.3.1.1), it may have been polluted, despite the care taken to clean the mortar and the die used.
+Evolution of the quantum efficiency of the porous CsI in vacuum and after
+exposure to air
+CsI is known for being sensitive to pollution, and in particular to moisture. Tests were performed in
+order to compare its stability with that of CsI3.
+• Evolution of the quantum efficiency of CsI in vacuum.
+The vacuum in which the measurements were performed is not ultra high. The measured pressure
+next to the chamber was in the range 10−5 to 10−4 mbar. This pressure is high enough to cause
+contamination of the surface on the long-term.
+Under such conditions, a degradation of the quantum efficiency of the porous CsI was recorded
+after only a few days: the quantum efficiency after 2 days was at a value of 1040 ± 52 pA. This
+corresponds to a drop of quantum efficiency of 9%.
+This highlights the necessity to keep the photocathode in a very clean environment, as already
+reported.
+In the same time, no drop of intensity was recorded in the case of the sample CsI(C).
+• Evolution of the quantum efficiency of CsI in air.
+The evolution of the quantum efficiency after exposure to air is just a way to study the evolution of
+the quantum efficiency of the photocathode when it is left in a more aggressive environment.
+The different samples of CsI were just left in a protecting box, inside the clean room. So the samples
+are still in a controlled environment, but in particular there was no protection against moisture, which
+is known as the worst enemy of CsI photocathodes.
+It turns out the evolution of the quantum efficiency is much more dramatic, than when the photo-
+cathode is kept in vacuum (table 7.2):
+After one night in air, the intensity was 736 ± 36 pA, which corresponds to a relative drop of
+35 % of the quantum efficiency.
+After one month in air, the intensity was only 113± 5.6 pA. So only 10% of the original quantum
+efficiency was left.
+No change of intensity was recorded for the sample of CsI(C) in the same time. This is a further
+indication that the sample was already degraded at the time of the first measurement.
+112 Experimental tests and discussion of the results
+Time (in hours) Intensity measured (pA)
+Introduction 160± 8
+0.5 188± 9.4
+1 217± 10
+2 230± 11
+∞ did not increase further
+Table 7.3 : Evolution of the current returned by the sample CsI3(C) when placed in vacuum.
+7.3.2.2 The quantum efficiency of CsI3, its evolution in air and comparison with CsI.
+The quantum efficiency of CsI3 was evaluated the same way as CsI, except that in addition to
+those measurements, after exposure to air, CsI3 samples were eventually put back in an atmosphere
+saturated with I2 and then they were tested again.
+Following the evolution of the microstructure presented in the last section, there is an evolution of
+the CsI3 photocathode quantum efficiency when left in vacuum.
+As the CsI3 samples prepared do not all have the same microstructure, the quantum efficiencies
+of the various samples are not all equal. Yet they all follow the same trend concerning the evolution of
+their quantum efficiencies.
+First, the sample made of ”CsI3(C)” is detailed here. Then a comparison of the maxi-
+mum intensities of the different samples is given.
+The sample ”CsI3(C)”
+• Evolution of the quantum efficiency after introduction in the chamber under vacuum.
+The sample made of CsI(C), after it was tested as a CsI sample, was put in the presence of I2 vapors for
+two days, at a temperature of 40 °C. The obtained CsI3(C) was then tested.
+At the introduction in the chamber, the intensity was 160± 8.0 pA and rapidly evolved (table 7.3).
+The maximum intensity was then ∼ 230 ± 11 pA. The microstructure then corresponds to Figure
+7.10.
+No further evolution of the intensity was recorded, so the sample was removed from the chamber.
+• Evolution of the quantum efficiency when left in air.
+The sample was then left for a long period (1 month) in air in the clean room (storage in a plastic
+box). After only one day the sample had lost a great part of its quantum efficiency, for the measured
+intensity was then 93± 4.6 pA. This evolution did not go further, and after one month, the quantum
+efficiency was still 92± 4.6 pA (table 7.4).
+7.3 CsI3 as a new photocathodes material 113
+Time in air Intensity measured (pA)
+Introduction 230± 11
+1 day 93± 4.6
+30 days 92± 4.6
+Table 7.4 : Evolution of the current of the CsI3(C) sample after it was removed from vacuum, and
+left in air.
+Time (in hours) Intensity measured (pA)
+Introduction 160± 8
+0.5 260± 13
+1.5 299± 14
+3 314± 15
+4 320± 16
+15 340± 17
+∞ did not increase further
+Table 7.5 : Evolution of the quantum efficiency of the sample CsI3(C) in air after re-exposure to I2.
+• Evolution of the quantum efficiency after re-exposure of the sample to I2.
+Lastly the sample was put back in presence of I2 for a few days, and the quantum efficiency was
+retested. The quantum efficiency then evolved according to the data of table 7.5.
+In conclusion, the history of this particular sample can be plotted as in Figure 7.13.
+114 Experimental tests and discussion of the results
+Intensity
+(pA) Vacuum Air Vacuum I2 Vacuum
+320
+300
+280
+260
+240
+220
+200
+180
+160
+140
+120
+100
+80
+60
+40 Time
+(Hours)
+20
+1 Month
+1 2 3 4 1 Month1 2 1 2 3 4 5 6
+Figure 7.13 : Summary of the evolution of the quantum efficiency of the sample of CsI3(C) after first
+introduction in vacuum, one month stay in air, and re-exposure to I2.
+After the CsI sample was exposed to I2, there is an increase of efficiency when it is left in vacuum. The
+sample then becomes sensitive to pollution, and an exposure to air results in a drop of efficiency.
+A re-exposure to I2 makes it possible to recover the lost efficiency, and is even beneficial, for the maximum
+intensity obtained is then higher than after direct introduction of the sample.
+A further cycle of exposure to I2 and stay in vacuum gave the same results.
+CsI crystal from St Gobain.
+As already explained, the performances of the CsI crystal by St Gobain could not be measured,
+because of space charging. Only after it was exposed to I2 it became conductive enough to enable
+measurements.
+After a long exposure to I2, as highlighted by the microstructure and color changes, a part of the
+sample turned into CsI3.
+7.3 CsI3 as a new photocathodes material 115
+Time (in hours) Intensity measured (pA)
+Introduction 120± 6
+2 130± 6.5
+10 151± 7.5
+∞ did not increase further
+Table 7.6 : Evolution in vacuum of the intensity for the CsI(Tl) sample by St Gobain, after exposure to I2.
+The performances and behavior after exposure to vacuum and I2 of this sample are similar to those
+of the ”CsI(C)” and pressed pellet samples (table 7.6).
+Then, after only one week in air, the intensity recorded was only 68± 3.4 pA.
+After it was exposed to I2 for a few days, the intensity rose to approximately the same value of
+154± 7.7 pA again.
+So this sample follows the same trend as the previous one except that a second exposure to I2 does
+not enable a bettering of the efficiency, but only a recovery of this efficiency after pollution of the
+sample by air.
+Figure 7.14 : Exposure of the Luxel Sample to I2 in open air.
+The CsI photocathode from Luxel.
+An attempt was made to use the CsI photocathode from Luxel to make a CsI3 one, as with the crystal
+by St Gobain. Unfortunately, it turned out that the Aluminized mylar substrate used to grow the
+photocathode is very reactive to I2. It was not the CsI of the photocathode, which reacted with I2,
+but the aluminum of the substrate itself.
+So the only way to obtain a CsI3 photocathode from this sample was to put in open air, a solid iodine
+grain on the CsI deposited layer (Figure 7.14). The grains were deposited around the measured area,
+116 Experimental tests and discussion of the results
+Time (in hours) Intensity measured (pA)
+Introduction 390± 19
+1 412± 20
+2 580± 29
+4 812± 40
+∞ did not increase further
+Table 7.7 : Evolution in vacuum of the quantum efficiency of the porous CsI sample after exposure to I2
+Time (in hours) Intensity measured (pA)
+Introduction 120± 6.0
+0.5 141± 7.0
+2 177± 8.8
+4 200± 10
+∞ did not increase further
+Table 7.8 : Evolution of the current of the CsI3 pressed pellet in vacuum
+at a place invisible to the X-rays (far from the 7 × 7 mm² illuminated area). Table 7.7 gives the results
+of the measurements of the photocurrent.
+It is evident that such a method cannot guarantee a good homogeneity of the CsI3 surface. So the
+results of those measurements must be taken with caution.
+When the sample was removed from the chamber, it was completely white. So, if the value at the
+time of introduction is likely to be a measurement of the quantum efficiency of CsI3, then, the sample
+progressively changed back into CsI.
+This measurement was performed right after measuring the quantum efficiency of CsI, so the last
+value is a measurement of clean (less than a few minutes in air in total) but transformed -see struc-
+tural analysis- CsI.
+CsI3 pressed pellets
+The evolution of the quantum efficiency of the samples made of compacted CsI3 follows the same
+trend as those obtained from CsI exposed to I2. At the introduction, the samples typically return
+an intensity of 120± 6 pA, and this value rises in a few hours to typical values of 200± 10 pA (table
+7.8).
+In the meantime, as explained earlier, the surface changes color, and the microstructure evolves as
+depicted earlier.
+An attempt to study the long-term stability was made by leaving one of the samples
+of compacted CsI3 in vacuum. But after one week, two pumps had broken, so the experiment was
+stopped (it is likely that the I2 release was at the origin of this failure).
+Still, the transformation of this sample had probably gone deeper than with the other samples, and
+7.3 CsI3 as a new photocathodes material 117
+Intensity measured (pA)
+few hours 1 week
+188± 9.4 31± 1.5
+Table 7.9 : The photocurrent at the reintroduction of the CsI3 pressed pellets according to the time passed
+in vacuum, and after one month in air.
+Time in hours Intensity measured (pA)
+Time in vacuum before left in air few hours 1 week
+Introduction 130± 6.5 31± 1.5
+1 177± 8.8 32± 1.6
+2 257± 12 35± 1.7
+4 274± 13 37± 1.8
+∞ did not increase further did not increase further
+Table 7.10 : Recovery of the photocurrent in vacuum, for two CsI3 pressed pellets, which stayed a few hours
+or one week in vacuum, and then one month in air and two days in presence of I2.
+the color of the surface had changed to a brighter color than that of the samples which stayed only
+one or two complete days in vacuum.
+After this, the two samples (the one pumped 1 week, and the one pumped only for the primary
+measurements: few hours) were left for one month in a plastic box in the clean room, and were tested
+again.
+It turned out that the quantum efficiency of both samples evolved very differently.
+At their reintroduction in the chamber, the intensities were rather different (table 7.9):
+• The sample, which had stayed only a few hours in vacuum had an intensity of 188± 9.4 pA.
+• The sample, which had stayed one week in vacuum had an intensity of only 31± 1.5 pA.
+No real evolution was then recorded. So the samples were put in presence of I2 vapors. After two
+days, the sample which had been left only a few hours in vacuum was dark again, while
+the sample which had been left in vacuum for one week did not change color. The quantum efficiencies
+of the two samples were tested again (table 7.10).
+The sample which had stayed only a few hours recovered its quantum efficiency, like the other samples,
+while the one which had stayed a long time in vacuum kept a very low quantum efficiency. No further
+stay in I2 of the sample left 1 week in vacuum could change its color, and its quantum efficiency did
+not change either (same value of ∼ 35± 1.75 pA).
+Later, an attempt to remove the bright layer mechanically was successful: it detached easily when
+pressed by tweezers.
+The uncovered layer was then tested, and showed similar properties to those of the freshly made
+118 Experimental tests and discussion of the results
+sample.
+Summary
+The typical values obtained with the different samples can be found in the table 7.11.
+It appears that, despite the variations in the precise values, the general trend is the same for the
+different samples.
+Some general conclusions can be already given when looking at the different values:
+• Contrary to CsI, CsI3 seems to be insensitive to air.
+• The quantum efficiency of CsI3 is lower than clean CsI (from the Luxel sample, probably a
+factor 7), but better than exposed to air CsI.
+• When exposed to I2 and then put in vacuum at least twice, the quantum efficiency is increased.
+This does not further increase after two cycles yet.
+• A too long stay of CsI3 in vacuum makes the sensitivity to air rise, and I2 treatment does not
+enable to recover the best efficiency.
+Also, both ways to obtain CsI3 samples (from CsI and CsI3) seem to be equivalent as they offer
+similar values at the time of introduction.
+7.3.3 Analysis of the results obtained with CsI3
+The behavior of the CsI3 as a photocathode can be explained by a transformation of the outer layer,
+following the reaction
+$$\mathrm{CsI_3 \rightleftharpoons CsI + I_2} \qquad (1)$$
+The CsI3 samples, when put in vacuum transform according to the reaction (1) in the left to right
+direction, so a layer of fresh CsI is formed at the surface of the sample. This is visible by the change
+of color from dark red (CsI3) to yellow-white (CsI).
+The different tests with pure CsI and CsI3 show that CsI is a better emitter, so there is an increase
+of quantum efficiency when this reaction occurs, until all the CsI3 of the active layer of the photo-
+cathode has transformed into CsI.
+The reaction does not stop as the I2 released in the chamber is pumped, so the equilibrium vapor
+pressure is never reached. Eventually, a thick layer of CsI is formed on top of the sample, which
+corresponds to the one removed mechanically from the CsI3 pressed pellet after it stayed one week
+in vacuum.
+When left in a plastic box, there is no evolution of the microstructure, or of the emission character-
+istics, at least in the time scale of a few months. This indicates that when the equilibrium vapor
+pressure of I2 is reached, there is no evolution of CsI3.
+When I2 is released, there is a change of the surface microstructure as shown by the SEM pictures.
+This evolution is in favor of a greater quantum efficiency of the CsI left: the microstructure becomes
+7.3 CsI3 as a new photocathodes material 119
+Test of CsI Test of CsI3
+Before After After exposure After exposure After (re)exposure
+Samples
+exposure to air exposure to Air to I2 to air to I2
+CsI(C) 144± 7.2 91± 4.5 160± 8→ 230± 11 92± 4.6 340± 17
+CsI Crystal From Saint Gobain Charging 120± 6→ 151± 7.5 68± 3.4 154± 7.7
+CsI from Luxel 1140± 57→ 760± 38 113± 5.6 390 ∗ ±19→ 812± 40 370± 18 XXX
+± → ± short stay in vacuum 118± 5.9 270± 13CsI3 XXX ** 130 6.5 200 10 long stay in vacuum 31± 1.5 37± 1.8
+*: this value must be taken with caution.
+**: No sense.
+Table 7.11 : CsI3 measurements summary.
+120 Experimental tests and discussion of the results
+porous, which betters the quantum efficiency of CsI as already known.
+If the samples of CsI3 are left in air after a long stay under vacuum, the thick layer of CsI gets
+polluted and the quantum efficiency of the photocathode drops rapidly, like it does for pure CsI
+samples. After a short stay in vacuum, CsI3 seems to be less sensitive to air pollution.
+It seems that the state of degradation of the CsI layer (after a stay in air, so after exposure to
+moisture) has an impact on the possibility to re-transform in CsI3.
+In conclusion:
+• If the CsI3 did not stay too long in vacuum, it can be ”recovered” (the formed CsI layer can
+retransform in CsI3) even after a long stay in air.
+• If the CsI3 stayed a long time in vacuum, the recover can occur only after a short exposure to
+air.
+This indicates that exposure to I2 does not enable to regenerate a thick layer of degraded CsI (or
+that the reaction is much slower).
+7.3.4 Conclusion on the use of CsI3 as a photocathode
+The study performed on CsI3 shows that it is itself an interesting photocathode, providing a good
+quantum efficiency, and a good robustness to pollution and moisture. It has the disadvantage that it
+is unstable in vacuum, so it is mandatory to let the gas in the detector reach the equilibrium vapor
+pressure to enable its use as a photocathode.
+The most promising approach is its use as a precursor to CsI. Indeed, CsI3 is not an emitter
+as good as CsI in terms of quantum efficiency. But its instability under vacuum and its insensitivity
+to air degradation make it a very attractive choice to create porous CsI photocathodes.
+Indeed, as the material is very easy to manipulate in air, it is very easy to place the photocathode in
+gas-filled detectors. Then, simply pumping the chamber enables to obtain a porous CsI photocathode,
+which is the best photocathode available (eventually several cycles of pumping and exposure to I2
+can be necessary to obtain the best structure / quantum efficiency).
+Later maintenance operations are also easier to perform if the photocathode is first exposed to I2: it
+then transforms into CsI3, which makes it much more robust to air damage. This method does not
+make it possible to recover the efficiency of a CsI which was severely polluted, though.
+This study shows that CsI3 can potentially be a good way to fabricate porous CsI photocathodes.
+Bibliography
+[1] R.M.Bozorth et al., “Unknown title,” The Journal of American Chemical Society, vol. 47, p. 1561,
+1925. This reference could not be obtained.
+[2] H.A.Tasman et al., “Re-investigation of the crystal structure of csi3,” Acta Cryst., vol. 8, 59,
+pp. 59–60, 1955.
+[3] J.Runsink et al., “Refinement of the crystal structures of (C6H5)4AsI3 and CsI3 at 20 °C and at
+−160 °C,” Acta Cryst., vol. B28, pp. 1331–1335, 1972.
+[4] T.R.Briggs et al., “The polyiodides of cesium, cesium iodide, iodine, and water at 25oc,” The
+Journal of Physical Chemistry, vol. 34, pp. 1951 – 1960, 1930.
+[5] L.E.Topol et al, “Thermodynamic studies in the polyiodides systems rbi−rbi3, nh4i−nh4i3, csi−
+csi3, and csi3 − csi4.,” Inorganic Chemistry, vol. 7, pp. 451–454, 1968.
+[6] V.Dandendorf et al., “Progress in ultrafast csi-photocathode gaseous imaging photomultipliers,”
+Nucl. Inst. and Meth. A, vol. A308, pp. 519–532, 1991.
+[7] E.Shefer et al., “Photoelectron transport in csi and csbr coating films of alkali antimonide and
+csi photocathodes,” J.Appl.Phys., vol. 92(8), pp. 4758–4771, 1993.
+[8] A.Breskin et al., “New ideas in csi-based photon detectors: Wire multiplication and protection
+of the photocathode,” IEEE Trans.Nucl.Sci, vol. 42(4), pp. 298–305, 1995.
+[9] B.L.Henke et al., “The characterization of x-ray photocathodes in the 0.1-10kev photon energy
+range,” J.Appl.Phys., vol. 52(3), pp. 1509–1520, 1981.
+[10] J.E.Lees et al., “Thermally annealed soft x-ray photocathodes,” Nucl. Inst. and Meth. A, vol. 381,
+pp. 453–461, 1996.
+
+Chapter 8
+Conclusion
+The aim of this work was to develop new photocathodes with improved quantum efficiency and ro-
+bustness to allow their use as a first stage X-ray electron converter in gas-filled detectors.
+This implied both theoretical studies and practical experiments to identify the most promising tech-
+niques to develop such device.
+This work allowed the development of a simulation tool using a Monte Carlo method for prospecting
+new materials and structures. It turned out that the tool could not simulate properly the photocath-
+odes’ physics, leading to unreliable results. Deep investigations highlighted that it was the method,
+and not the specific program, which is inadequate for such simulations. The Monte Carlo method can
+be used to develop materials already well known and better understand them, by developing specific
+codes for these materials. Unfortunately, this approach is of no help to investigate prospective materials,
+whose properties are not known. This limit finds its root in the strong variation of the electron dy-
+namics in the bulk and at the surface of the material with its precise structure and chemical state. So
+any Monte Carlo study of a photocathode material implies a deep study of the material’s properties,
+which is just longer than a direct experimental study.
+Still the development of this tool helped in understanding the key parameters which govern one pho-
+tocathode quantum efficiency.
+In order to enable reliable tests of the quantum efficiency of the photocathodes, an experimental setup
+was developed and built. This setup showed excellent characteristics, as it was able to measure very
+weak photocurrents, while being very flexible. Currents of less than 1 fA were successfully measured.
+The setup then served as a basis for all study of the quantum efficiency of prospective photocathodes.
+The last part of the work consisted in developing methods to better the quantum efficiency of photo-
+cathodes. Various approaches were investigated, and eventually experimentally tested. In particular,
+the study of the impact of microstructures on the material efficiency was performed, and the in-
+124 Conclusion
+vestigation of a scintillator-low energy photocathode system was performed. The most promising
+approach, and which was more extensively investigated is the use of CsI3 as a precursor to CsI,
+which is currently the best known photocathode.
+The use of CsI3 as a photocathode is advantageous in several ways:
+• Contrary to CsI, CsI3 is not hygroscopic, and is rather resistant to pollution. Thus, it can be
+easily manipulated in air.
+• When put in vacuum, it releases I2, and transforms in CsI with a porous structure. Porous
+CsI is known for being the best photocathode in terms of quantum efficiency. So CsI3 is a way
+to obtain structured photocathodes, without using complex evaporation systems, which enable
+the growth of porous CsI photocathode. A simple deposition of CsI3 or even of unstructured
+CsI later exposed to I2 vapors is enough to obtain a structured CsI photocathode.
+• The reaction $\mathrm{CsI_3 \rightleftharpoons CsI + I_2}$ is reversible. So one can protect CsI from air pollution by
+exposing it to an atmosphere saturated with iodine. This is a very attractive method, for it
+dramatically simplifies the maintenance operations.
+So the use of CsI3 as a photocathode is technologically promising. It can lead to the fabrication
+of gas-filled detectors, which can answer the growing need of fast, large areas counting detectors in
+photon science...
+Further study will need to validate experimentally this approach to create and protect CsI photo-
+cathodes.
+Appendix A
+Detector characteristics
+A.1 Position resolution in the case of gas-filled detectors
+The spatial resolution gives information on the accuracy of the position returned by the detector.
+The position resolution is the result of four main contributions [1]:
+$$\sigma_{det} = \left(\sigma_{noise}^2 + \sigma_{diff}^2 + \sigma_{er}^2 + \sigma_{aval}^2\right)^{1/2}.$$
+where
+• σnoise is the r.m.s. contribution from the electronic noise. It depends on the type of readout.
+• σdiff is the contribution due to electrons diffusion.
+• σer is the contribution from Auger electrons and photoelectrons.
+• σaval is the contribution from avalanche centroid fluctuation. It is due to statistical variations
+and varies greatly with gas gain. It is often the main contributor and depends on both pressure
+and gas mixture.
+More details on each contribution can be found in [1] and in chapter 4 of [2].
+A.2 Energy Resolution
+The Energy resolution is usually defined as the full width half maximum of the spectral response of
+the detector to a given energy.
+Indeed, with an excellent precision (∼ 1%), the response has a Gaussian shape. More precisely, the
+resolution R is given by: $R = \sqrt{(\text{electronic noise})^2 + (\text{Fano})^2}$:
+→ Electronic noise gives the contribution of the electronic to the error of measurement. This
+term is itself the result of several contributions.
+→ Fano is the contribution due to the Fano Statistics: the generation of electrons and holes
+charges is the result of a statistical process. The energy of the incoming particle/photon is
+126 Detector characteristics
+shared between lattice excitation (∼ 2/3) and the generation of charge carriers (∼ 1/3). The
+resultant spread in energy is $\mathrm{FWHM}_{Fano} = 2.35\sqrt{F \varepsilon E}$ with ε being the charge pair creation
+energy (e.g. 3.63 eV/e-h for Si), F the Fano factor (F ≈ 0.12 for Si, F is not a constant), and
+E the energy.
+A.3 Space Charging in gas-filled detectors
+The space charging effect is important because it can be a physical limitation to counting rate char-
+acteristics. Two methods have been given by Sipila et al. in 1980 and later by Mathieson et al. in
+1992 [3, 4].
+It concerns the reduction of the electric field between the anode and cathode due to ions in the volume.
+This presence is unavoidable for the amplification process necessarily creates such ions (ionization
+avalanche). The two models calculate the effective field reduction at the anode surface.
+Bibliography
+[1] G.C.Smith, “Gas-based detectors for synchrotron radiation,” Journal of Synchrotron Radiation,
+vol. 13, pp. 172–179, March 2006.
+[2] G.F.Knoll, Radiation Detection and Measurement. Wiley, 2000.
+[3] H.Sipila et al., “Mathematical treatment of space charge effects in proportional counters,” Nucl.
+Inst. and Meth., vol. 176, pp. 381–387, 1980.
+[4] E.Mathieson et al., “Gain reduction due to space charge in a multiwire proportional chamber
+irradiated by a uniform beam of rectangular section,” Nucl. Inst. and Meth. A, vol. 316, pp. 246–
+251, 1992.
+
+Appendix B
+Monte Carlo Application Examples
+B.1 Simple Examples of statistical sampling methods
+In this section, some of the most classical examples of statistical sampling methods are given. Those
+methods can be considered as particular applications of the Monte Carlo Method1.
+B.1.1 Calculus of an integral
+As a first approach to the Monte Carlo method, an example of calculation of an integral is given:
+Let us assume the function Φ is to be integrated between a and b:
+$$\int_a^b \Phi(t)\,dt = \frac{b-a}{N}\sum_{i=0}^{N-1} \Phi(x_i) + O\!\left(\frac{1}{N}\right) \quad \text{with} \quad x_i = a + \frac{b-a}{N}\, i.$$
+This is the classical formula of the trapezoidal rule.
+Instead of a uniform sampling, imagine an evaluation where the positions {xi} are random numbers
+uniformly distributed in the interval [a, b]; this yields a Monte Carlo integration:
+$$\int_a^b \Phi(t)\,dt = \frac{b-a}{N}\sum_{i=1}^{N} \Phi(x_i) + O\!\left(\frac{1}{\sqrt{N}}\right) \quad \text{with} \quad a \le x_i \le b.$$
+In this particular example, the method appears to be less efficient than the trapezoidal rule, for its
+absolute error is in $1/\sqrt{N}$ instead of $1/N$. Yet the Monte Carlo approach has a strong advantage
+over it: it is independent of the number of dimensions. So, contrary to the uniform sampling, which
+has an error scaling as $N^{-1/d}$, the Monte Carlo Method will stay with an error scaling as $N^{-1/2}$.
+This is a direct consequence of the central limit theorem.
+1The name statistical sampling method is used instead of Monte Carlo Method, for those methods were developed
+before the name Monte Carlo Method was given and presented as a general method.
+130 Monte Carlo Application Examples
+B.1.2 An historical example: Buffon’s needles
+One of the first statistical approaches to solve a mathematical problem is due to the mathematician
+Comte de Buffon.
+Figure B.1 : Georges Louis Leclerc Comte de Buffon Figure B.2 : The needle problem by Buffon
+He invented a method to calculate an approximation of π. Here is the problem he solved, which leads
+to the approximation method of π: if a needle of length l is dropped several times on a horizontal
+surface ruled with parallel lines separated by a distance d > l, what is the probability ℘ that the needle
+crosses one line?
+That outcome will happen only if 0 ≤ A ≤ d and 0 ≤ θ < π.
+If we assume that the vector (A, θ) is randomly distributed on the region [0, d[×[0, π[, then the
+probability density function is $\frac{1}{d\pi}$, and the probability that the needle crosses the line is:
+$$\wp = \int_0^{\pi}\int_0^{l\sin\theta} \frac{1}{d\pi}\, dA\, d\theta$$
+So the probability is $\wp = \frac{2l}{d\pi} = \frac{E(M)}{n}$ if M is the random variable for the number of times the needle
+crosses the line, and n the number of drops.
+It appears that $\frac{n}{E(M)}\,\frac{2l}{d}$ is a statistical estimator for π. So to determine π, one can evaluate E(M),
+which is easily done, just dropping needles.
+Développement de photocathode de meilleures
+efficacités quantiques pour détecteurs à gaz
+Résumé en français.
+Introduction
+Ce travail de thèse vise à explorer différentes voies d’amélioration de l’efficacité des photocathodes.
+Plus généralement, il prend place dans le développement de détecteurs à gaz de rayons X de grandes
+surfaces, susceptibles de répondre aux besoins croissants en matière de vitesse et de taille des détecteurs
+utilisés dans les domaines du médical et de la recherche mobilisant le rayonnement synchrotron.
+Les photocathodes pour détecteurs à amplification par gaz
+Détecteurs à 2 dimensions
+Les détecteurs à 2 dimensions (ou à 1 dimension) sont par opposition aux détecteurs ponctuels
+capables de fournir une information spatiale sur la particule détectée.
+Ce type de détecteur présente l’énorme avantage qu’il dispense de systèmes mécaniques pour couvrir
+l’ensemble de l’espace (dans le cas de l’espace réel comme réciproque). Ainsi il est possible d’effectuer
+beaucoup plus rapidement les expériences d’imagerie. Certaines expériences nécessitent même l’utili-
+sation de détecteur 2D, soit pour des raisons de temps d’exécution autrement trop longs (cas de la
+tomographie 3D par exemple) soit même pour des raisons de dégradation de l’échantillon qui ne peut
+supporter le faisceau qu’un temps très court (notamment dans les domaines de la biologie ou dans le
+cas des analyses médicales !).
+Les de´tecteurs a` amplification par gaz
+Les de´tecteurs a` amplification par gaz (aussi appele´s  de´tecteurs gazeux ), sont parmi les plus
+vieux syste`mes de de´tection de rayonnement ionisant. Ils sont en particulier les premiers a` avoir offert
+132 Re´sume´
+une de´tection e´lectronique du passage d’un rayonnement ou d’une particule ionisante.
+L’exemple le plus ce´le`bre de ce type de de´tecteur est le Tube Geiger introduit par Geiger et Mueller
+en 1928 apre`s que Geiger et Rutherford aient de´couvert le principe de la multiplication e´lectronique
+dans un gaz.
+Ces de´tecteurs sont base´s sur une multiplication interne des e´lectrons ionise´s a` la suite d’un de´poˆt
+d’e´nergie par la particule/le rayonnement traversant le gaz. Cette multiplication des e´lectrons est
+rendue possible par la pre´sence d’un champ e´lectrique au sein de la chambre a` gaz, qui acce´le`re
+les charges pre´sentes. Si l’e´nergie cine´tique gagne´e par ces charges entre deux collisions avec une
+mole´cule du gaz est supe´rieure a` l’e´nergie d’ionisation d’une particule de gaz (typiquement 35eV),
+alors la particule devient susceptible d’ioniser une particule de gaz, et est donc a` la source d’une
+cascade d’ionisation. L’augmentation exponentielle du nombre de charges permet alors une de´tection
+aise´e par simple collection des charges sur des e´lectrodes.
+Les de´tecteurs a` gaz constituent maintenant une technologie mature. Ils ont comme avantage principal
+de permettre la fabrication de de´tecteurs de grande dimension et rapides a` un couˆt acceptable, tout
+en permettant un fonctionnement en comptage (par opposition aux de´tecteurs fonctionnants avec
+des e´crans fluorescents, qui impliquent un mode d’ope´ration en inte´gration, et donc un bruit plus
+important).
+Ils pre´sentent aussi des inconve´nients, notamment un phe´nome`ne de parallaxe, qui de´grade fortement
+la re´solution dans le cas des incidences obliques, et une efficacite´ quantique limite´e notamment aux
+e´nergies supe´rieures a` 10keV. En effet, l’efficacite´ d’absorption du gaz augmente avec la pression,
+alors que l’efficacite´ d’amplification est optimum pour les faibles pressions.
+Une approche pour contrebalancer ces deux inconve´nients, consiste en l’utilisation de photocathodes
+solides comme convertisseurs photon → e´lectrons, permettant ainsi une se´paration (et donc une
+optimisation se´pare´e) des deux fonctions d’absorption et d’amplification.
+Les photocathodes de´die´s a` une utilisation dans des de´tecteurs a` gaz
+Les photocathodes permettent une conversion de la lumie`re incidente en e´lectrons par le biais de
+l’effet photoe´lectrique.
+Les photocathodes ont principalement e´te´ utilise´es au sein de photomultiplicateurs, dans lesquels elles
+sont couple´es a` une se´rie de dynodes, capables d’amplifier fortement le signal e´lectrique.
+Le me´canisme qui me`ne a` l’e´jection de l’e´lectron a` l’exte´rieur de la photocathode est en fait complexe :
+l’e´lectron(s) e´mis a` la suite de l’absorption par effet photoe´lectrique du photon incident subit une se´rie
+d’interactions avec les autres e´lectrons pre´sents dans le mate´riau et perd rapidement cette e´nergie.
+Au cours de ce trajet, il ionise lui-meˆme d’autres atomes et cre´e ainsi une se´rie d’e´lectrons chauds
+secondaires au sein du mate´riau. Eventuellement, un ou plusieurs de ces e´lectrons peuvent atteindre
+la surface et quitter la photocathode.
+Cependant, pour quitter le mate´riau, l’e´lectron doit passer une barrie`re de potentiel appele´e affinite´
+e´lectronique dans le cas des semi-conducteurs, ou travail de sortie dans le cas des me´taux. Du fait
+de leur thermalisation rapide apre`s e´jection de l’atome, peu d’e´lectrons peuvent effectivement passer
+cette barrie`re et les rendements d’e´mission sont en ge´ne´ral faibles.
+133
+Les photocathodes pre´sentant les meilleurs rendements pre´sentent la particularite´ de pre´senter une
+affinite´ e´lectronique ne´gative. Ainsi, les e´lectrons chauds pre´sents dans le mate´riau sont facilement
+e´jecte´s et les rendements sont e´leve´s. Cependant, ces mate´riaux pre´sentent aussi une grande sensibilite´
+a` toute forme de pollution de leur surface, qui leur fait perdre cette affinite´ e´lectronique ne´gative.
+En conclusion, ide´alement une photocathode pour de´tecteurs a` gaz pre´sente les caracte´ristiques sui-
+vantes :
+Une affinite´ e´lectronique ne´gative : afin de laisser sortir un maximum d’e´lectrons chauds cre´e´s
+a` la suite de l’absorption du photon incident.
+Un grand pouvoir d’arreˆt : afin de garantir que les photons seront absorbe´s pre`s de la surface
+d’e´jection des e´lectrons. Le pouvoir d’arreˆt est en ge´ne´ral plus e´leve´ avec des e´le´ments de nume´ro
+atomique Z e´leve´.
+Une faible re´activite´ chimique : afin d’e´viter une trop grande sensibilite´ de la photocathode a` la
+pollution par le gaz utilise´ pour l’amplification du signal (en particulier, les ions ge´ne´re´s lors de
+l’avalanche e´lectronique sont une grande source de pollution).
+Modalite´s de l’e´tude de photocathodes a` efficacite´ quantique supe´rieure
+L’e´tude entreprise lors du travail de the`se comporte trois e´tapes principales :
+1. Une e´tude the´orique des photocathodes. En particulier un code de simulation par Monte Carlo
+a e´te´ de´veloppe´ pour simuler l’efficacite´ des photocathodes.
+2. L’e´tude et la fabrication d’un dispositif expe´rimental permettant de tester concre`tement des
+photocathodes.
+3. L’e´tude de diffe´rentes me´thodes pour ame´liorer l’efficacite´ des photocathodes, et l’e´tude de
+nouveaux mate´riaux potentiellement bons photo-e´metteurs.
+Chacune de ces e´tapes est de´crite brie`vement ci-dessous.
+Le de´veloppement d’un code de simulation par me´thode Monte Carlo
+introduction a` la me´thode Monte Carlo
+A la suite de sa premie`re utilisation au cours du Projet Manhattan a` Los Alamos au lendemain de la
+seconde guerre mondiale pour le de´veloppement de la bombe nucle´aire ame´ricaine, la me´thode Monte
+Carlo pour la simulation du transport de particules dans la matie`re est devenue un outil standard de
+la physique des particules.
+Cette me´thode permet de rendre compte de l’aspect ale´atoire de l’interaction des particules avec la
+matie`re. Elle consiste a` simuler le trajet des particules en calculant la probabilite´ d’interaction d’une
+particule au moyen d’un ge´ne´rateur de nombres ale´atoires, et des densite´s de probabilite´s d’interac-
+tions pour chacun des me´canismes d’interaction connus. Ces densite´s de probabilite´s sont e´value´es au
+moyen des tables de sections efficaces, qui sont des grandeurs expe´rimentales.
+134 Re´sume´
+le code de´veloppe´
+Le de´veloppement d’un code de simulation par Monte Carlo est un projet tre`s ambitieux en soi, aussi
+une librairie standard de simulation par Monte Carlo a-t-elle e´te´ utilise´e pour e´crire le code.
+Le choix a e´te´ porte´ sur Geant4, une librairie de´veloppe´e par un consortium de laboratoires et pilote´e
+par le CERN. L’ensemble du code ainsi qu’une documentation de´taille´e est disponible sur le site du
+CERN, ce qui a fortement participe´ a` la popularite´ du code, outre ses performances de simulations
+reconnues.
+En particulier, c’est la pre´sence de plusieurs bibliothe`ques de´die´es aux basses e´nergies qui a justifie´
+l’adoption de Geant4 comme base du code.
+Les simulations devaient permettre de pre´dire le gain en efficacite´ de certaines microstructures, et de
+pre´dire les efficacite´s quantiques de certains mate´riaux encore non e´tudie´s.
+Malheureusement, il s’est ave´re´ que le code e´tait beaucoup trop impre´cis pour mener a` bien ce type
+de calcul. Les efficacite´s pre´vues par le code se sont ave´re´es comple`tement fausses dans un certain
+nombre de cas de´ja` connus.
+Une e´tude plus approfondie a montre´ que la simulation de photocathodes est actuellement impossible
+avec ce type de simulations. Deux facteurs principaux expliquent cela :
+Les tables de sections efficaces utilise´es par les codes Monte Carlo sont trop impre´cises. En effet,
+l’obtention de valeurs de sections efficaces a` basse e´nergie est beaucoup plus difficile qu’a` haute
+e´nergie, du fait du nombre d’interactions que subissent les particules a` ces e´nergies. De ce fait,
+les tables de sections efficaces a` basse e´nergie sont base´es sur des mode`les semi-empiriques, et
+sont entache´es de nombreuses incertitudes.
+L’approche interaction particule/atome qui est utilise´e est globalement trop grossie`re : elle ne
+permet pas de rendre compte efficacement de l’e´tat chimique du mate´riau et de sa surface. En
+particulier, l’e´tat de surface, qui s’ave`re eˆtre une donne´e cruciale n’est pas mode´lisable par une
+approche purement atomistique.
+Le code n’a donc pas pu eˆtre utilise´ pour effectuer des simulations de photocathodes.
+Etude et construction d’un dispositif expe´rimental
+Afin de pouvoir tester expe´rimentalement les photocathodes envisage´es, un dispositif adapte´ a e´te´
+cre´e´.
+Il consiste essentiellement en une chambre a` vide munie de connecteurs et d’une feneˆtre adapte´e, et
+d’un ampe`reme`tre tre`s pre´cis : la chambre posse`de une fine feneˆtre de beryllium permettant de laisser
+passer une large proportion du flux de rayons X. Des connecteurs triaxs permettent de connecter
+directement sur la chambre le pre´-amplificateur associe´ a` l’ampe`reme`tre. Au sein de la chambre,
+l’ensemble des pie`ces supportant la photocathode au plus pre`s de la feneˆtre est re´alise´ en PEEK,
+mate´riau pre´sentant a` la fois une grande durete´ et une re´sistance e´lectrique e´leve´e. Une grille de
+collection est monte´e environ 5mm au-dessus de la photocathode teste´e. Enfin, un connecteur CF
+standard permet la connexion a` une pompe.
+135
+L’ampe`reme`tre utilise´ est un Keithley 6430. Cet appareil est capable de mesurer des courants infe´rieurs
+au fA, graˆce a` la pre´sence d’un pre´-ampli exte´rieur, qui permet d’approcher autant que possible les
+connecteurs de la source de courant.
+Le dispositif de mesure a e´te´ teste´ avec succe`s avec une source radioactive a` des courants de l’ordre
+de 0,5fA. Le courant de fuite e´tant infe´rieur a` 10% de la valeur mesure´e.
+Cependant, le dispositif a e´te´ essentiellement utilise´ avec un tube conventionnel de rayons X, cathode
+de cuivre. L’ensemble des ope´rations de montages du dispositif et des e´chantillons s’est de´roule´ en
+salle blanche.
+Les photocathodes e´tudie´es et leur efficacite´
+Principalement deux approches ont e´te´ adopte´es pour ame´liorer l’efficacite´ des photocathodes exis-
+tantes :
+– L’e´tude de certaines microstructures et de leurs effets
+– L’e´tude de nouveaux mate´riaux
+Des microstructures pour ame´liorer les mate´riaux de´ja` connus
+L’effet de microstructures sur l’efficacite´ des e´missions a e´te´ e´tudie´.
+Deux types d’effets ont e´te´ recherche´s :
+– Un effet purement ge´ome´trique afin de profiter de l’augmentation du rendement d’e´mission dans le
+cas d’incidence oblique.
+– Un effet d’e´mission de champ a e´te´ recherche´ par l’e´tude de micro-pointes de silicium.
+Emission de champ
+Dans le cas de structures tre`s pointues, telles que des pointes de silicium, il se produit une concentra-
+tion du champ e´lectrique aux alentours de la pointe. L’ide´e e´tait donc de profiter de cette concentration
+du champ e´lectrique normalement utilise´ pour faire migrer les e´lectrons photo e´mis vers la grille de
+collection, pour e´tudier un e´ventuel phe´nome`ne d’augmentation du rendement d’e´mission par effet de
+champ.
+Malheureusement, aucun courant n’a pu eˆtre de´tecte´ par ce biais. C’est probablement le faible pouvoir
+stoppant du silicium qui peut expliquer la tre`s faible efficacite´ quantique du silicium dans ce cas. En
+effet, si les e´lectrons sont cre´e´s trop loin de la surface de la photocathode, une tre`s faible proportion
+d’entre eux parvient a` la surface, ce qui se traduit par un rendement global tre`s faible.
+Effet de l’angle
+Dans le cas d’une incidence oblique des rayons X sur la surface du mate´riau, il se produit une
+augmentation du rendement de la photocathode. En effet, une plus large proportion (facteur 1/cos α
+si α est l’angle d’incidence vis-a`-vis de la normale a` la surface) des photons est absorbe´e au sein de
+la zone active de la photocathode (imme´diatement a` proximite´ de la surface). Il s’en suit donc une
+augmentation du nombre d’e´lectrons qui peuvent s’e´chapper.
+136 Re´sume´
+L’effet de structures, facile a` obtenir sur de larges surfaces (il s’agissait en fait de papier de verre clas-
+sique ou de type Trizact), a re´ve´le´ que l’on obtient facilement un doublement de l’efficacite´ quantique
+avec de simples structures pyramidales re´gulie`rement place´es a` la surface de la photocathode.
+Le CsI3 comme nouveau mate´riau de photocathode
+Le mate´riau le plus efficace actuellement connu est le CsI. En effet, ce sel de deux compose´s de
+nume´ro atomique Z e´leve´ pre´sente un pouvoir stoppeur important, double´ d’une affinite´ e´lectronique
+ne´gative.
+De ce fait, le CsI peut revendiquer des efficacite´s de plusieurs pour-cents a` des e´nergies de quelques
+keV.
+Malheureusement, comme tous les mate´riaux a` affinite´ ne´gative, il est aussi fortement sensible a` la
+pollution due a` son environnement, et, a` moins de le laisser sous ultra-vide (ce qui est re´alisable au
+sein des photomultiplicateurs scelle´s) son utilisation ne peut eˆtre envisage´e au sein d’un de´tecteur a`
+gaz (et ce malgre´ de tre`s nombreuses e´tudes dans ce sens).
+En substitution a` ce mate´riau, le CsI3 : un de ses de´rive´s, peut constituer une alternative inte´ressante.
+Le CsI3 est un mate´riau de couleur marron-orange´, instable sous vide (il se de´compose selon la
+re´action CsI3 → CsI + I2), pre´sentant une densite´ de 4,51 g·cm−3. C’est un cristal dont la structure
+appartient au groupe Pmcn.
+Le mate´riau est commercialise´ par des entreprises telles que Sigma-Aldrich ou peut eˆtre obtenu en
+mettant un e´chantillon de CsI au sein d’une atmosphe`re sature´e d’iode.
+Les tests du CsI3 ont montre´ une efficacite´ intrinse`que inte´ressante, qui de plus augmente apre`s
+quelques heures place´ sous vide (pression de l’ordre de 10−4 mBar).
+Une e´tude plus pousse´e de ce mate´riau a permis d’e´tablir un sce´nario permettant d’expliquer cette
+ame´lioration.
+Lorsque la photocathode est laisse´e sous vide, le CsI3 se de´compose en CsI. Ceci explique l’ame´lioration
+de l’efficacite´ alors constate´e, en effet le CsI est actuellement le meilleur mate´riau connu pour la
+constitution de photocathodes. Il pre´sente cependant le de´faut d’eˆtre particulie`rement sensible a` la
+pollution par le milieu, et en particulier, il est tre`s hygroscopique.
+A l’inverse le CsI3 semble eˆtre particulie`rement peu sensible a` la pollution. Il peut de plus eˆtre
+re´ge´ne´re´ apre`s un passage sous vide (et donc la transformation de sa surface en CsI) par mise dans
+une enceinte contenant de l’iode solide, et donc ou` la pression partielle de I2 est importante.
+L’e´tude a aussi montre´ une modification de la structure de la surface qui prend un caracte`re poreux
+lors de la transformation CsI3 → CsI + I2. Ainsi, lorsque le processus de mise en contact avec I2
+puis mise sous enceinte sous vide est re´pe´te´, l’efficacite´ s’en trouve ame´liore´e.
+L’utilisation de CsI3 comme pre´curseur du CsI est donc inte´ressante en soi, car elle permet une
+structuration du CsI. On perd cependant la plus grande insensibilite´ du CsI3 en regard a` celle du
+CsI. Ainsi, meˆme si le CsI pur est plus efficace que le CsI3 (facteur 8 environ), une fois pollue´, le
+CsI est beaucoup moins efficace que le CsI3.
+Cette approche peut s’ave´rer tre`s utile pour permettre l’utilisation du CsI comme photocathode dans
+137
+le cas des de´tecteurs a` gaz. En effet il est possible de fabriquer les de´tecteurs munis de la photocathode
+sous forme de CsI3 ce qui permet sa manipulation sous air. Ensuite, le de´tecteur e´tant herme´tique,
+la transformation du CsI3 en CsI permet l’obtention d’une photocathode pre´sentant un caracte`re
+poreux, et donc d’une grande efficacite´. Ceci apporte aussi une solution au proble`me de la maintenance
+qui ne´cessite souvent l’ouverture du de´tecteur. On peut en effet prote´ger la photocathode de CsI en
+l’exposant pre´alablement a` de l’iode (I2) ce qui la rend re´sistante a` l’humidite´. Ainsi il n’est plus
+ne´cessaire d’ouvrir le de´tecteur en enceinte prote´ge´e de l’humidite´.
+
+Acknowledgements / Remerciements
+The first thanks of course go to my supervisor Menyhert Menhard Kocsis.
+Not much to say, apart that I would not have done much without his help and support. He did not
+help only for the work, but he also showed great courage to defend me at a moment I had a very bad
+time.
+Thanks a lot Menhard !
+I would like to thank then people in chronological order :
+Mes parents, ma famille pour leur soutien avant et pendant ce travail.
+Mes grands parents car ils ont eu une importance de´cisive dans mes choix d’e´tude, et l’orien-
+tation que j’ai donne´e a` mon travail.
+Mlle. Lenoble ma professeur de physique en classe de 1e`re qui a su rendre une matie`re alors
+bien fatiguante beaucoup plus attractive ! Vous voyez Mlle. Lenoble, j’ai fini par vous e´couter et aller
+chercher tout seul les re´ponses aux questions auxquelles la physique n’a pas encore re´pondu...
+Julie ! Et oui elle a certainement duˆ m’aider meˆme lorsque je ne m’en rendais pas compte...
+My colleagues from the ESRF :
+The whole ISG group.
+In particular Christophe, Francis, Thierry, Cedric who provided me with a great and constant support
+and taught me so much.
+Also thanks a lot to Joel, Jose-Maria, Emmanuel, Laurent, Marc, Paul-Antoine, Pablo, Herve, Ri-
+cardo, Jean-Claude, John, Ernesto, Cyril, Roland, Jean-Jacques, Denis... And last, as a former guy
+140 Thanks / Merci !
+from ISG, Heinz who certainly had a peculiar place in this work...
+Narayanan for being my tutor during this PhD. Thesis.
+The Scisoft Group In particular Claudio and Romeu for sharing their knowledge concerning the
+Monte Carlo method and programming.
+The whole id15 beamline For their support each time they could give me a hand.
+And also : Irina for the SEM images, Harald for the help in preparing the samples in the chemistry
+lab, Gemma for the access to the die/press, Elizabeth for her help in preparing job interviews, Philippe
+for providing me with a Pump, Fabienne for her daily help, and her bread ! Delphine for her help with
+the administration from the University, Werner for his help with the mechanical pieces, Stephanie
+and Patrick for the help with the safety aspects...
+.. Guillaume, Andy, Virgile, Anne, Alex, Sylvain, Manuel, Chantal, Julio, Jorge, Davide, Valentina,
+Simo, Moritz, Paul-Antoine, Paul, Adeline, Oier, Gemma, Florian, Yvonne, Frank, Delphine, Pas-
+cal, Benoit, Sebastian, Sebastian (bis), Ioana, Olivia, Irmi, Jean-Michel, Wolfgang, Claudio, Romeu,
+Rainer, Olivier, Mohamed, Bertrand, Christian, Julia, Peter, Till, Andreas, Stefen, Alex, Roberta,
+Caroline, Elizabeth, Benedicte, Jose, Riccardo, Kieran, Nicolas... and those I forget, but who still
+have a place in my heart !
+for all the good moments I had at the ESRF.
+Mes tuteurs de l’Universite´
+Vincent Comparat et Johann Collot qui ont assure´ le suivi acade´mique et ont e´te´ de patientes
+et passionnantes sources de conseils pour ce travail de the`se.
+,
diff --git a/examples/theses/TH2013PEST1177.pdf b/examples/theses/TH2013PEST1177.pdf
new file mode 100644
index 00000000..f9462e78
Binary files /dev/null and b/examples/theses/TH2013PEST1177.pdf differ
diff --git a/examples/theses/TH2013PEST1177/fulltext.pdf b/examples/theses/TH2013PEST1177/fulltext.pdf
new file mode 100644
index 00000000..f9462e78
Binary files /dev/null and b/examples/theses/TH2013PEST1177/fulltext.pdf differ
diff --git a/examples/theses/TH2013PEST1177/fulltext.pdf.txt b/examples/theses/TH2013PEST1177/fulltext.pdf.txt
new file mode 100644
index 00000000..430a9e50
--- /dev/null
+++ b/examples/theses/TH2013PEST1177/fulltext.pdf.txt
@@ -0,0 +1,4937 @@
+Bio-methanation tests and mathematical modelling to
+assess the role of moisture content on anaerobic
+digestion of organic waste
+Flavia Liotta
+To cite this version:
+Flavia Liotta. Bio-methanation tests and mathematical modelling to assess the role of mois-
+ture content on anaerobic digestion of organic waste. Earth Sciences. Universite´ Paris-Est;
+Universite´ de Cassino, 2013. English. <NNT : 2013PEST1177>. <tel-00967951>
+HAL Id: tel-00967951
+https://tel.archives-ouvertes.fr/tel-00967951
+Submitted on 31 Mar 2014
+HAL is a multi-disciplinary open access L’archive ouverte pluridisciplinaire HAL, est
+archive for the deposit and dissemination of sci- destine´e au de´poˆt et a` la diffusion de documents
+entific research documents, whether they are pub- scientifiques de niveau recherche, publie´s ou non,
+lished or not. The documents may come from e´manant des e´tablissements d’enseignement et de
+teaching and research institutions in France or recherche franc¸ais ou e´trangers, des laboratoires
+abroad, or from public or private research centers. publics ou prive´s.
+Joint PhD degree in Environmental Technology
+Docteur de l’Université Paris-Est
+Spécialité : Science et Technique de l’Environnement
+Dottore di Ricerca in Tecnologie Ambientali
+Degree of Doctor in Environmental Technology
+Thèse – Tesi di Dottorato – PhD thesis
+Flavia Liotta
+ 
+Bio-Methanation tests and Mathematical Models to assess the effect of moisture content 
+on anaerobic digestion of complex organic substrates 
+ 
+Defended 12/12/2013 
+ 
+In front of the PhD committee  
+ 
+Dr. Renaud Escudiè Reviewer 
+Prof. Francesca Malpei Reviewer 
+Dr. Hab.E.D. Eric van Hullebusch Co-Promotor 
+Prof. dr.ir. Piet N.L. Lens Co-Promotor 
+Dr. Giovanni Esposito Promotor 
+Prof. Massimiliano Fabbricino Co-Promotor 
+ 
+Erasmus Joint doctorate programme in Environmental Technology
+for Contaminated Solids, Soils and Sediments (ETeCoS3)
+  
+	  	  	  	  	  	  	  	  	  	  	  “Love	  the	  truth,	  show	  yourself	  as	  you	  are,	  without	  claim,	  without	  fears	  and	  cares.	  And	  if	  the	  truth	  
+costs	  you	  persecution,	  accept	  it,	  and	  if	  the	  torment,	  bear	  it.	  And	  if	  for	  the	  truth	  you	  have	  to	  sacrifice	  
+yourself	  and	  your	  life,	  be	  strong	  in	  your	  sacrifice”.	  
+	  
+San	  Giuseppe	  Moscati	  	  	  	  	  	  	  
+	   	  	  
+To my family, my beloved husband Claudio and
+my son Carlo who is still in my belly.
+	  	  	  
+	  	  
+	  
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   i	  i	   	   	   	   	  
+ Acknowledgment 
+ 
+I would like to thank the European Commission for providing financial support through the Erasmus 
+Mundus Joint Doctorate Programme ETeCoS3 (Environmental Technologies for Contaminated Solids, 
+Soils and Sediments) under the EU grant agreement FPA No 2010-0009 and the French Ministry of 
+Foreign Affairs in the framework of MOY Programme under Moy Grant N°2010/038/01. 
+My gratitude also to the committee members, Dr. Renaud Escudiè and Prof. Francesca Malpei for their 
+helpful comments, constructive criticisms and valuable discussions.  
+I also would like to thank my PhD Supervisors, Prof. Giovanni Esposito and Prof. Massimiliano 
+Fabbricino for their invaluable suggestions, patient advices and continuous encouragement extended 
+throughout three years of this research. My special thanks go also to Prof. Francesco Pirozzi, Prof. Piet 
+Lens, Prof. Eric van Hullebusch and Prof. Patrice Chatellier for supporting me during my PhD mobility 
+and for scientific contribution on my research.  
+Special thanks to all friends, MariaRosaria, Jaka, Alberto, Stefano, Antonio, Anish, Rosita and Mario, 
+who were working with me in DIGA Department of University Federico II of Napoli and in DIMSAT 
+Department of University of Cassino and Lazio Meridionale. 
+Special thanks also to Ludovico, the head of the LARA (Laboratory of Environmental analysis and 
+research) for helping me with patience and enthusiasm in sample analysis and equipment operation.  
+I also would like to thank Luigi for all useful suggestions for the research and his help on mathematical 
+modelling and paper writing.    
+I can not forget all my international friends, in particular Rohan, Anna, Wendy, Alexandra and Mani, 
+who I met during my mobility period in UNESCO-IHE and in University of Paris Est, with whom I 
+shared my research and moments of fun! 
+To conclude, thanks to my parents, my sister and Claudio for supporting and encouraging me during my 
+PhD studies. 
+I would like also to express my thanks to God for giving me the inspiration, courage and the patience 
+during the course of these three years and to little Carlo, who has yet to be born but accompanied me on 
+the last months of my PhD studies. So small, but he already gave to me the power for a brilliant final 
+defence and the hope for a prosperous and smiley future. 
+	  	  
+ 
+	   i	  ii	   	   	   	   	  
+ PhD Thesis Index 
+Abstract .................................................................................................................................................... 1 
+Sommario ................................................................................................................................................. 2 
+Resumè ..................................................................................................................................................... 4 
+Samenvatting ........................................................................................................................................... 5 
+Chapter 1. Introduction .......................................................................................................................... 7 
+1.1 Problem Description ..................................................................................................................... 8 
+1.2. Objectives of the Study ................................................................................................................ 9 
+Chapter 2. Effect of moisture content on wet anaerobic digestion of complex organic substrates 12 
+2.1 Introduction ................................................................................................................................. 13 
+2.2. Materials and Methods .............................................................................................................. 15 
+2.2.1 Digester set-up and analytical measurements ........................................................................ 15 
+2.2.2 Preliminary tests: Drying procedure ...................................................................................... 15 
+     2.2.3 Effect of particle size on AD ................................................................................................. 17 
+     2.2.4 Effect of moisture content on AD ......................................................................................... 19 
+     2.2.5 Mathematical model .............................................................................................................. 19 
+2.3. Results and discussions .............................................................................................................. 21 
+2.3.1 Effect of particle size on AD performance ............................................................................ 21 
+     2.3.2. Effect of TS content on AD performances ........................................................................... 23 
+2.4. Modelling results ........................................................................................................................ 24 
+2.4.1. Modelling the effect of particle size on AD .......................................................................... 24 
+2.4.2. Modelling the effect of TS on AD ........................................................................................ 27 
+2.5 Conclusion .................................................................................................................................... 30 
+Chapter 3. Effect of moisture content on anaerobic digestion of food waste .................................. 32 
+3.1. Introduction ................................................................................................................................ 33 
+3.2. Materials and Methods .............................................................................................................. 34 
+    3.2.1 Experimental set-up ............................................................................................................... 34 
+    3.2.2. Substrate and inoculum preparation ...................................................................................... 35 
+    3.2.3. Analytical methods ............................................................................................................... 36 
+       3.2.3.1 Methane production ......................................................................................................... 36 
+       3.2.3.2 VFAs analysis .................................................................................................................. 36 
+       3.2.3.3 Other parameters .............................................................................................................. 37 
+3.3. Results and Discussion ............................................................................................................... 37 
+   3.3.1 Bio-methane production .......................................................................................................... 37 
+   3.3.2 VFAs production ..................................................................................................................... 39 
+3.4 Conclusions .................................................................................................................................. 44 
+Chapter 4. Effect of moisture content on anaerobic digestion of rice straw. .................................. 45 
+4.1 Introduction ................................................................................................................................. 46 
+4.2. Material Methods ....................................................................................................................... 47 
+   4.2.1 Experimental set-up ................................................................................................................ 47 
+   4.2.2. Substrate and inoculum preparation ....................................................................................... 47 
+   4.2.3. Analytical methods ................................................................................................................ 48 
+     4.2.3.1 Methane production, COD, TS, VS. ......................................................................................... 48 
+     4.2.3.2 VFAs and phenols analysis ................................................................................................. 48 
+4.3. Results and Discussion ............................................................................................................... 49 
+   4.3.1 Methane production ................................................................................................................ 49 
+   4.3.2 Analysis of process intermediates ........................................................................................... 51 
+4.4 Comparative process efficiency ................................................................................................. 55 
+4.5. Conclusions ................................................................................................................................. 55 
+Chapter 5. Modified ADM1 for dry and semi-dry anaerobic digestion of solid organic waste ..... 57 
+5.1 Introduction ................................................................................................................................. 58 
+5.2 Model description ........................................................................................................................ 59 
+5.3 Model calibration ........................................................................................................................ 63 
+5.4. Results and discussion ............................................................................................................... 68 
+5.5 Conclusion .................................................................................................................................... 71 
+Chapter 6. Literature Review .............................................................................................................. 72 
+6.1 Mathematical modelling of aerobic plug flow reactor and non-ideal flow reactor .............. 73 
+    6.1.1 Introduction ............................................................................................................................ 73 
+    6.1.2. Design models and performance-prediction models ............................................................. 74 
+6.1.3 Modeling approaches ............................................................................................................. 76 
+6.1.4.Mathematical modeling of Activated Sludge plug flow reactors .......................................... 79 
+   6.1.4.1 Process description ........................................................................................................... 79 
+6.1.5. Model development ............................................................................................................... 80 
+   6.1.5.1 Ideal PFR and CSTR in series .......................................................................................... 80 
+   6.1.5.2 Non ideal flow reactor models ......................................................................................... 82 
+   6.1.5.3 Computational fluid dynamics model development ........................................................ 84 
+   6.1.5.4 Models comparisons ........................................................................................................ 86 
+6.1.6. Mathematical modeling of fluidized bed reactors ................................................................. 86 
+   6.1.6.1 Process description ........................................................................................................... 86 
+   6.1.6.2 Model development .......................................................................................................... 87 
+      6.1.6.2.1 Ideal flow reactor models ........................................................................................... 87 
+      6.1.6.2.2 Non ideal flow reactor models ................................................................................... 88 
+      6.1.6.2.3 Models comparisons .................................................................................................. 90 
+6.1.7 Mathematical modeling of biofilter reactors .......................................................................... 90 
+   6.1.7.1 Process description ........................................................................................................... 90 
+   6.1.7.2 Model development .......................................................................................................... 91 
+   6.1.7.2.1 Ideal flow reactor model ............................................................................................... 91 
+   6.1.7.2.2 Non-ideal flow reactor model ....................................................................................... 92 
+   6.1.7.2.3 Models comparisons ..................................................................................................... 95 
+6.1.8 Model comparisons and validation and calibration ............................................................... 96 
+   6.1.8.1 Models comparisons ........................................................................................................ 96 
+   6.1.8.2 Activated sludge reactor ................................................................................................... 98 
+      6.1.8.2.1 Ideal PFR and CSTR in series .................................................................................... 98 
+      6.1.8.2.2 Non ideal flow reactor models ................................................................................... 99 
+    6.1.8.3 Fluidized Bed Reactors ................................................................................................. 100 
+    6.1.8.4 Biofilter reactors ........................................................................................................... 101 
+6.2 Mathematical modelling of anaerobic plug flow reactor and non-ideal flow reactor .... 104 
+   6.2.1 Introduction ....................................................................................................................... 104 
+   6.2.2 Mathematical modelling of UASB Reactors .................................................................... 104 
+      6.2.2.1 Hydrodynamic based models ............................................................................................ 106 
+      6.2.2.2 Models coupling hydrodynamic with anaerobic digestion conversions ...................... 111 
+     6.2.2.3 Models comparisons .................................................................................................... 112 
+  6.2.3.  Mathematical modelling of Anaerobic Biofilters ............................................................ 113 
+     6.2.3.2 Models comparisons .................................................................................................... 116 
+  6.2.4 Mathematical modeling of Anaerobic Biological Fluidized Bed Reactors ....................... 116 
+     6.2.4.1 Models comparisons .................................................................................................... 118 
+  6.2.5. Mathematical modeling of wet and dry digesters treating bio-solids ............................... 119 
+     6.2.5.1 Models comparisons .................................................................................................... 123 
+  6.2.6. Model comparisons and validation and calibration .......................................................... 123 
+     6.2.6.1 Models comparisons .................................................................................................... 123 
+     6.2.6.2 UASB reactor model validation and calibration .......................................................... 123 
+     6.2.6.3 Anaerobic Biofilters model validation and calibration ................................................ 125 
+     6.2.6.4 Anaerobic Fluidized Bed Reactor model validation and calibration ........................... 127 
+     6.2.6.5 Wet and dry digesters model validation and calibration .............................................. 128 
+  6.2.7. Conclusion ........................................................................................................................ 129 
+Chapter 7. Discussion and Conclusions ............................................................................................ 130 
+References ............................................................................................................................................ 135 
+	   	   v	   i	   	   	   	   	  
+ 	  
+	  Abstract  
+Dry Anaerobic Digestion (AD) presents different advantages if compared to wet AD, i.e. smaller 
+reactor size, lesser water addition, digestate production and pretreatment needed, although several 
+studies have demonstrated that water promotes substrate hydrolysis and enables the transfer of process 
+intermediates and nutrients to bacterial sites. 
+To better understand the role of water on AD, dry and semidry digestion tests of selected complex 
+organic substrates (food waste, rice straw, carrot waste), with various TS contents of the treated 
+biomass have been carried out in the present study. The results confirm that water plays an essential 
+role on the specific methane production rate, final methane yield and Volatile Solids (VS) 
+degradation. The final methane yield in semi-dry and dry conditions was 51% and 59% lower for rice 
+straw and 4% and 41% lower for food waste, respectively, if compared with wet conditions.  
+Inhibition tests, based on Volatile Fatty Acid (VFA) analysis, were carried out to investigate the 
+specific inhibition processes that take place with the selected substrates at different TS contents. In 
+wet AD of carrot waste no VFA accumulation was found, and all VFA concentrations were lower than 
+the inhibition limits. A direct correlation between TS content and total VFA (TVFA) concentration 
+was noticed for rice straw and food waste AD. For rice straw a maximum TVFA concentration of 2.1 
+g/kg was found in dry condition, 1 g/kg in semidry conditions and 0.2 g/kg in wet conditions, whereas 
+for food waste the TVFA concentration was 10 g/kg in dry condition, 9 g/kg in semidry conditions 
+and 3 g/kg in wet conditions.  
+A mathematical model of complex organic substrate AD in dry and semidry conditions has been 
+proposed to simulate the effect of TS content on the process. The data obtained from batch 
+experiments, in terms of methane production and VFA concentrations, were used to calibrate the 
+proposed model. The kinetic parameters of VFA production and degradation, calibrated using the 
+experimental data, proved highly dependent on the TS content and different from wet AD literature 
+values. This is due to VFA accumulation in dry conditions, which implies lower values of the kinetic 
+constants, introduced in the model as a function of the TS content.  
+Finally, as dry AD usually takes place in Plug Flow (PF) reactors, an historical and critical review of 
+the role of hydrodynamics in PF bioreactors has been carried out.  
+	   	   1	   	   	   	   	   	  
+ Sommario  
+ 
+La digestione anaerobica (DA) a secco presenta diversi vantaggi rispetto a quella ad umido legati alla 
+riduzione delle dimensioni del reattore, al minore consumo di acqua, alla più facile gestione del 
+digestato prodotto, e alla mancata richiesta di pretrattamenti. Al contempo, tuttavia, il minor contenuto 
+di umidità può comportare dei problemi nello svolgimento delle reazioni di trasformazione, giacché 
+l’acqua promuove l’idrolisi dei substrati in trattamento, ha una azione di diluizione nei confronti di 
+eventuali intermedi di processo che potrebbero inibire il metabolismo microbico, e permette il 
+passaggio dei nutrienti e dei metaboliti attraverso il protoplasma cellulare.  
+Per meglio comprendere il ruolo dell’acqua sulla DA sono state effettuate prove di digestione batch a 
+secco, semi-secco, ed umido, adoperando tre substrati diversi, vale a dire: scarti alimentari misti, 
+paglia di riso e carote. Ai substrati è stato aggiunto un inoculo pre-digerito, il cui contenuto di solidi 
+sospesi è stato opportunamente variato attraverso un processo di disidratazione. I risultati ottenuti 
+hanno confermato che l’acqua svolge un ruolo fondamentale nello sviluppo del processo, 
+influenzando sia il tasso di produzione specifica di metano che la produzione complessiva di 
+quest’ultimo, oltre che le cinetiche di degradazione del substrato, e quindi il rendimento di riduzione 
+dei Solidi Volatili.  
+Nello specifico, prendendo a riferimento la produzione complessiva di metano ottenuta nel processo 
+ad umido, adoperando come substrato la paglia di riso i valori sono risultati ridotti di circa il 50% 
+nella digestione a semi-secco, e di circa il 60% nella digestione a secco. La riduzione è risultata meno 
+sensibile nel trattamento degli scarti alimentari misti, per i quali si è avuto un decremento del 4% nel 
+corso del processo a semi-secco, e di poco più del 40% nel corso del processo a secco.  
+Il monitoraggio della concentrazione degli acidi grassi volatili (AGV) nel corso delle prove ha 
+consentito di evidenziare gli eventuali accumuli di composti inibitori in funzione del substrato trattato 
+e della concentrazione di solidi totali (ST). A riguardo si è osservato che nel caso della DA ad umido 
+delle carote, non si è avuto alcun accumulo di AGV e tutte le concentrazioni misurate sono risultate 
+sempre inferiori al valore limite d’inibizione. Nel caso della DA della paglia di riso e del rifiuto 
+alimentare, è stata invece individuata una relazione lineare tra il contenuto di ST e la concentrazione 
+di AGV. Più in dettaglio per la paglia di riso è stato trovato un valore di concentrazione massimo degli 
+AGV pari a 2,1 g·kg⁻¹ nel processo a secco, ed un valore minimo di 0,2 g·kg⁻¹ nel processo ad umido, 
+mentre nel processo a semi-secco la concentrazione si è attestata su un valore intermedio, pari ad 1 
+g·kg⁻¹. Nel caso degli scarti alimentari le concentrazioni rilevate sono state di 10 g·kg⁻¹ nella digestione a 
+secco, di 9 g·kg⁻¹ nella digestione a semi-secco, e di 3 g·kg⁻¹ nel processo ad umido.  
+I risultati ottenuti nel corso delle prove sperimentali sono stati interpretati alla luce di un modello 
+matematico all’uopo sviluppato, in grado di simulare il processo di digestione di substrati organici 
+complessi, tenendo conto del diverso contenuto dei ST che caratterizzano i processi a secco, semi-
+secco ed umido. La calibrazione del modello, effettuata sulla base di valori misurati relativi alla 
+produzione di metano ed alla concentrazione degli AGV, ha consentito di verificare come i parametri 
+cinetici relativi alla produzione ed alla degradazione di tali acidi siano fortemente dipendenti dal 
+contenuto di ST, e, nel caso dei processi a basso contenuto di umidità, notevolmente diversi dai dati 
+proposti in letteratura per la DA ad umido. Questo risultato è legato all’accumulo di acidi che 
+comporta una riduzione delle cinetiche di degradazione dei substrati organici complessi di partenza e 
+dei successivi intermedi delle trasformazioni in fase acquosa. Considerato che la DA a secco viene 
+solitamente sviluppata in reattori con flusso a pistone, la parte conclusiva del lavoro è stata infine 
+dedicata all’analisi storico-critica dei lavori presenti in letteratura relativi alla modellazione 
+idrodinamica dei processi biologici, ed al ruolo che le diverse configurazioni reattoristiche possono 
+avere nello sviluppo delle cinetiche di trasformazione, nell’ottica di porre le basi per una modellazione 
+completa della digestione a secco, comprensiva sia della parte idrodinamica che di quella biochimica.  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   3	   	   	   	   	   	  
+Résumé 
+La méthanisation par voie sèche possède différents avantages par rapport à la méthanisation par voie 
+humide. Les réacteurs sont plus petits, les besoins en eau sont moindres, la production de digestat et le 
+prétraitement nécessaire sont également moins importants. Cependant, plusieurs études ont démontré 
+que l'eau favorise l'hydrolyse du substrat et permet le transport des sous-produits d’hydrolyse et des 
+nutriments vers les bactéries. 
+Pour mieux comprendre le rôle de l'eau lors de la méthanisation, des tests de digestion sèche et semi-
+sèche à partir de substrats organiques complexes (déchets alimentaires, paille de riz, déchets de 
+carotte), avec différentes teneurs en matière sèche de substrat traité ont été réalisés. Les résultats 
+confirment que l'eau joue un rôle essentiel sur le taux de production spécifique de méthane, le 
+rendement final de méthane généré et la dégradation de la matière volatile sèche (MVS). Le 
+rendement final de méthane produit dans des conditions semi-sèches et sèches est respectivement de 
+51% et de 59% inférieur avec la paille de riz et 4% et 41% de moins pour les déchets alimentaires en 
+comparaison avec des conditions humides. 
+Des tests d'inhibition basés sur l’analyse des acides gras volatils (AGV) ont été menés pour étudier 
+les processus d'inhibition spécifiques qui ont lieu avec les substrats sélectionnés à différentes teneurs 
+en matière sèche. Pour le cas de la méthanisation par voie humide des déchets de carotte, aucune 
+accumulation d’AGV n’a été trouvée, et toutes les concentrations d'AGV étaient inférieures aux seuils 
+d'inhibition. Une corrélation directe entre la teneur en matière sèche et la concentration totale d’AGV 
+(AGVtot) a été mise en évidence pour la paille de riz et les déchets alimentaires. Pour la paille de riz, 
+une concentration d’AGVtot maximale de 2,1 g / kg a été trouvée pour la voie sèche, 1 g / kg dans les 
+conditions semi-sèches et 0,2 g / kg dans les conditions humides, alors que pour les déchets 
+alimentaires la concentration d’AGVtot était de 10 g / kg à l'état sec, 9 g / kg dans les conditions semi-
+sèches et 3 g / kg dans les conditions humides. 
+Un modèle mathématique de la méthanisation de substrats organiques complexes dans des conditions 
+sèches et semi-sèches a été proposé pour simuler l'effet de la teneur en matière sèche sur le processus. 
+Les données obtenues à partir d'expériences en mode batch, en termes de production de méthane et de 
+concentration d'AGV, ont été utilisées pour calibrer le modèle proposé. Les paramètres cinétiques de 
+production et d’élimination d’AGV ont été calibrés à l'aide des données expérimentales, et il a été 
+montré qu’ils sont fortement dépendants de la teneur en matière sèche et différents des valeurs de la 
+littérature concernant la méthanisation par voie humide. Cela est dû à l'accumulation d’AGV dans les 
+conditions sèches, ce qui implique d’utiliser des valeurs plus réduites concernant les constantes 
+d'inhibition introduites dans le modèle. 
+Enfin, comme la méthanisation par voie sèche a généralement lieu dans des réacteurs à écoulement 
+piston, une étude historique et critique de la littérature concernant la compréhension du rôle de 
+	  l'hydrodynamique dans des bioréacteurs à écoulement piston a été réalisée. 
+	  Samenvatting 
+Droge Anaërobe Vergisting (AD) biedt verschillende voordelen in vergelijking met natte AD: kleinere 
+reactorvolumes, minder water toevoeging, lagere digestaat productie en minder voorbehandeling nodig, 
+ondanks dat verscheidene studies hebben aangetoond dat water de substraat hydrolyse en de 
+uitwisseling van tussenproducten en nutriënten van en naar de bacteriële sites bevordert. 
+Om de rol van het water in AD beter te begrijpen, zijn in deze studie droge en halfdroge afbraaktests 
+uitgevoerd met geselecteerde complexe organische substraten (voedselafval, rijststro en wortelafval), 
+met verschillende Totale Vaste Stof (TS) gehaltes van de behandelde biomassa. De resultaten 
+bevestigen dat water een essentiële rol speelt in de specifieke methaan productiesnelheid, de 
+uiteindelijke methaanopbrengst en de afbraak van de organische stof (VS). De uiteindelijke 
+methaanopbrengst onder semi-droge en droge omstandigheden was, respectievelijk, 51% en 59% 
+lager voor rijststro en 4% en 41% lager voor voedselafval in vergelijking met natte omstandigheden. 
+Remmingsproeven, gebaseerd op vluchtige vetzuren (VFA) analyses, werden uitgevoerd om de 
+specifieke remming van de geselecteerde substraten bij verschillende TS concentraties te 
+onderzoeken. Gedurende de natte AD van wortelafval werd geen VFA accumulatie gevonden, en de 
+VFA concentraties bleven lager dan de inhibitiewaarden. Bij de AD van rijststro en voedselafval werd 
+een direct verband tussen het TS gehalte en de totale VFA concentratie gevonden. De maximale totale 
+VFA concentratie bedroeg 2,1 g/kg voor rijststro bij droge, 1 g/kg bij halfdroge en 0,2 g/kg bij natte 
+AD, terwijl voor voedselafval de totale VFA concentratie 10 g/kg bij droge, 9 g/kg bij halfdroge en 3 
+g/kg bij natte AD bedroeg. 
+Een wiskundig model voor de AD van complexe organische substraten onder droge en halfdroge 
+condities werd ontwikkeld om het effect van de TS concentratie te simuleren. De data van 
+batchexperimenten, met name methaanproductie en VFA concentraties, werden gebruikt om het 
+ontwikkelde model te kalibreren. De kinetische parameters van VFA productie en afbraak, 
+gekalibreerd met experimentele data, bleken sterk afhankelijk van de TS concentratie en verschilden 
+aanzienlijk van de natte AD literatuurwaardes. Dit komt door de VFA accumulatie onder droge 
+omstandigheden, dit leidt tot lagere inhibitiewaarden die in het model zijn opgenomen.  
+Ten slotte, omdat droge AD gewoonlijk plaats vindt in Plug Flow (PF) reactoren, werd een overzicht 
+van de geschiedenis van dit reactortype gemaakt en de rol van de hydrodynamica in deze PF 
+bioreactoren kritisch geëvalueerd. 
+	   	   6	   	   	   	   	   	  
+ 	  
+ 
+ 
+ 
+CHAPTER 1 
+                                                                                                               
+	  	  
+Introduction 
+	  	  	  	  	  	  	  	  
+	  	  
+	   	   7	   	   	   	   	   	  
+CHAPTER 1 - INTRODUCTION 
+1.1 Problem Description  
+ 
+Anaerobic Digestion (AD) is a biological process historically applied to wastewater treatment sludge, 
+that reduces Chemical Oxygen Demand (COD) of complex organic substrate and converts it into a gas, 
+which is mainly composed by methane and carbon dioxide. During this process organic matter is 
+progressively converted into simpler and smaller sized organic compounds obtaining biogas and 
+digestate as final products. This digestate is rich in nutrients and microelements and it is suitable for 
+utilization in agricultural contexts (Esposito et al. 2012a,b). Nowadays there is a pressing need to 
+manage correctly bio-waste from its generation stage to its safe disposal and to reduce its impact on 
+the environment. Therefore AD can be used as a biological treatment, as it is one of the best options to 
+achieve at the same time the objectives of the Kyoto Protocol and the EU Policies concerning 
+renewable energy and organic waste disposal. 
+Based on the solid content of the influent bio-waste, AD can be defined dry, semidry and wet. In dry 
+AD (high-solids digestion), the feedstock to be digested has a Total Solids (TS) content higher than 
+15%. In semidry AD the solid substrate to be digested has a TS content ranging between 10%-15%. In 
+contrast, wet AD (low-solids digestion) deals with diluted feedstock having a TS content lower than 
+10% (Li et al. 2011; Zeshan and Annachatre, 2012). In the last decades, dry AD has got much 
+attention due to its many advantages: smaller reactor volume, reduced amount of water addition, 
+easier handling of digested residues, minimal nutrient loss (Karthikeyan and Visvanathan, 2012; 
+Zeshan and Annachatre, 2012) and simplified pre-treatments compared to wet systems. The only pre-
+treatment which is necessary before feeding the wastes into a dry AD reactor is the removal of coarse 
+materials larger than 40 mm (Vandevivere 1999). Because of the high viscosity of the treated bio-
+waste, in dry AD, the substrate moves via plug flow inside the reactor. Plug flow conditions within the 
+reactor offer the advantage of technical simplicity. They leave however the problem of mixing, which 
+is crucial to guarantee adequate inoculation and reduce acidification problems. 
+The economical differences between wet and dry systems are small, both in terms of investment and 
+operational costs. The differences between those systems are more substantial in terms of 
+environmental issues. For instance, while wet systems typically consume one m3 of fresh water per 
+ton of treated Organic Fraction of Municipal Solid Waste (OFMSW), the water consumption of their 
+dry counterparts is ten-fold less. As a consequence, the volume of wastewater to be discharged is 
+CHAPTER 1 - INTRODUCTION 
+several-fold less for dry systems (Vandevivere 1999).  
+Despite the listed advantages, the high solid content also entails several technical disadvantages 
+in terms of transport, handling and mixing compared to wet processes (Lissens et al. 2001; De Baere 
+et al. 2010; Bollon et al. 2013). Moreover the low amount of water affects the process development. 
+The water content in fact is a key parameter of dry AD as several studies have demonstrated that 
+water promotes substrate hydrolysis, enables the transfer of process intermediates and eases the 
+bacterial community's access to nutrients (Lay et al. 1997a, b; Mora-Naranjo et al. 2004; Pommier et al. 
+2007; Bollon et al. 2013).  
+The present study is aimed at better understanding the role of water on AD, discussing in detail the 
+experimental data obtained during dry and semidry digestion tests of selected complex organic 
+substrates by varying the TS percentages of the treated biomass. Obtained data are used to model the 
+effect of water content during dry AD. Moreover, considering, as mentioned previously, that dry AD 
+usually takes place in Plug Flow reactors, this study also analyses in detail the hydrodynamic conditions of 
+different bioreactors through an historical and critical literature review of the role of the 
+hydrodynamic behaviour on biological processes. This review was done to create the premises for the 
+development of a mathematical model able to simulate the dry AD in real biological reactor.  
+1.2. Objectives of the Study 
+The main objective of this research is to investigate the process performances of AD reactors, studying 
+the effect of moisture content on process development. The research was carried out at lab-scale in 
+batch reactor on the following substrates: rice straw and food waste. These two substrates were 
+selected because food waste is representative of readily biodegradable bio-waste, while rice straw is 
+representative of slowly biodegradable ones. Moreover both of them are produced in large amount and 
+there is a practical need to define a proper treatment for them. Further investigations are conducted on 
+carrot waste to study the effect of moisture content also in the case of wet AD and to analyse the effect 
+of particle size on methane production. This substrate was selected because it presents a shape and a 
+consistency that can be easily modelled. Mathematical modelling aimed at upgrading the Anaerobic 
+Digestion Model n. 1 (ADM1) proposed by Batstone et al. 2002 by considering the effect of moisture 
+on the process performances is also an objective of this thesis. The experimental data obtained during 
+batch studies were used to calibrate the proposed model. The specific objectives of the research are 
+CHAPTER 1 - INTRODUCTION 
+listed below: 
+• Assess the effect of moisture content on semidry and dry AD of a selected easily biodegradable 
+substrate (i.e. food waste); 
+• Model the dry AD of food waste and determine the kinetic parameters of the model by 
+considering the effect of moisture content; 
+• Assess the effect of moisture content on semidry and dry AD of slowly biodegradable 
+substrate, i.e. rice-straw; 
+• Model the dry AD of rice straw and determine the kinetic parameters of the model by 
+considering the effect of moisture content; 
+• Assess the effect of moisture content on wet AD of carrot waste; 
+• Model the wet AD of carrot waste and determine the kinetic parameters of the model by 
+considering the effect of moisture content; 
+• Identify possible process inhibitions that could occur in dry anaerobic conditions by 
+studying process intermediates, such as VFAs and model these parameters varying TS content.  
+• Review the hydrodynamic models described in literature for aerobic and anaerobic treatment of 
+wastewater to give the premises for the development of a coupled model able to simulate the 
+dry anaerobic digestion process, considering both the hydrodynamic conditions and the biochemical conversions. 
+The specific objectives are addressed in the following chapters of this thesis. Chapter 2 describes 
+the experimental and modelling results obtained on carrot waste wet AD. The batch test 
+results are used to discuss the effect of different particle size and moisture content on methane 
+production. In chapter 3, the experimental results obtained on wet, semidry and dry AD of food 
+waste are described. The effect of different moisture contents on methane production, VFA 
+concentration and anaerobic degradation in terms of VS and COD is discussed. In chapter 4, the 
+experimental results obtained on wet, semidry and dry AD of rice straw are described and 
+discussed following the same approach used in chapter 3 for food waste. In chapter 5, an up-
+graded version of the ADM1 model for dry and semidry anaerobic digestion is proposed. Model 
+CHAPTER 1 - INTRODUCTION 
+calibration is performed by fitting the experimental data (methane production and VFA 
+concentrations obtained during the batch tests described in chapter 3 and 4) on food waste and rice 
+straw in wet, semidry and dry AD conditions. In chapter 6, mathematical models of 
+anaerobic and aerobic non-ideal flow reactors in wastewater treatment are reviewed. Finally, in 
+chapter 7 an overall discussion and conclusion of the results is reported. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   1	   1	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+ 
+ 
+ 
+CHAPTER 2 
+Effect of moisture content on wet anaerobic digestion of complex 
+organic substrates 
+	   
+	  	  
+	  	  	  
+This chapter has been published as: 
+ 
+Liotta, F., d’Antonio, G., Esposito, G., Fabbricino, M., Frunzo, L., van Hullebusch, E. D., Lens, 
+N.L. and Pirozzi, F. (2014). Effect of moisture on disintegration kinetics during anaerobic 
+digestion of complex organic substrates. Waste Manage. Res. 32, 40-48. 
+	   	   1	   2	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+2.1 Introduction  
+Anaerobic digestion is a multi-step process, that involves several micro-organisms: hydrolytic, 
+fermentative, acetogenic and methanogenic bacteria. The limiting step of the AD process can not be 
+unequivocally defined. Acetogenesis (Hills and Robert 1981; Bryers 1985; Costello et al. 1991a, b; 
+Siegrist et al. 1993) and methanogenesis (Graef and Andrews 1974; Moletta et al. 1986; Smith et al. 
+1988), as well as hydrolysis (Vavilin et al. 2001) and disintegration (ADM1, Batstone et al. 2002, 
+Esposito et al. 2008, 2011a,b, 2012a,b), can constitute the rate-determining steps. 
+When considering complex organic matter, the hydrolysis of complex polymeric
+ substances becomes the rate-limiting step and modelling of this process has to be improved 
+(Pavlostathis and Giraldo-Gomez 1991; Vavilin et al. 1996b, 1997, 1999; Batstone et al. 2002). In 
+particular, several models showed that the presence of OFMSW particles can be better described with 
+the introduction of a disintegration step. This step individuates the physical break and transformation 
+of the complex organic matter in soluble particulate organics, and represents the rate-limiting step of 
+the process (Hills and Nakano 1984; Sharma et al. 1988; Esposito et al. 2008, 2011a, 2012a; Batstone 
+et al. 2002).  
+Several authors investigated the rate of hydrolysis and disintegration as a function of different 
+parameters such as pH, temperature, hydrolytic biomass concentration, type of particulate organic 
+matter and particle size (Pavlostathis and Giraldo-Gomez, 1991; Veeken et al. 1999; Hills and Nakano 
+1984; Esposito et al. 2008; Sharma et al. 1988; Sanders et al. 2000). However, it is less understood 
+how the TS content can affect hydrolysis and in particular the disintegration step of complex organic 
+substrate. There are several attempts in the literature to model the effect of moisture content on dry 
+and semi-dry AD process. In particular in their work, Abbassi-Guendouz et al. (2012), by the 
+application of ADM1 model, found a decreasing first-order hydrolysis rate constant for carbohydrates 
+by increasing TS content. This constant was calibrated using batch experimental data with cardboard 
+as initial substrate and imposing the TS content in the range of 15-30%. This finding is in agreement 
+with results presented by Bollon et al. (2011). There are also several attempts in literature to 
+investigate the effect of TS content on methane production by operating Specific Methanogenic 
+Activity (SMA) tests and by simulating experimental data by using the Gompertz model (Le Hyaric et 
+al. 2011; Le Hyaric et al. 2012; Lay et al. 1997a, 1997b, 1998). These authors suggested also that high 
+TS content could reduce substrate degradation, resulting in a lower methanogenic activity. These 
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+results are consistent with several studies performed by Qu et al. (2009), Fernández et al. (2010), 
+Forster-Carneiro et al. (2008), Pommier et al. (2007), who found a reduction of methane production 
+with higher TS. All these studies showed that the moisture content plays an essential role in the biogas 
+formation as the nutrients and substrates for the microorganisms must dissolve in the water phase before 
+they can be assimilated. Furthermore, the moisture content is an important factor also in the low-solids 
+(wet) anaerobic digestion because it supports the bacterial movement and helps substrate and product 
+diffusion through the porous medium (solid waste) to bacterial cell membrane (Lay et al. 1997a; Lay 
+et al. 1997b; Mora Naranjo et al. 2004; Le Hyaric et al. 2012; Pommier et al. 2007).  
+The aim of this chapter is, therefore, to assess the impact of the moisture content on wet anaerobic 
+digestion of a selected complex organic substrate. To better evaluate the impact of the water content 
+on the AD performances, computer solution using a new version of the ADM1 of complex organic 
+substrate, proposed by Esposito et al. (2008, 2011a,b) is applied. The model is used to describe the 
+experimental data and to define the dependence of the disintegration kinetic parameter on the particle 
+size and moisture content. 
+More in detail, this chapter includes the following objectives: 
+• propose an experimental procedure for obtaining an inoculum at different moisture contents; 
+• investigate the effect of PS on the disintegration step of AD process of complex organic 
+matter, i.e. greengrocery waste (carrot waste); 
+• investigate the TS effect on methane production; 
+• propose a new mathematical modelling approach to describe the effect of TS on the 
+disintegration step of AD by using a new version of ADM1 model proposed by Esposito et al. 
+(2008, 2011a, b). 
+• determine the surface based kinetic constant for the cited selected substrate, using the model 
+proposed by Esposito et al. (2008). 
+ 
+	   	   1	   4	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+2.2. Materials and Methods 
+2.2.1 Digester set-up and analytical measurements 
+Biomethanation Tests (BMTs) were performed on a small scale under controlled and reproducible 
+conditions in a 1000 mL glass bottle GL 45 (Schott Duran, Germany). Small amounts of Na2CO3 
+powder were also added to control pH value. Each bottle was sealed with a 5 mm silicone disc that 
+was held tightly to the bottle head by a plastic screw cap punched in the middle (Schott Duran, 
+Germany). All digesters were immersed up to half of their height in hot water kept at a constant 
+temperature of 308.15 K by 200 W A-763 submersible heaters (Hagen, Germany). Once a day, each 
+digester was connected by a capillary tube to an inverted 1000 mL glass bottle containing an alkaline 
+solution (2% NaOH). The inverted 1000 mL glass bottle was sealed in the same way as the digesters. 
+To enable gas transfer through the two connected bottles, the capillary tube was equipped on both 
+ends with a needle sharp enough to pierce the silicone disc. The weight, TS and VS concentration of 
+the anaerobic sludge as well as the dry matter, moisture, organic matter and ash content of substrate 
+were determined according to Standard Methods (APHA/AWWA/WEF, 1998). Temperature and pH 
+of all mixtures investigated were monitored at least once a day with a TFK 325 thermometer 
+(WTW, Germany) and a pH meter (Carlo Erba, Italy), respectively (Esposito et al.  2012a). 
+ 
+2.2.2 Preliminary tests: Drying procedure 
+In order to evaluate the effect of different moisture contents during AD, experiments at different TS 
+contents are necessary. With the objective to evaluate only the effect of moisture content, these 
+experiments must be conducted using the same inoculum, at the same operational conditions, varying 
+only the TS content. Therefore fresh digestate was collected from a mesophilic AD of a buffalo farm 
+and stored in 10 L buckets at 4°C and used as inoculum source. The initial inoculum characteristics in 
+terms of TS, VS, carbohydrates fraction (Ch), proteins fraction (Pr) and lipids fraction (Li) are shown 
+in Table 1.  
+ 
+	   	   1	   5	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+Table 1. Main characteristics of Anaerobic Sludge 
+Sample  Initial TS [%]  Initial VS [%]  Ch [%]  Pr [%]  Li [%] 
+Wet anaerobic sludge 2 1.2 2.1 56 41.9 
+ 
+The inoculum was dried by testing three different procedures: overnight drying of fresh digestate at 
+50°C until constant weight, centrifugation with 6000 rpm, 10 min and membrane filtration with a 
+Kubota 203 microfiltration module. The selected drying procedures were aimed at removing water 
+from inoculum, obtaining a final value of 4% TS.  
+In order to evaluate the effects of different drying treatments, the concentrated inoculum was reported 
+at the initial TS content of 2% adding distilled water and was compared with the untreated inoculum 
+in terms of biomethane potential. The aim of these tests was to individuate the drying procedure that 
+does not modify the inoculum characteristics in terms of biomass activity and methane production. 
+Therefore the inoculum obtained from each adopted drying procedure was used to carry out BMTs. 
+These experiments were performed using pasta and cheese with known carbohydrate, protein and lipid 
+concentrations (Table 2). The choice of the substrates was aimed at balancing the quantity of 
+carbohydrates, proteins and lipids in the digester influent. The selected substrate allows the 
+development of all microbial species involved in degradation of carbohydrates, proteins and lipids in 
+order to evaluate the pre-treatment effect on all these species. 
+Table 2. Mass composition of organic substrate 
+Pasta [g] Cheese [g] Anaerobic Sludge [g] Na2CO3 [g] 
+2.63 5.24 500 0.32 
+ 
+The methane production is expressed under standard conditions and takes into account the gas content 
+variation in the headspace of the reactor. The calculated methane production accounts for the global 
+methane production without the residual endogenous methane production measured with the blank 
+assay, which represent the reactor filled only with digestate without substrate addition.  
+	   	   1	   6	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+5000  
+4000
+3000
+2000
+1000
+0  0 10 20 30 40 50 60 70
+Time [days]
+Thermal Filtration Centrifugation Untreated 	  
+Figure 1. Cumulative methane production of different tests. 
+ 
+Figure 1 shows the cumulative methane production obtained using the different inoculums resulting 
+from the different drying procedures and the untreated inoculum. The Bio-methanation Potential 
+(BMP) is the same for all tests, but only adopting the centrifugation it is possible to observe a similar 
+trend as for the untreated digestate. These results indicate that all the tested methods are suitable 
+drying procedures that do not change the inoculum characteristics. For the following experiments, 
+centrifugation was selected as drying procedure because it gives the minimum alteration of the 
+inoculum and it is the most simple and cheaper method to apply in the laboratory.  
+ 
+2.2.3 Effect of particle size on AD 
+Bio-methanation experiments were performed using a selected greengrocery waste 
+(i.e. carrot waste) as initial substrate, with the chemical composition in terms of TS, VS and 
+concentrations of carbohydrates, proteins and lipids reported in Table 3. This substrate was selected 
+for modelling purposes, due to the ease to obtain a cylindrical shape (Fig. 2). That shape was obtained 
+by using cylindrical steel tube with a selected diameter. For each particle the same diameter and 
+height was imposed in order to obtain a ratio between area and mass equal to a particle with spherical 
+shape. The tests were conducted using four different PS: 0.25 mm, 4 mm, 9 mm, 15 mm (Table 4). 
+	   	   1	   7	  	   	   	   	  
+CH4 [mL]
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+The selected ratio between organic matter and anaerobic sludge was 0.5 organic matter/anaerobic 
+sludge (i.e. Food/Mass ratio (F/M)). The selected digestate was collected from a mesophilic AD of a 
+farm treating buffalo manure. The mass composition adopted for all tests is described in Table 4. 
+BMTs were operated in triplicate and a blank assay was also carried out. In total 15 BMTs were 
+performed. 
+Table 3. Substrate characteristics. 
+Substrate  Initial TS [%]  Initial VS [%]  Ch [%]  Pr [%]  Li [%] 
+Carrot 12.7 11.4 0.121* 0.025* 0.006* 
+*Buffière et al. (2006). 
+Table 4. Composition of the organic mixture in terms of F/M ratio, PS, input substrate and inoculum 
+for the experiments T1-T4 
+Tests  F/M  Initial radius [mm]  Carrots [g]  Anaerobic sludge [g]  Na2CO3 [g] 
+T1 0.5 15 48.2 (±0.5) 500 (±1) 0.30-0.40 (±0.001) 
+T2 0.5 9 48.2 (±0.5) 500 (±1) 0.30-0.40 (±0.001) 
+T3 0.5 4 48.2 (±0.5) 500 (±1) 0.30-0.40 (±0.001) 
+T4 0.5 0.25 48.2 (±0.5) 500 (±1) 0.30-0.40 (±0.001) 
+ 
+	  
+Figure 2. Different PS of Carrots with cylindrical shape. 
+	   	   1	   8	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+2.2.4 Effect of moisture content on AD  
+BMTs were performed using carrot with a cylindrical shape and buffalo manure anaerobic digestate. 
+A specific value of PS = 15 mm was selected in order to get the disintegration step as rate limiting 
+step. 
+The initial TS content of the fresh digestate was 2%, that was dried by operating centrifugation in 
+order to obtain the desired moisture contents. A fixed amount of substrate was defined and 
+only the digestate volume was changed to obtain different moisture contents. All the tests were 
+performed imposing a selected ratio between organic matter and anaerobic sludge of 0.5 organic 
+matter/inoculum. All the tests were conducted in triplicate. A total of nine bottles were operated with 
+three TS contents: 4.98%, 7.5%, 11.3%. The mixture composition of each BMT test is reported in 
+Table 5. 
+Nine further tests were conducted using only anaerobic sludge as substrate to estimate the volume of 
+methane resulting from the fermentation of the organics contained in the anaerobic sludge. Totally 18 
+tests were performed. 
+Table 5. Mixture composition 
+Test  TS mixture [%]  VS mixture [%]  Carrot amount [g]  Dried anaerobic sludge [g] 
+T5 11.3 8.57 40 120 
+T6 7.5 4.6 40 245 
+T7 4.98 3.7 40 320 
+               
+2.2.5 Mathematical model  
+For better understanding the effect of TS and PS on the anaerobic degradation of complex organic 
+substrates, the anaerobic co-digestion model for complex organic substrates proposed by Esposito et 
+al. (2011a,b) was used. The model was calibrated with the experimental data of the batch experiments 
+to estimate the kinetic constant of the surface based disintegration process, $K_{sbk}$ ($M\,L^{-2}\,T^{-1}$). The 
+differential mass balance equations and the process kinetics and stoichiometry, described in detail in 
+Esposito et al. (2011a,b), are based on the ADM1 approach.  
+The disintegration kinetic is based on the surface-based kinetic expression proposed by Sanders et al. 
+	   	   1	   9	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+(2000) and reformulated by Esposito et al. (2008, 2011a,b) by including a*, which characterizes the 
+disintegration process: 
+$$a^* = \frac{A}{M} \qquad (1)$$
+$$\frac{dC}{dt} = -K_{sbk} \cdot a^* \cdot C \qquad (2)$$
+where: 
+C = concentration of the complex organic substrate in the digester [ML-3]; 
+A = disintegration surface area [L2]; 
+M = complex organic substrate mass [M]. 
+Assuming that all the organic solid particles have the same initial size and cylindrical shape with h = 
+2R, and that they are progressively and uniformly degraded, a* is given by the following 
+equation: 
+$$a^* = \frac{\sum_{i=1}^{n} A_i}{\sum_{i=1}^{n} M_i} = \frac{n A_i}{n M_i} = \frac{3}{\delta R} \qquad (3)$$
+where: 
+Ai = disintegration surface area of the organic solid particle i [L2]; 
+Mi = mass of the organic solid particle i [M]; 
+n = total number of organic solid particles [ad.]; 
+δ = complex organic substrate density [ML-3]; 
+R = organic solid particles radius [L], assumed to be time dependent according to the following 
+expression proposed by Sanders et al. (2000): 
+$$R = R_0 - \frac{K_{sbk}\, t}{\delta} \qquad (4)$$
+where: 
+R0 = initial organic solid particle radius [L], specified as the initial condition for model 
+application. 
+	   	   2	   0	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+The a* coefficient is different from the one proposed by Esposito et al. (2011a,b) as the solid particles 
+present a cylindrical instead of a spherical shape. 
+Integration of the differential algebraic equations is performed using a multi-step solution algorithm 
+based on the numerical differentiation formulas in the software tool MATLAB®. 
+Model calibration and validation were also performed to estimate $K_{sbk}$ ($M\,L^{-2}\,T^{-1}$), the kinetic 
+constant of the surface-based disintegration process.  
+Calibration was performed by comparing model results with experimental data of cumulative methane 
+production for a selected particle size and define the unknown parameter by fitting experimental data 
+with model results. 
+The calibration and validation procedure proposed by Esposito et al. (2011a,b) was performed. A 
+comparison between experimental data and model results was performed by applying the Root Mean 
+Square Error (RMSE) (Esposito et al. 2012a,b; Janssen and Heuberger 1995). 
+2.3. Results and discussions 
+2.3.1 Effect of particle size on AD performance  
+Figure 3 shows the cumulated methane production for the reactors operated at four different PS during 
+the whole experiments. Each curve represents the average of three replicates. The results clearly show 
+a different initial trend for the four curves indicating a cumulative methane production rate inversely 
+proportional to the PS. 
+The methane yield of all curves is in the range of 460(±30) mL/gVS. There are no large differences as 
+all reactors were filled with the same substrate amount (Fig. 3). 
+	   	   2	   1	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+4000  
+3000
+2000
+1000
+0  0 10 20 30 40 50 60 70
+Time [days]
+2.5 mm 4 mm 9 mm 15 mm 	  
+Figure 3. Effect of PS on the cumulative methane production  
+ 
+Figure 4 shows a logarithm relationship between PS and initial methane production rate for the 
+substrate added, evaluated by dividing the specific net methane production by the number of days (3 
+days) from the start of the experiment. Figure 4 indicates a strong impact of the PS on the kinetic 
+rates and individuates the disintegration process as the rate-limiting step for methane production. 
+These results are consistent with the findings of previous studies (Hills and Nakano 1984; Sharma et 
+al. 1988; Esposito et al. 2008, 2011a,b). Hills and Nakano (1984), plotting the methane gas production 
+relative to the parameter 1/ΦsDm (where Φs represents the sphericity of the particles and Dm the average 
+particle diameter), found a linear correlation between these parameters. A similar correlation was 
+implicitly considered in the model proposed by Esposito et al. (2008, 2011a). 
+70
+60
+50
+40
+30
+200.05 0.1 0.15 0.2 0.25 0.3 0.35 0.4
+1/D [mm-1] 	  
+Figure 4. Influence of particle size on initial methane production rate.  
+ 
+	   	   2	   2	  	   	   	   	  
+Initial methane production rate [$\mathrm{mL\,CH_4\,grVS_{in}^{-1}\,d^{-1}}$]
+CH4 [mL]
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+2.3.2. Effect of TS content on AD performances  
+Figure 5 shows the cumulated methane production for the reactors operated at 3 different TS contents 
+during the whole experiments. Each curve represents the average of 3 replicates. Lag-phase and the 
+initial methane production rate, resulted inversely proportional to the TS content. These results are 
+consistent with previous studies performed by Lay et al. (1997a,b), who made batch tests in 
+mesophilic digesters at different pH values by testing the effect of moisture content in the range of wet 
+digestion. The final methane yield, measured at the end of each experiment can be assumed for all 
+tests coincident and equal to the mean value of 450 mL/gVS with a standard deviation of 14.23 (Table 
+6). This is apparently not in agreement with the findings of Abbassi-Guendouz et al. (2012), 
+Fernández et al. (2008) and Dong et al. (2010), who found higher methane yields with lower TS in the 
+range of dry and semidry AD. The difference is due to the different moisture content range 
+investigated, as the present experiments were carried out in wet conditions. The conversion of acids to 
+methane by methanogenic bacteria can thus be influenced by the lack of water (Lay et al. 1997b; 
+Ghosh 1985) that can occur with higher TS content in the range of dry and semidry digestion 
+(Abbassi-Guendouz et al. 2012; Fernández et al. 2008; Dong et al. 2010). 
+3500  
+3000
+2500
+2000
+1500
+1000
+500
+0  0 5 10 15 20 25 30 35 40 45 50 55
+Time [days]
+4.95% 7.50% 11.50% 	  
+Figure 5. Effect of TS on the cumulated methane production from anaerobic digestion of carrots 
+waste. 
+ 
+Figure 6 indicates a linear relationship between TS content and initial methane production rate. Such 
+linear relationship was observed also by Lay et al. (1997b) on AD of selected dry organic waste (e.g. 
+sludge cake, meat, carrot, rice, potato and cabbage), Le Hyaric et al. (2012) on AD of cellulose, 
+	   	   2	   3	  	   	   	   	  
+CH4 [mL]
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+Abbassi-Guendouz et al. (2012) on AD of cardboard, Mora-Naranjo et al. (2004) for waste samples 
+excavated from landfill and Pommier et al. (2007) for paper waste. The presented results confirm that 
+the TS content, also in wet AD, has a strong effect on the kinetic rates. In particular, at lower TS, due 
+to the increasing water content and better transport and mass transfer conditions, it seems to be 
+plausible that the microorganisms are better sustained with soluble substrates (Mora-Naranjo et al. 
+2004). 
+50  
+40
+IMPR=-740.3TS+84.34
+30 R2=0.9987
+20
+10
+0  4 5 6 7 8 9 10 11 12
+TS [%]
+Experimental data Regression line  
+Figure 6. Influence of the TS on initial methane production rate. 
+ 
+Table 6. Cumulative methane production. 
+TS mixture [%] 4.98 7.5 11.3 
+Cumulative methane production [mL] 3410 3210 2830 
+Cumulative methane production of blank [mL] 1340 1230 725 
+Net cumulative methane production [mL] 2070 1980 2105 
+Specific Final Methane Yield [mL/gVSfeed] 455 430 460 
+                           
+2.4. Modelling results 
+2.4.1. Modelling the effect of particle size on AD  
+Model calibration was used to estimate the kinetic constant of the surface based disintegration 
+process, $K_{sbk}$ ($M\,L^{-2}\,T^{-1}$). Calibration was performed by comparing model results with experimental 
+measurements of methane production and adjusting the unknown parameters until the model results 
+adequately fit the experimental observations. The measured data of experiment T1 (Table 7) were 
+	   	   2	   4	  	   	   	   	  
+Initial methane production rate [$\mathrm{mL\,CH_4\,grVS_{in}^{-1}\,d^{-1}}$]
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+used, and a calibration procedure introduced by Esposito et al. (2011a,b) was applied. Using the 
+previously calibrated Ksbk model, validation was performed by calculating RMSE for T2, T3 and T4 
+experiments. 
+The model calibration performed resulted in setting the kinetic constant Ksbk equal to 0.28 kg m-2s-1. 
+This is the Ksbk value that minimizes the RMSE (Fig. 7), whose curve shows a single trend reversal (i.e. a 
+single minimum), proving the existence of one and only one solution to the specific optimization problem. 
+In Figure 8A a good overlap between the simulated and experimental data is shown. A small shift between 
+experimental data and model results was observed. 
+0.025
+0.02
+0.015
+Ksbk=0.28
+RMSE=0.063
+0.01
+0.005 0.25 0.5 0.75 1
+Ksbk[kgm-2s-1] 	  
+Figure 7. Calibration procedure for PS = 15 mm: dependence of RMSE on Ksbk. 
+ 
+(A) (B)
+0.2 0.16
+0.15 0.12
+0.1 0.08
+0.05 0.04
+0 0
+0 10 20 30 40 50 60 70 0 0.04 0.08 0.12 0.16
+Time [d] Measured CH4 [mol] 	  
+Figure 8. Comparison of measured and simulated cumulative methane production for experiments 
+with PS = 15 mm: overlapping between measured and simulated data (a); comparison between 
+simulated and experimental data with line of perfect fit (b). 
+The results of experiments T2, T3 and T4 were used to validate the mathematical model, assessing the 
+agreement between simulated and observed data for the cumulative methane production with the 
+	   	   2	   5	  	   	   	   	  
+CH4 [mol] RMSE
+Simulated CH4 [mol]
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+parameter RMSE. Figures 9, 10 and 11 show a very good agreement between the simulated and 
+experimental data. This agreement is confirmed in Table 8, where the values of a* constant evaluated 
+for different PS are also reported.  
+(A) (B)
+0.2 0.16
+0.15 0.12
+0.1 0.08
+0.05 0.04
+0 0
+0 10 20 30 40 50 60 70 0 0.04 0.08 0.12 0.16
+Time [d] Measured CH4 [mol] 	  
+Figure 9. Comparison of measured and simulated cumulative methane production for experiments 
+with PS = 9 mm: overlapping between measured and simulated data (a); comparison between 
+simulated and experimental data with line of perfect fit (b). 
+(A) (B)
+0.2 0.16
+0.15 0.12
+0.1 0.08
+0.05 0.04
+0 0
+0 10 20 30 40 50 60 70 0 0.04 0.08 0.12 0.16
+Time [d] Measured CH4 [mol] 	  
+Figure 10. Comparison of measured and simulated cumulative methane production for experiments 
+with PS = 4 mm: overlapping between measured and simulated data (a); comparison between 
+	  simulated and experimental data with line of perfect fit (b). 
+	   	   2	   6	  	   	   	   	  
+CH4 [mol] CH4 [mol]
+Simulated CH4 [mol] Simulated CH4 [mol]
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+(A) (B)
+0.2 0.16
+0.15 0.12
+0.1 0.08
+0.05 0.04
+0 0
+0 10 20 30 40 50 60 70 0 0.04 0.08 0.12 0.16
+Time [d] Measured CH4 [mol] 	  
+Figure 11. Comparison of measured and simulated cumulative methane production for experiments 
+with PS = 0.25 mm: overlapping between measured and simulated data (a); comparison between 
+simulated and experimental data with line of perfect fit (b). 
+ 
+Table 7. Results of the model calibration procedure. 
+Test  PS [mm] a* [m2kg-1] Ksbk  [kg m-2s-1] RMSE 
+T1 15 0.561 0.28 0.083 
+                         
+Table 8. Results of the model validation procedure. 
+Test  PS [mm]  a* [m2kg-1]  Ksbk [kg m-2s-1]  RMSE 
+T2 0.25 12.632 0.28 0.063 
+T3 4.0 1.579 0.28 0.0627 
+T4 9.0 0.702 0.28 0.067 
+ 
+ 2.4.2. Modelling the effect of TS on AD  
+The mathematical model proposed by Esposito et al. (2008, 2011a,b) was calibrated to set different 
+values of the kinetic disintegration constant $K_{dis}$ [$T^{-1}$] = $K_{sbk}\,a^*$, for different TS contents. For a selected 
+PS = 15 mm, the value of a* constant was 0.561 m2kg-1. The measured data of experiment (Table 4) 
+were used, a calibration procedure introduced by Esposito et al. (2011a,b) was applied and RMSE for 
+T5, T6 and T7 experiments were evaluated. 
+The results (Fig. 12-14) show a good agreement between the simulated and experimental data; this 
+	   	   2	   7	  	   	   	   	  
+CH4 [mol]
+Simulated CH4 [mol]
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+agreement is confirmed in Table 9, where the values of the Kdis constant, evaluated for different TS, 
+are also reported. In particular the good fitting between simulated and experimental concentrations 
+shows the capability of the model to simulate the AD process of substrates with different initial TS. 
+(A) (B)
+0.2 0.16
+0.15 0.12
+0.1 0.08
+0.05 0.04
+0 0
+0 10 20 30 40 50 0 0.04 0.08 0.12 0.16
+Time [d] Measured CH4 [mol] 
+Figure 12. Comparison of measured and simulated by proposed model cumulative methane production 
+for experiments with PS=15 mm and TS= 4.98%:overlapping between measured and simulated data 
+(a); comparison between simulated and experimental data with line of perfect fit (b). 
+(A) (B)
+0.2 0.16
+0.15 0.12
+0.1 0.08
+0.05 0.04
+0 0
+0 10 20 30 40 50 0 0.04 0.08 0.12 0.16
+Time [d] Measured CH4 [mol] 	  
+Figure 13. Comparison of measured and simulated by proposed model cumulative methane production 
+for experiments with PS = 15 mm and TS= 7.48%: overlapping between measured and simulated data 
+	  (a); comparison between simulated and experimental data with line of perfect fit (b). 
+(A) (B)
+0.15 0.16
+0.12
+0.12
+0.08 0.08
+0.04 0.04
+00 10 20 30 40 50 00 0.02 0.04 0.06 0.08 0.1 0.12 0.14
+Time [d] Measured CH4 [mol] 	  
+Figure 14. Comparison of measured and simulated by proposed model cumulative methane production 
+for experiments with PS = 15 mm and TS = 11.34%: overlapping between measured and simulated data 
+(a); comparison between simulated and experimental data with line of perfect fit (b). 
+	   	   2	   8	  	   	   	   	  
+CH4 [mol] CH4 [mol] CH4 [mol]
+Simulated CH4 [mol]
+Simulated CH4 [mol] Simulated CH4 [mol]
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+Table 9. Disintegration constant and RMSE for different TS. 
+ 
+Test  a* [m2kg-1]  Kdis [s-1]  RMSE 
+ 
+T5 0.561 0.1 0.0084 
+T6 0.561 0.3 0.0088 
+T7 0.561 0.55 0.0087 
+ 
+Figure 15 indicates a linear relationship between TS and the disintegration kinetic constant obtained 
+by implementing the model proposed by Esposito et al. (2008, 2011a,b): 
+0.6
+0.5
+0.4 IMPR = -740.3 TS+84.34
+R2 = 0.9987
+0.3
+0.2
+0.1
+04 5 6 7 8 9 10 11 12
+TS [%] 	  
+Figure 15. Correlation between TS content and disintegration rate constant. 
+The linear correlation represented in Figure 15 can be expressed using the following linear equation:  
+$$\frac{d[CH_4]_0}{dt} = -740.3 \cdot (TS\%) + 84.34 \qquad (5)$$
+By considering the presence of a limiting step (i.e. disintegration process) the rate of the overall AD 
+process can be modelled by one equation. If first order kinetics is assumed for the disintegration 
+process, the methane production rate can be expressed by equation (6): 
+$$\frac{d[CH_4]}{dt} = K_{dis}\,[C] \qquad (6)$$
+where:  
+[C] = substrate concentration [ML-3]. 
+By including the following two parameters: 
+	   	   2	   9	  	   	   	   	  
+Disintegration rate constant
+[kg m2 s-1]     
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+l = angular coefficient of the interpolation line (-2961.2) 
+f = intercept value of the interpolation line on the axis of the initial methane production rate 
+(337.36) 
+and integrating and making simplifications it is possible to obtain the following equation:  
+$$K_{dis} = \frac{\ln\left(l \cdot (TS\%) + f\right) \cdot t}{C_0} \qquad (7)$$
+where:  
+t = integration time for the initial bio-methane production rate evaluation [T]; 
+C0 = initial substrate concentration [ML-3]. 
+Table 10. Disintegration kinetic constants obtained with equation (7) and with the mathematical 
+model. 
+Test  Kdis [s-1] [with Esposito et al. (2011a,b)]  Kdis [s-1] [with eq. (7)] 
+T5 0.1 0.19 
+T6 0.3 0.22 
+T7 0.55 0.55 
+ 
+In Table 10 the values of the disintegration constant, obtained with equation (7) and with the 
+mathematical model proposed by Esposito et al. (2008, 2011a,b) are reported, showing a good 
+agreement of the results of the two methods. This confirms that a simplified model (i.e. a one equation 
+model) can approximate the results of a full model when a rate-limiting step of the biological process 
+is clearly present. 
+2.5 Conclusion 
+This chapter focused on the effect of TS content and PS on anaerobic digestion of complex organic 
+substrates. A linear correlation between initial methane production rate and TS content was 
+individuated. An inverse correlation between the Particle Size and the specific methane production 
+was found, as well as a linear relationship between 1/PS and initial methane production rate for the 
+substrate added. These results underline a strong impact of the PS on the kinetic rates and 
+individuate the disintegration process as the rate-limiting step for methane production. The surface-
+	   	   3	   0	  	   	   	   	  
+CHAPTER 2 - EFFECT OF MOISTURE CONTENT ON WET ANAEROBIC DIGESTION OF 
+COMPLEX ORGANIC SUBSTRATES 
+based kinetic constant Ksbk for the disintegration equation of carrot waste was determined. Also the 
+values of the disintegration constant for different TS content were assessed. Finally a simple equation 
+correlating TS and the disintegration constant was proposed, that showed a good agreement with the 
+results of new version of ADM1 of complex organic substrate proposed by Esposito et al. (2008, 
+2011a,b). 
+	   	   3	   1	  	   	   	   	  
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+CHAPTER 3 
+Effect of moisture content on anaerobic digestion of food waste 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+This chapter is the modified version of the article “Effect of total solids content on methane and 
+VFA production in anaerobic digestion of food waste ” submitted to the Journal Waste 
+Management and Research (under revision). 
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+ 	  
+3.1. Introduction 
+The environmental challenges related to the global population growth and the global energy demand 
+are continuously promoting research efforts to develop innovative technologies aimed at producing 
+energy from non-conventional sources (Lay et al. 1997a, b; Mora-Naranjo et al. 2004; Pommier et al. 
+2007; Bollon et al. 2013). The Kyoto Protocol imposed to the major EU industrial countries to reduce 
+their total Greenhouse Gas (GHG) emissions by 8% from the 1990 level by the end of  2012 (Kyoto, 
+1997). To achieve this, the EU policies have set forward the task of supplying 5% of the European 
+energy demands from Anaerobic Digestion (AD) biogas by the year 2020 (Kim and Oh 2011).  
+AD is a biological process for degradation of organic substrates under anaerobic conditions (Esposito et 
+al., 2012a; Esposito et al., 2008). Based on the TS of waste used in the process, three types of AD can 
+be distinguished: dry AD, characterized by a TS above 15%, semi-dry AD with a TS ranging between 
+15% and 10%, and wet digestion with a TS lower than 10% (Li et al., 2011; Liotta, 2014; Zeshan and 
+Annachhatre, 2012). The dry and semi-dry systems most widely applied at industrial scale are Valorga, 
+Dranco, Kompogas and Bekon (Reith et al., 2003), but further applications have also been tested at 
+pilot and farm-scale (Lianhua et al. 2010; Mussoline 2012; Mussoline et al. 2013; Zhang and Zhang 
+1999). 
+The key parameter of the dry AD process is the water content, that is essential for the biological 
+process as water promotes substrate hydrolysis and enables the transfer of process intermediates and 
+nutrients to the bacteria (Bollon et al., 2013; De Baere et al., 2010; Lissens et al., 2001). Hence, the 
+first aim of this paper is to investigate the effect of TS on the AD of Food Waste (FW) under 
+mesophilic conditions in batch reactors. BMTs were performed to compare methane yield, methane 
+production rate, COD, VS and TS degradation in wet, semi-dry and dry conditions. In particular, 
+VFAs composition and concentrations were also investigated as a useful indicator of process stress 
+and instability (Ahring et al. 1995). VFAs are also valuable products that can be used as carbon source 
+in biological processes (Elefsiniotis et al. 2004). However, the role of these parameters on the process 
+development remains still little studied. Therefore, the second aim and main novelty of this chapter is 
+to assess the TS effect on VFAs production from FW, and the VFAs effect on the process evolution. 
+ 
+	   	   3	   3	  	   	   	   	  
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+ 3.2. Materials and Methods 
+3.2.1 Experimental set-up  
+BMTs were performed at laboratory scale under controlled and reproducible conditions (Esposito et 
+al. 2012b; Esposito et al. 2011a, b; Esposito et al. 2012c) using 2000 mL glass bottles GL 45 (Schott 
+Duran, Germany). Each bottle was sealed with a 5 mm silicone disc, held tightly to the bottle head by 
+a plastic screw cap punched in the middle (Schott Duran, Germany). A plastic tube hermetically 
+closed to the top was inserted in the plastic screw cap to permit sample withdrawing. All digesters 
+were immersed up to half of their height in hot water kept at a constant temperature of 308.15 K by 
+200 WA-763 submersible heaters (Hagen, Germany). Small amounts of Na2CO3 powder were also 
+added to control the pH and alkalinity values (Esposito et al. 2012b,c) . 
+	   	   3	   4	  	   	   	   	  
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+3.2.2. Substrate and inoculum preparation 
+BMTs were conducted in triplicate using FW and Buffalo Manure (BM) anaerobic digestate as 
+inoculum. The FW was prepared according to Valorgas report (Valorgas, 2012) as indicated in Table 
+11.  
+Table 11. Food waste composition of the synthetic substrate used. 
+Amount  
+  Food type (gr wet) 
+Potatoes 200 
+Tomatoes 170 
+Eggplants 170 
+Salad leaves 180 
+Broccoli 180 
+Carrots 140 
+Apples 150 
+Tangerines 170 
+Banana 150 
+Chicken 70 
+Pork 70 
+Fish 70 
+Cheese 20 
+Milk 20 
+Bread 70 
+Biscuits 70 
+Rice 50 
+Pasta 50 
+ 
+Particles size smaller than 0.5 mm were obtained by grinding the FW substrate before starting the 
+experimental tests. The BM digestate, sampled from a mesophilic anaerobic digester, was dehydrated 
+by filtration to obtain a final TS content of 17.82%. BMTs were carried out in wet (TS = 4.52%), semi-
+dry (TS= 12.87%) and dry (TS = 19.02%) conditions as indicated in Table 12. The different TS 
+contents of the mixture were obtained by adding 500 g of inoculum, differently diluted with distilled 
+water and varying the amount of the substrate calculated in order to keep the ratio between organic 
+matter and anaerobic sludge equal to 1:2. Blank BMTs were also conducted on BM without addition of 
+substrate to estimate, as a control, the volume of methane resulting from the fermentation of the 
+inoculum. Table 12 gives the mixture composition of each BMTs and reports the BM and substrate 
+	   	   3	   5	  	   	   	   	  
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+amount as well as the TS and VS concentration of the substrate mixture. 
+ 
+Table 12. Composition of inoculum and FW substrate in BMT. 
+Inoculum TS Substrate TS TS VS Tests [g] inoculum amount substrate mixture Mixture [%] [g] [%] [%] [%] 
+T1 500 (±1)   3.45 27.26 24.21 4.52 3.61 
+T2 500 (±1)  10.88 87.80 24.21 12.87 10.45 
+T3 500 (±1)  17.82 139.10 24.21 19.02 15.25 
+ 
+3.2.3. Analytical methods 
+3.2.3.1 Methane production 
+Volumetric methane production was measured once a day, by connecting each digester by a small 
+pipe to an inverted 1000 mL glass bottle containing a strong alkaline solution (12% NaOH). The 
+inverted 1000 mL glass bottle was sealed in the same way as the digesters. The adopted procedure is 
+described in detail in the Chapter 2. 
+  
+ 3.2.3.2 VFAs analysis 
+VFAs concentration and speciation were monitored throughout the process. VFAs were analysed 
+collecting 100 mg of digestate sampled from each reactor and diluted with ultrapure water. The 
+samples were vigorously stirred for three minutes and centrifuged at 8000 rpm for 5 min. VFAs were 
+extracted from the supernatant by SPME prior to GC-MS injection following the procedure proposed 
+by Ábalos et al. (2000). 50 µL of a 2,2 dimethyl butanoic acid solution was added as internal standard. 
+85 µm polyacrylate coated fibers from SUPELCO were used for the extraction and analysed after 
+thermal desorption by an Agilent 6850 GC coupled with a 5973 Network MSD detector. 
+  
+	   	   3	   6	  	   	   	   	  
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+3.2.3.3 Other parameters 
+The weight, TS and VS concentration of the anaerobic sludge were determined by gravimetry 
+according to EPA Standard Method 1684 (U.S.E.P.A, 2001). Temperature of all mixtures investigated 
+was monitored for at least once a day with a TFK 325 thermometer (WTW, Germany). COD was 
+determined by the closed reflux method, followed by photometric determination according to APHA 
+standard method 5220D (APHA, 1998) and by applying the method proposed by Zupančič & Roš (2012). 
+The photometer used was a WTW Photolab Spektral visible spectrophotometer. 
+ 
+ 3.3. Results and Discussion  
+3.3.1 Bio-methane production 
+Results of BMTs are summarized in Figures 16-18. Figure 16 reports the specific cumulative methane 
+production versus time in reactors operated with different TS content. Each curve represents the 
+average of 3 replicates (max standard deviation = 4%). The specific cumulative methane production 
+was obtained dividing the cumulative methane production of each test by the initial substrate-inoculum 
+VS mixture. Figure 17 reports the final specific methane yield, measured at the end of each 
+experiment, as a function of the TS content and subtracted of the respective blank production. Finally 
+Figure 18 illustrates the initial methane production rate versus the TS content, evaluated by dividing 
+the specific net methane production by the number of days (3 days) from the start of the experiment.  
+A lower TS content favours both the cumulative methane production and the final methane yield. 
+Such a result is consistent with previous findings (Abbassi-Guendouz et al. 2012; Fernández et al. 
+2008; Le Hyaric et al. 2012; Li et al. 2011; Liotta et al. 2014) obtained using different biodegradable 
+substrates (Table 13), and confirms that the conversion of acids to methane by methanogenic bacteria 
+can be negatively influenced by the lack of water (Lay et al. 1997a; Lay et al. 1997b). It is worth 
+noting that the initial methane production rate is linearly and negatively correlated with the TS 
+percentage (Fig. 18), as already observed during the AD of other organic wastes more or less rapidly 
+biodegradable: dehydrated sludge mixed with dry kitchen waste (Lay et al. 1997a), waste excavated 
+from a sanitary landfill (Mora-Naranjo et al. 2004), paper waste (Pommier et al. 2007), cellulose (Le 
+Hyaric et al. 2012) and cardboard (Abbassi-Guendouz et al. 2012). At lower TS concentration, due to 
+the increasing water content and to the more favourable transport and mass transfer conditions, it 
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+seems plausible that the microorganisms are better sustained with soluble substrates (Mora-Naranjo et 
+al. 2004), so that the process takes place more rapidly.  
+ 
+Figure 16. Specific cumulative methane production of FW at different TS content (Tests T1-T3). 
+	  
+Figure 17. Final methane yield of FW with different TS content 
+	  
+Figure 18. Linear correlation between the specific initial methane production rate and the TS content of 
+FW. 
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+ 
+Table 13. Final methane yields improvement in wet conditions compared with semi-dry and dry 
+conditions. 
+ 
+Substrates used Final methane yield TS and References 
+in BMTs  improvement with Temperature 
+lower TS content [%] 
+FW 57 TS = 30%, Fernández et al. 
+20%; (2008) 
+T=35°C 
+Water sorted    
+organic fraction of 15  TS = 16%, Dong. et al. (2010) 
+municipal solid 11%; 
+waste T=30 °C 
+    
+Cellulose 11.6 TS = 25%, Abbassi-Guendouz 
+18%; et al. (2012) 
+T=35°C  
+Cardboard 24 TS = 30%, Le Hyaric et al. 
+10% (2012) 
+T = 35 °C 
+Carrot Waste 1 TS =11.3%,      Liotta et al.2014 
+TS = 5% 
+T =35°C 
+FW 69 TS=19.2 %, This study 
+4.5%;T= 35°C 
+  
+3.3.2 VFAs production 
+A deeper understanding of the TS effect on process development can be obtained by comparing the 
+trend of daily methane production (Fig. 19) and the corresponding concentration and speciation of 
+VFAs (Fig. 20). A first peak of methane production can be detected in all reactors on the second day 
+(Fig. 19). This peak, most likely due to the degradation of fast biodegradable compounds, corresponds 
+to the peak of Total Volatile Fatty Acids (TVFAs) related to acid accumulation at the start-up of the 
+process (Fig. 20). This means that the methanization is the rate-limiting step at the beginning of the 
+process.  
+Once the methanization has begun, the rate-limiting step becomes the hydrolysis process, and the 
+TVFAs concentration slowly decreases. Two more peaks of methane production can be observed on 
+day 15 and day 36. This finding is in agreement with Charles et al. 2009 and Dong et al. 2010 who 
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+found two peaks of methane production during anaerobic digestion of organic fraction of municipal 
+solid waste. Dong et al. 2010 correlated this finding to the inhibitory effect of an elevated H2 partial 
+pressure on the acetoclastic methanogenesis. It is likely that the two peaks correspond to the 
+degradation of easily and slowly biodegradable compounds contained in the FW. 
+The maximum TVFAs concentration found in the case of 12.9% and 19.2% were respectively 127 
+mmol/kg and 135 mmol/kg (Fig. 20): in these cases TVFAs concentrations exceed the threshold 
+values reported by Karthikeyan and Visvanathan, 2012 above which a significant reduction of process 
+kinetics occurs. The same occurs for the concentration of acetic acid, which reaches values higher 
+than 33 mmol/L. The lower specific methane yield detected at the higher TS content can be correlated 
+to acid inhibition during the process, which is more important for TS 12.9% and 19.2%. Indeed, high 
+TVFAs concentrations induce acidification of the medium, leading to the presence of TVFAs in their 
+un-dissociated forms, which are more toxic for microorganisms (Amani et al. 2010). A lower water 
+content in the fermenting mixture makes the TVFAs concentration higher due to a lack of solvent. 
+Therefore, even if the amount of produced TVFAs is the same, their concentration in the reactor will 
+be much higher in dry AD. 
+It has to be stressed that because of the lack of the mixing device inside the reactor higher TS 
+concentrations imply higher heterogeneities and possible accumulation of inhibitory compounds 
+inside specific reactor zones is likely to occur. Furthermore, at the highest TS concentrations 
+investigated, environmental conditions do not allow the growth of acetoclastic methanogens or 
+acetate-oxidizing bacteria because of too high VFA concentrations and too low pH values (Abbassi-
+Guendouz et al. 2012). During the first stage (0-4 days), acetic acid accumulation occurs (Fig. 21a) 
+because hydrolysis and acidogenesis take place and the easy biodegradable fraction of FW is 
+converted to TVFAs. During the second stage (5-35 days), acetoclastic methanogens are in the 
+exponential growth phase and the acetic acid consumption rate is higher than its generation rate (Dong 
+et al. 2010). Therefore, hydrolysis and acidogenesis become the rate-limiting steps and the produced 
+acids are consumed to produce methane (Dong et al. 2010). 
+	   	   4	   0	  	   	   	   	  
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+ 
+Figure 19. Daily methane production of FW at different TS content 
+	  
+Figure 20. Evolution of TVFAs concentration in AD of FW at different TS contents 
+ 
+The maximum concentration of propionic acid (Fig. 21b) occurs sooner for lower TS concentrations 
+(day 13) and later for higher TS concentrations (day 17). This accumulation, common also to formic 
+acid (Fig. 21e), can be correlated to the limited transformation of propionate to other VFAs as pointed 
+out also by Hanaki et al. 1994. Also butyrate and valeric acid isomers present higher values with 
+higher TS (Fig. 21c and 21d), probably a consequence of the process instability occurring during the 
+acid production, which determines the formation of isomeric compounds. About the propionic acid, 
+although an accumulation (8-12 days) can also be seen for TS = 4.5% during days 7-12, in this case the 
+concentration starts immediately to decrease and drops regularly to zero (Fig. 21b). Such behavior can 
+be attributed to the fact that the concentration of propionate is directly related to that of acetate in the 
+reactor and the lowest acetate accumulation occurs during test T1 (TS = 4.5%) (Fig. 21a). During tests 
+T2 and T3 the concentration of acetate is twice higher and lasts for about 5 days longer. This leads to 
+an accumulation of propionate that is contemporary to the accumulation of acetate. A long acetate and 
+propionate accumulation is instead not present in the reactor with TS content of 4.5%. The 
+accumulation of butyric and propionic acid that takes place only in the dry and semidry reactors might 
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+be attributed to the co-presence of alternative fermentation pathways, that yield to butyric acid 
+accumulation. This pathway is alternative to the acetic fermentation and can have different process 
+kinetics.  
+	  
+a) Acetic acid 
+ 
+b) Propionic acid 
+ 
+c) Butyric acid 
+	   	   4	   2	  	   	   	   	  
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+ 
+d) Valeric acid 
+ 
+e) Formic acid 
+Figure 21. Evolution of the VFAs concentration of FW AD: a) acetic acid; b) propionic acid; c) butyric 
+acid; d) valeric acid; e) formic acid. 
+ 
+The Total COD concentration in the reactor at different initial TS concentrations was also investigated. 
+As expected, the COD degradation decreased under all TS conditions. The COD values at the end of 
+the experiment were higher for higher TS content as COD removal decreased from 74 ± 6% (TS = 
+4.5%) to 62 ± 8% (TS = 12.9%), down to 56±7% (TS = 19.2%), confirming the slowdown of process 
+kinetics taking place at higher TS content due to high VFA concentration (Figs. 20 and 21). 
+ 
+ 
+ 
+	   
+	   	   4	   3	  	   	   	   	  
+CHAPTER 3 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF FOOD 
+WASTE 
+ 3.4 Conclusions 
+This chapter focused on the effect of the TS content on the anaerobic digestion of FW. The 
+experimental results show a decrease of the specific final methane yield of 4.3% and 40.8% in semi-
+dry and dry conditions, respectively, compared to wet conditions. A higher specific cumulative 
+methane production rate and better process performance in terms of COD reduction were also 
+achieved at lower TS content. A linear correlation between the initial methane production rate and the 
+TS content was observed. High TVFA concentrations of 135 mmol/kg and 127 mmol/kg were found 
+in dry and semidry conditions, respectively, resulting in a slowdown of process kinetics.
+	   	   4	   4	  	   	   	   	  
+CHAPTER 4 - EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+ 
+CHAPTER 4 
+Effect of moisture content on anaerobic digestion of rice straw.
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+ 4.1 Introduction 
+Rice straw is one of the most abundant residues and is a potential renewable source for energy 
+generation. AD may offer a promising alternative to solve imminent rice straw disposal problems in 
+rice production regions (Zhang and Zhang 1999). Different advantages are connected to the AD of 
+rice straw. This substrate is a very common agricultural waste and the biogas production potential is 
+appealing to both developed and developing countries (Mussoline et al. 2013). However, one of the 
+main disadvantages is related to the ligno-cellulosic structure of rice straw that is well attested to be 
+difficult to biologically degrade (Sambusiti, 2013). Rice straw as lignocellulosic material is thus 
+mainly composed as follows: cellulose (37.4%), hemi-cellulose (44.9%), lignin (4.9%) and silicon ash 
+(13%) (Hills and Robert 1981).  
+Dry AD is well suited to handle ligno-cellulosic biomass and provides a reduction of problems 
+encountered in liquid, such as floating and stratification of solids. Dry AD of rice straw received much 
+attention due to the high TS content of rice straw, that requires less sludge addition and smaller 
+reactor volumes and pre-treatment. However, such high solid contents involve several technical 
+disadvantages in terms of transport, handling and mixing to those encountered in wet processes (De 
+Baere et al. 2010). The key parameter of dry AD processes is the water content, that is essential for 
+the biological organic waste conversion. Water promotes substrate hydrolysis and enables the transfer 
+of process intermediates and nutrients to bacterial sites (Lay et al. 1997a,b; Mora-Naranjo et al. 2004; 
+Pommier et al. 2007).  
+The aim of this chapter is to investigate the effect of the moisture content relating the AD performance 
+to the process parameters monitored during the rice straw degradation. More in detail, by varying the 
+TS in the range of 4.85-23.41% TS, the final specific methane production yield, VS, COD, VFA and 
+total and soluble phenols concentration were analysed. In particular, this chapter focuses on inhibition 
+problems and final methane yield reduction that occurs at elevated TS concentrations caused by VFAs 
+and high concentration of soluble phenolic compounds. 
+	   	   4	   6	  	   	   	   	  
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+ 4.2. Materials and Methods 
+4.2.1 Experimental set-up  
+During the biogas production, samples were taken from the reactor, where pH, COD, VFAs and 
+phenols concentrations were monitored. BMT were performed on a small scale under controlled and 
+reproducible conditions in a 2000 mL glass bottle GL 45 (Schott Duran, Germany). Each bottle was 
+sealed with a 5 mm silicone disc that was held tightly to the bottle head by a plastic screw cap 
+punched in the middle (Schott Duran, Germany). A plastic tube hermetically closed at the top was 
+inserted in the plastic screw cap to permit sampling. All digesters were immersed up to half of their 
+height in hot water kept at a constant temperature of 308 +/- 1 K by 200 WA-763 submersible heaters 
+(Hagen, Germany). Small amounts of Na2CO3 powder were also added to the medium to control pH 
+values (Esposito et al., 2012a,b). 
+ 
+4.2.2. Substrate and inoculum preparation 
+BMTs were performed using rice straw and the anaerobic digestate of BM. The value of particle size 
+smaller than 0.5 mm was obtained by grinding the rice straw prior to starting experimental tests.  
+The initial TS content of the fresh digestate was 10.88%, this high value is related to the nature of the 
+digestate, that is an effluent of the dewatering system of a mesophilic Anaerobic Reactor. To increase 
+the TS content, the digestate was dewatered by filtration to obtain a final TS content of 17.20%. Then, 
+the sample was diluted with water to obtain the designed moisture content for batch tests with lower 
+TS content (Table 14). A fixed amount of BM digestate equal to 500 g was defined for each batch test 
+and only the amount of substrate was changed to obtain different moisture contents. All the tests were 
+performed imposing a selected organic matter/inoculum ratio of 0.5 and conducted in triplicate. A 
+total of nine bottles were operated with a final TS content of the mixture: 4.84%, 14.86%, 23.40%, 
+which represents, respectively, wet, semi-dry and dry conditions. Table 14 gives the mixture 
+composition of each BMT test. 
+Nine further tests were conducted using only BM as the substrate to estimate the volume of methane 
+resulting from the fermentation of the organics contained in the anaerobic sludge. In total, 18 tests 
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+were performed.   
+Table 14. Inoculum and substrate characteristics. 
+Anaerobic TS Substrate TS VS 
+Tests sludge inoculum amount  substrate TS mixture [%] Mixture [g] [%] [g] [%] [%] 
+T1 500(±1) 3.45 8.09 91.00 4.85     3.75 
+T2 500(±1) 10.88 26.05 91.00 14.86    11.68 
+T3 500(±1) 17.82 41.27 91.00 23.41    17.98 
+                     
+4.2.3. Analytical methods 
+4.2.3.1 Methane production, COD, TS, VS. 
+Volumetric methane production was measured once a day, by connecting each digester by a capillary 
+tube to an inverted 1000 mL glass bottle containing an alkaline solution (12% NaOH). The inverted 
+1000 mL glass bottle was sealed in the same way as the digesters. To enable gas transfer through the 
+two connected bottles, the capillary tube was equipped on both ends with a needle sharp enough to 
+pierce the silicone disc. 
+The weight, TS and VS concentration of the anaerobic sludge as well as the dry matter, moisture 
+organic matter and ash content of the substrate were determined by gravimetry according to Standard 
+Methods (APHA, 1998). Temperature of all mixtures investigated was monitored for at least once a 
+day with a TFK 325 thermometer (WTW, Germany). COD was determined by the closed reflux 
+method, followed by photometric determination using a WTW Photolab Spektral visible 
+spectrophotometer	   according to the APHA standard method 5220D and by applying the method 
+proposed by Zupančič and Roš (2012).	  
+ 
+4.2.3.2 VFAs and phenols analysis 
+VFAs concentration and speciation were monitored throughout the process. VFAs were analysed 
+collecting 100 mg of digestate sampled from each reactor and diluted with ultrapure water. The 
+samples were vigorously stirred for three minutes and centrifuged at 8000 rpm for 5 min. VFAs were 
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+extracted from the supernatant by SPME prior to GC-MS injection following the procedure proposed 
+by Ábalos et al. (2000). 50 µL of a 2,2 dimethyl butanoic acid solution were added as internal 
+standard. 85 µm polyacrylate coated fibers from SUPELCO were used for the extraction and analysed 
+after thermal desorption by an Agilent 6850 GC coupled with a 5973 Network MSD detector. 
+Total Phenols determination is according to APHA standard method 5550 B (APHA, 1998), by the 
+use of the Folin reagent. The method is sensitive for any compound containing aromatic hydroxyl 
+group. The calibration curve was built preparing standards at increasing concentration of phenol 
+(C6H5OH).  
+ 4.3. Results and Discussion  
+4.3.1 Methane production 
+Results of BMTs are summarized in Figures 22-24. Figure 22 reports the specific cumulative methane 
+production versus time in reactors operated with different TS content. Each curve represents the 
+average of 3 replicates (max standard deviation = 3%). The specific cumulative methane production 
+was obtained dividing the cumulative methane production of each test by the initial substrate-inoculum 
+VS mixture. Figure 23 reports the final specific methane yield, measured at the end of each 
+experiment, as a function of the TS content and subtracted of the respective blank production.  
+Figures 22-23 show that the lower TS content was favourable for improving the cumulative methane 
+production and the final methane production yield.  
+Figure 24 illustrates the daily methane production during the first 60 days. One initial peak of methane 
+production was detected in all reactors. This peak is connected to the anaerobic degradation of 
+biodegradable substrates, corresponding to the TVFA (Fig. 26) peak related to acid accumulation at 
+the start-up of the process. This means that the hydrolysis is the rate-limiting step of the process. The 
+results obtained with the final methane yield for different TS are consistent with previous studies 
+operated with different types of substrate performed by Lay et al. (1997a, b), Abbassi-Guendouz et al. 
+(2012), Fernández et al. (2008), Dong et al. (2010), Le Hyaric et al. (2012) and Shi et al. (2014). All 
+authors do agree that higher methane yields can be obtained with a lower TS. Thus, the conversion of 
+acids to methane by methanogenic bacteria might be influenced by the lack of the free water (Lay et 
+al. 1997b; Ghosh 1985) that can occur with a higher TS content in the range of dry and semidry 
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+digestion (Abbassi-Guendouz et al. 2012; Fernández et al. 2008; Li et al. 2011). Figure 25 indicates a 
+non-linear relationship between TS content and initial methane production rate. This behaviour is not 
+in agreement with several author findings, who found a linear relationship between the two parameters 
+(Lay et al. 1997b; Le Hyaric et al. 2012; Abbassi-Guendouz et al. 2012; Mora-Naranjo et al. 2004; 
+Pommier et al. 2007). The different behaviour can be explained because of the different substrate 
+composition, the complex nature of ligno-cellulosic compounds, the low bio-availability of cellulose, 
+the substrate crystalline structure and the presence of hemicellulose. 
+ 
+Figure 22. Specific cumulative methane production of rice straw in mesophilic conditions at different 
+TS content. 
+ 
+Figure 23. Final methane yield of rice straw AD at different TS content.  
+	   	   5	   0	  	   	   	   	  
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+	  
+Figure 24. Daily methane production of rice straw anaerobic digestion at different TS content. 
+	  
+Figure 25. Non-linear correlation between specific methane production and TS content.  
+ 
+4.3.2 Analysis of process intermediates 
+To explain the obtained results, the concentration of VFAs was monitored, as it is considered a 
+useful indicator of process stress and instability (Ahring et al. 1995). Figure 26 illustrates the temporal 
+evolution of selected VFAs (acetate, butyrate, propionate, valerate and formic acid) for the three TS 
+concentrations investigated. The lower methane yield detected with a higher TS content corresponded 
+to a higher concentration of acids. The highest concentrations were observed at TS = 23.41%, with 
+maximum values of 8.73 mmol acetic acid/kg on the 2nd day, 9.52 mmol formic acid/kg on the 8th day, 
+19.18 mg propionic acid/kg on the 2nd day and 2.02 mmol butyric acid/kg on the 8th day. 
+In the case of TS = 14.86%, the maximum values of 5.16 mmol acetic acid/kg on the 8th day, 2.57 
+mmol formic acid/kg on the 8th day, 6.82 mg propionic acid/kg on the 8th day and 0.43 mmol butyric 
+acid/kg on the 9th day were found. For a TS content of 4.85% the maximum values of 2.56 mmol 
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+acetic acid/kg on the 3rd day, 0.4 mmol formic acid/kg on the 1st day, 1.57 mmol propionic acid/kg on 
+the 8th day and 0.21 mmol butyric acid/kg on the 3rd day were found. 
+An insufficient amount of methanogenic archaea may be the cause of such high concentrations of 
+VFAs. Indeed, high VFA concentrations induce acidification of the medium, and result in the 
+presence of VFAs in their un-dissociated form which is more toxic for microorganisms (Amani et al. 
+2010). Furthermore, at the highest TS concentrations, environmental conditions did not allow the 
+growth of acetoclastic methanogens or acetate-oxidizing bacteria on account of high VFA 
+concentrations and low pH values (Abbassi-Guendouz et al. 2012). Also during the first days, acid 
+accumulation occurred (Fig. 27a-e), because the hydrolysis and acidogenesis took place and the easy 
+biodegradable fraction of rice straw was converted to VFAs. During the second stage, acetoclastic 
+methanogens were in the exponential growth phase and the acetic acid consumption rate exceeded its 
+generation rate, even though the hydrolysis and acidogenesis were still going on. In the final stage, the 
+balance between the hydrolysis/acidogenesis and methanogenesis was formed and the produced acids 
+were consumed to produce methane (Dong et al. 2010). 
+Finally, it is possible to notice how the accumulation of butyric and formic acids takes place only in the 
+dry and semidry reactors and lasts until the 8th day, while both these acids' concentrations are close to 
+zero during almost the whole experiment. This might be attributed to the co-presence of an alternative 
+fermentation pathway, that leads to the formation of butyric acid. This pathway is alternative to the 
+acetic fermentation and determines different process kinetics. This indicates that in the studied reactors 
+the border conditions are different for the fermenting microorganisms, probably originating bacterial 
+growths with different distributions and degradation pathways. 
+ 
+	   	   5	   2	  	   	   	   	  
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+	  
+Figure 26. Evolution of TVFA concentration of rice straw at different TS content.  
+	  	  
+a) Acetic acid	  
+	   	  
+b) Propionic acid 
+	   	   5	   3	  	   	   	   	  
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+	  	  
+c) Butyric acid	  
+	   	  
+d) Valeric acid                                                         
+	  
+e) Formic acid 
+Figure 27. Evolution of VFA concentration of rice straw anaerobic digestion with different TS content: 
+a) Acetic acid; b) propionic acid; c) butyric acid; d) valeric acid; e) formic acid.  
+ 
+Despite the observed differences among the three TS concentrations, the detected VFA 
+concentrations never reached the inhibition limit (Fig. 27). The maximum TVFA concentrations were 
+54
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+3 mmol/kg, 15 mmol/kg and 33 mmol/kg, respectively, i.e. much lower than the threshold value 
+indicated by Karthikeyan and Visvanathan (2012). It was therefore supposed that the inhibition 
+occurred because of the higher total phenol content at higher TS concentration (Fig. 28). 
+	  
+Figure 28. Total phenol degradation in anaerobic digestion of rice straw for different TS. 
+ 
+ 4.4 Comparative process efficiency  
+The reactor performances are reported for all TS concentrations in terms of VS reduction, evolution of 
+COD removal and specific final methane production yield. In terms of VS removal efficiency, the 
+better performances were observed at a lower TS content. This finding is in agreement with the 
+measured final methane production yield.  
+The COD values at the end of the experiment were higher for higher TS content as COD removal 
+decreased from 63 ± 6% (TS = 4.85%) to 59 ± 8% (TS = 14.86%), down to 48 ± 7% (TS = 23.4%), 
+confirming the slowdown of process kinetics taking place at higher TS content due to high VFA 
+concentration. 
+ 
+ 4.5. Conclusions 
+This chapter focuses on the effect of the moisture content on the anaerobic digestion of rice straw. A 
+higher specific methane production yield and process performance in terms of VS and COD 
+reductions were achieved at a lower TS content. This suggests that a wet anaerobic digestion gives 
+	   	   5	   5	  	   	   	   	  
+CHAPTER 4- EFFECT OF MOISTURE CONTENT ON ANAEROBIC DIGESTION OF RICE 
+STRAW 
+ 
+better performances compared with dry processes. An inhibition correlated to the TVFA accumulation 
+was found at higher TS content. In fact maximum TVFA concentration of 2.1 g/kg was found in dry 
+condition, 1 g/kg in semidry conditions and 0.2 g/kg in wet conditions. Higher total phenol 
+concentration was also found at higher TS content. This could determine inhibition phenomena and 
+reduction of methane production. 
+	   	   5	   6	  	   	   	   	  
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+CHAPTER 5 
+Modified ADM1 for dry and semi-dry anaerobic digestion of solid 
+organic waste  
+ 
+ 
+	   
+ 	  
+ 
+ 
+ 
+ 
+ 
+This chapter is the modified version of the article “Modified ADM1 for dry and semi-dry anaerobic 
+digestion of solid organic waste”  submitted to Bioresource Technology Journal (under revision). 
+	   	   5	   7	  	   	   	   	  
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+5.1 Introduction 
+Experimental research carried out in recent years on AD have definitely established that the TS content 
+plays an important role on process development (Dong et al. 2010; Brown and Yebo 2013; Fernàndez 
+et al. 2008; Forster-Carneiro et al. 2007; Forster-Carneiro et al. 2008; Le Hyaric et al. 2012; Lü et al. 
+2012; Jha et al. 2013; Wang et al. 2013; Xu and Li 2012; Liotta et al. 2014; Shi et al. 2014; Zhu et al. 
+2014). As a consequence, several studies have been conducted recently to adapt and calibrate the existing 
+mathematical models to take into account the effect of the TS content (Lay et al. 1997a, 1997b; Fdez-
+Güelfo et al. 2012; Brown et al. 2012; Le Hyaric et al. 2012; Motte et al. 2013). Le Hyaric et al. (2012) 
+and Lay et al. (1997a, 1997b) applying the Gompertz model to simulate the results of Specific 
+Methanogenic Activity test, found that a high TS content (15%-25%) reduces substrate degradation 
+because of water and nutrients limitation, resulting in a lower methanogenic activity. Brown et al. 
+(2012) used first-order kinetic models to characterize the methane production of lignocellulosic 
+biomass and found a linear relationship between logarithmic methane production and reaction time in 
+both wet and dry anaerobic digestion of switchgrass, corn stover, wheat straw, leaves, yard waste 
+and maple. Dry anaerobic digestion generally exhibits a poor start-up performance, thus several models 
+assume the hydrolysis as the rate-limiting step of the process (Jha et al. 2013). In particular, Abbassi-
+Guendouz et al. (2012), applying the ADM1 (Batstone et al. 2002) to cardboard treatment, found a 
+decreasing first-order hydrolysis rate constant for carbohydrates degradation when increasing the TS 
+content between 15-30%. Liotta et al. (2014) also found a decreasing disintegration rate when 
+increasing the TS content in the range of wet digestion. Bollon et al. (2011) found a similar result using 
+municipal solid waste digestate.  
+Moreover recent studies demonstrated the important role of the mechanisms associated to VFAs uptake 
+on process performances (Ward et al., 2008, Bolzonella et al., 2003, Dai et al., 2013, Jha et al., 2013, 
+Pohl et al., 2013). As intermediate products, VFAs have been treated as an indicator of the digestion 
+efficiency, but high concentrations of VFAs can determine a decrease of pH leading to performance 
+failure of the digester (Gerardi, 2003, Jha et al., 2013, Motte et al., 2013, Vavilin et al., 1996a). 
+An attempt to model dry anaerobic digestion considering also the role of VFA uptake was done by 
+Guendouz et al. (2010), who found a transitory accumulation of VFA during the batch tests indicating 
+that not only the hydrolysis is the rate-limiting step during dry anaerobic digestion of the solid wastes. 
+Motte et al. (2013) proposed a quadratic model able to describe dynamically the effect of TS, PS and 
+substrate/inoculum ratio on methane production, pH and VFA concentration. The model proved 
+58
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+highly significant (p-value < 0.05) and the coefficient of determination reached 80%; however, the 
+authors have not implemented a complete model, like ADM1, and have not calibrated any kinetic 
+constant varying TS content.  
+The aim of the present chapter is to develop a kinetic model that can specifically characterize the 
+disintegration, the acetogenesis and methanogenesis steps of selected complex organic substrates as a 
+function of TS content in order to obtain a model able to predict and interpret results from anaerobic 
+digesters in wet, semi-dry and dry AD. In the following section, an overview of the model structure, 
+assumptions and main model parameters is presented. The proposed model is based on the cited ADM1 
+model (Batstone et al., 2002) as modified by Esposito et al. (2008, 2011a,b, 2012a,b) for complex 
+organic substrates (modified ADM1). The kinetic equations are reformulated to consider the direct 
+effect of TS content and the effect of the intermediate compounds, which can affect, as a function of 
+the TS content, the whole process development. The dynamics of acetate, propionate and methane 
+production presented in Chapter 3 and 4 and obtained from two different series of batch anaerobic 
+digestion of food waste and rice straw were used to calibrate the proposed model. Food waste was 
+selected as representative of easily, highly biodegradable and heterogeneous substrates (Zhang et al. 
+2007), while rice straw as representative of slowly biodegradable and model of lignocellulosic residues.  
+ 
+5.2 Model description 
+The proposed model is based on the Modified ADM1 (MADM1), extended to take into account the 
+presence of complex organic substrates in the feedstock, and the operation of the digester in semi-dry 
+and dry conditions. It is applied for Completely Stirred Tank Reactor (CSTR) and batch systems. The 
+MADM1 is a structured biological model that simulates the major conversion mechanisms of organic 
+substrates into biogas and the degradation of by-products. It assumes that composite materials are 
+converted into carbohydrates, proteins and lipids by a disintegration step (Esposito et al. 2012a,b). 
+These components are further hydrolysed into simple sugars, amino acids and long chain fatty acids. 
+Then, during the acidogenic step, fermentative micro-organisms convert these products into acetic, 
+propionic, butyric and valeric acids, hydrogen and carbon dioxide. The uptake of fatty acids yields 
+acetate (acetogenic step), which is converted into methane by methanogens.  
+The disintegration and hydrolysis steps are modelled by first-order kinetics. The disintegration uses 
+surface-based kinetics, while the hydrolysis step uses classical first-order kinetics. All the other 
+59
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+transformations are classical biochemical transformations performed by specific bacterial groups, and 
+are described by a Monod-type equation, where the substrate uptake is associated to the microbial 
+growth. The kinetics of microbial growth and decay are also included in the model. 
+The overall model consists of 28 mass balance equations (Batstone et al. 2002) applied to the 28 state 
+variables (13 substrates and 15 biomasses) summarized in Tables 15-16. The kinetic constants and 
+processes of the modelled substrates in the MADM1 are listed in Table 17. It is worth noting that, 
+according to the MADM1, only the parameter Ksbk, not included in the original version of the ADM1, 
+is function of the substrate intrinsic characteristics and therefore depends also on the TS content of 
+the substrate (Liotta et al. 2014). 
+Table 15. Substrate variables in the MADM1 model. 
+ 
+Substrate variables [ML-3] Symbol 
+Initial Substrate C 
+Soluble Inert Si 
+Total Propionate Spro 
+Total Acetate Sac 
+Total Butyrate Sb 
+Total Valerate Sv 
+Gaseous Hydrogen Shg 
+Gaseous Methane Shm 
+Inorganic carbon Sc 
+Nitrogen SN 
+LCFA SLCFA 
+Sugar SS 
+Amino acids Sam 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   6	   0	  	   	   	   	  
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+ 
+Table 16. Biomass variables in the MADM1 model 
+ 
+Biomass variables [ML-3] Symbol 
+Particulate inert Xi 
+Propionate degraders Xpro 
+Acetate degraders Xac 
+Butyrate and Valerate degraders Xb/v 
+Hydrogen degraders Xh 
+Readily and slowly degradable carbohydrates Xcb-S/Xcb-R 
+Readily and slowly degradable lipids Xl-S/Xl-R 
+Readily and slowly degradable protein Xp-S/Xp-R 
+LCFA degraders XLCFA 
+Sugar degraders Xs 
+Amino acid degraders Xam 
+Sludge concentration Xsl 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 	   	   6	   1	  	   	   	   	  
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+ 
+Table 17. Kinetic constants of the MADM1 model. 
+Substrate | Kinetic constants | Kinetic process (ρj) [T-1]* 
+Complex organic substrate | Ksbk | Disintegration of complex organic matter 
+Propionate | Kpro | Uptake of propionate 
+Acetate | Kac | Uptake of acetate 
+Total valerate and butyrate | Kc4 | Uptake of valerate and butyrate 
+Hydrogen | Kh | Uptake of hydrogen 
+Methane | Km | 
+Carbohydrate (slowly and readily biodegradable) | Kc-S/Kc-R | Hydrolysis of carbohydrates 
+Lipids (slowly and readily biodegradable) | Kl-S/Kl-R | Hydrolysis of lipids 
+Proteins (slowly and readily biodegradable) | Kp-S/Kp-R | Hydrolysis of proteins 
+LCFA | KLCFA | Uptake of LCFA 
+Sugars | Ks | Uptake of sugars 
+Amino acids | Kam | Uptake of amino acids 
+*Only in the case of Ksbk is the constant dimension [ML-2T-1]. 
+With respect to the MADM1, the proposed model modifies some of the kinetic equations listed in 
+Esposito et al. (2011a,b). Each kinetic constant (Ksbk, Kac and Kpro) is expressed as function of the TS 
+content in order to take into account the reduction of intermediate process kinetic on the following 
+processes: the initial substrate disintegration, the acetate and the propionate up-take. More precisely 
+assuming CSTR conditions and a constant reactor Volume (V), for each state variable (Ci), the mass 
+balance has the following form: 
+$$\frac{dC_i}{dt} = \frac{q\,C_{i,in}}{V} - \frac{q\,C_{i,out}}{V} + \sum_{j=1}^{23} \nu_{ij}\,\rho_j \qquad (8)$$
+where: 
+62
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+the term $\frac{q\,C_{i,in}}{V} - \frac{q\,C_{i,out}}{V}$ equals 0 in batch conditions, where the flow rate (q) is assumed to be zero, and 
+the term $\sum_{j=1}^{23} \nu_{ij}\,\rho_j$ is the overall reaction term, expressed as the sum of the specific kinetic rates of each 
+process j (ρj) multiplied by the stoichiometric coefficients (νij) that describe the influence of the 
+specific process j on the individual component i.  
+The specific kinetic rates and the stoichiometric coefficients used in the present model are strictly 
+equivalent to those present in the MADM1. 
+The main difference of the proposed model compared to the MADM1 is the capability to consider the 
+variation of the kinetic constants Ksbk, Kac and Kpro with the TS content. These constants are involved 
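+in the following specific kinetic rates:  
+$$\rho_{i,1} = K_{sbk} \cdot C \cdot a^{*} \qquad (9)$$
+$$\rho_{i,13} = K_{pro} \cdot \frac{S_{pro}}{K_s + S_{pro}} \cdot X_{pro} \cdot I_2 \qquad (10)$$
+$$\rho_{i,14} = K_{ac} \cdot \frac{S_{ac}}{K_s + S_{ac}} \cdot X_{ac} \cdot I_3 \qquad (11)$$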
+These equations have been reformulated by substituting the kinetic constants Ksbk, Kac and Kpro with 
+the following functions:  
+$$K_{sbk}(TS) = a \cdot TS + b \qquad (12)$$
+$$K_{ac,pro}(TS) = c \cdot TS + d \qquad (13)$$
+where the new parameters a, b, c and d need to be calibrated depending on the substrate type (in this 
+study rice straw and food waste) and the specific experimental conditions such as temperature, 
+pressure, pH, retention time and mixing conditions (Liotta et al. 2014). 
+ 
+5.3 Model calibration 
+The proposed model was calibrated using the experimental data obtained during anaerobic digestion 
+of food waste and rice straw. The experimental tests were conducted in batch, at 32°C, using two-liter 
+reactors. The following TS concentrations were tested: 4.2%, 12.8% and 19.2% for the food waste, 
+63
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+and 4.85%, 14.86% and 23.40% for the rice straw. The experimental procedures and the obtained 
+results are reported in Chapters 3-4. 
+The calibration was performed in two steps. In the first step, the simulated curves were plotted for 
+each value of Kac, Kpro and Ksbk, and the simulated results were compared with experimental data by 
+applying the RMSE method, as usually done for the model calibration process (Janssen and 
+Heuberger 1995; Esposito et al. 2011a, b). In the second step, the values of each Kac, Kpro, Ksbk 
+associated with the lowest RMSE that better fit the proposed equations (12, 13) were introduced in the 
+model to perform a second set of simulations. These modelling results were again compared with 
+experimental data by determining the final RMSE values for each Kac, Kpro and Ksbk value. The final 
+results of the calibration procedure are summarized in Figures 29-31 and Table 18. In particular the 
+experimental data were used for both substrates to calibrate the disintegration kinetic constants Kdis of 
+the ADM1, assuming it coincides with the constant Ksbk of the MADM1, as the specific surface did 
+not vary in the different tests. Acetic and propionic acid productions were used to calibrate the 
+constants Kac and Kpro. All the other constants and parameters were set from literature data (Batstone 
+et al. 2002; Esposito et al. 2008, 2011a, b).  
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   6	   4	  	   	   	   	  
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+(A) (B)
+0.16 0.16
+0.14 0.14
+0.12 0.12
+0.1 0.1
+0.08 0.08
+0.06 0.06
+0.04 0.04
+0.02 0.02
+0 0
+0 10 20 30 40 50 0 0.04 0.08 0.12 0.16
+Time [d] Measured CH4 [mol] 	  
+(C) (D)
+0.4 0.4
+0.35 0.35
+0.3 0.3
+0.25 0.25
+0.2 0.2
+0.15 0.15
+0.1 0.1
+0.05 0.05
+0 0
+0 10 20 30 40 0 0.1 0.2 0.3 0.4
+Time [d] Measured CH4 [mol] 	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  
+(E) (F)
+0.6 0.6
+0.5 0.5
+0.4 0.4
+0.3 0.3
+0.2 0.2
+0.1 0.1
+0 0
+0 10 20 30 40 0 0.1 0.2 0.3 0.4 0.5 0.6
+Time [d] Measured CH4 [mol]  
+Figure 29. Comparison of measured (points) and simulated (continuous line) data of cumulative 
+methane production for experiments with food waste at A, B) TS = 4.52%; C, D) TS = 12.87%; E, F) 
+TS = 19.02%. 
+	   	   6	   5	  	   	   	   	  
+CH4 [mol] CHCH  [mol] 4
+ [mol]
+4
+Simulated CH  [mol] Simulated CH  [mol]
+Simulated CH4 [mol]
+4 4
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+(A) (B) x 10-3 (C) x 10-3 (D)
+0.018 0.035 6 1
+0.016 0.9
+0.03
+5
+0.014 0.8
+0.025 0.7
+0.012 4
+0.6
+0.01 0.02
+3 0.5
+0.008 0.015
+0.4
+0.006 2
+0.01 0.3
+0.004 0.2
+1
+0.005
+0.002 0.1
+	  	  	  	  	  	   0 0 0 00 20 40 60 0 20 40 60 0 20 40 60 0 20 40 60Time [d] Time [d] Time [d] Time [d] 	  
+(E) (F) (G) x 10-3 (H)
+0.045 0.07 0.025 6
+0.04
+0.06
+5
+0.035 0.02
+0.05
+0.03 4
+0.015
+0.025 0.04
+3
+0.02 0.03
+0.01
+0.015 2
+0.02
+0.01 0.005
+1
+0.01
+0.005
+	  	  	  	  	   0 0 0 00 20 40 60 0 20 40 60 0 20 40 60 0 20 40 60Time [d] Time [d] Time [d] Time [d] 	  
+(I) (L)
+0.05 0.07 (J) (K)0.07 0.01
+0.045 0.009
+0.06 0.06
+0.04 0.008
+0.035 0.05 0.05 0.007
+0.03
+0.04 0.0060.04
+0.025 0.005
+0.03
+0.02 0.03 0.004
+0.015 0.02 0.02 0.003
+0.01 0.002
+0.01 0.01
+	  	   0.005 0.00100 20 40 60 00 20 40 60 0 00 20 40 60 0 20 40 60Time [d] Time [d] Time [d] Time [d] 	  
+Figure 30. Comparison of measured (points) and simulated (continuous line)	   data for experiments with food waste: A-D) TS = 4.52%; E-H) TS = 12.92% and I-K) TS = 19.02%. 
+ 
+	   	   6	   6	  	   	   	   	  
+propionate [mol] propionate [mol] propionate [mol]
+acetate [mol] acetate [mol] acetate [mol]
+butirate [mol] butirate [mol] butirate [mol]
+valerate [mol] valerate [mol]
+valerate [mol]
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+(A) (B) x 10-3 (C)
+1.8 x 10
+-3 (D)
+0.14 0.14 3
+1.6
+0.12 0.12 2.5
+1.4
+0.1 0.1
+1.2 2
+0.08 0.08 1
+1.5
+0.06 0.06 0.8
+0.6 1
+0.04 0.04
+0.4
+0.02 0.02 0.5
+0.2
+0 0 0 0
+0 20 40 60 0 0.05 0.1 0.15 0.2 0 20 40 60 0 20 40 60
+Time [d] Measured CH4 [mol] Time [d] Time [d] 	  
+(E) (F) x 10-3 (G) x 10-3 (H)
+0.12 0.12 7 6
+6
+0.1 0.1 5
+5
+0.08 0.08 4
+4
+0.06 0.06 3
+3
+0.04 0.04 2
+2
+0.02 0.02 1
+1
+0 0 0 0
+0 20 40 60 0 0.05 0.1 0.15 0.2 0 20 40 60 0 20 40 60
+Time [d] Measured CH4 [mol] Time [d] Time [d] 	  
+(I) (L) (J) x 10-3 (K)
+0.25 0.25 0.02 9
+0.018 8
+0.2 0.2 0.016 7
+0.014
+6
+0.15 0.15 0.012
+5
+0.01
+4
+0.1 0.1 0.008
+3
+0.006
+0.05 0.05 0.004 2
+0.002 1
+0 0 0 0
+0 20 40 60 0 0.1 0.2 0.3 0.4 0 20 40 60 0 20 40 60
+Time [d] Measured CH4 [mol] Time [d] Time [d] 	  
+Figure 31. Comparison of measured (points) and simulated (continuous line) data for experiments 
+	  with rice straw: A-D) TS = 4.85%; E-H) TS = 14.86%; I-K) TS = 23.4%. 
+	  	  
+	   	   6	   7	  	   	   	   	  
+CH4 [mol] CH4 [mol] CH4 [mol]
+Simulated CH4 [mol] Simulated CH4 [mol] Simulated CH4 [mol]
+propionate [mol]
+propionate [mol] propionate [mol]
+acetate [mol] acetate [mol] acetate [mol]
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+ 
+Table 18. Kinetic constant for disintegration and VFA at different TS concentrations for food waste 
+and rice straw.  
+	  
+TS Kdis RMSE Kac RMSE Kpro RMSE 
+Substrate 
+[%] [d-1] [d-1] [d-1] 
+4.52 6.5 0.0072 8.47 0.0076 8.47 0.0052 
+Food Waste 12.8 4 0.01 5.08 0.019 5.08 0.019 
+19.02 2 0.0065 2.46 0.011 2.46 0.021 
+ 4.85 2.5 0.01 8.79 0.005 8.79 0.005 	  
+Rice Straw 14.86 1.25 0.009 5.94 0.001 5.94 0.0019 	  
+ 23.40 0.65 0.0073 3.51 0.001 3.51 0.0055 
+ 
+5.4. Results and discussion 
+Table 18 and Figure 32 show that for both substrates the calibrated disintegration rate constant 
+linearly decreased with increasing TS concentration. The linear function (12) can 
+be expressed in this case as follows:  
+For food waste: Kdis = −0.31⋅TS + 7.9  with r2 = 0.99    (14) 
+For rice straw: Kdis = −0.1⋅TS + 2.9     with r2 = 0.97               (15) 
+Where Kdis is assumed to be coincident with Ksbk.  
+The values of parameters a, b are different for the two tested substrates because of the specific 
+characteristic of the initial substrate to be hydrolysed. In fact food waste is a more easily 
+biodegradable substrate compared to rice straw that is a complex lignocellulosic structure more 
+difficult to be disintegrated. In fact, the structure of rice straw consists of different types of polymers 
+that are difficult to degrade such as: cellulose (37.4%), hemi-cellulose (44.9%), lignin (4.9%) and 
+silicon ash (13%) (Hills and Robert 1981; Mussoline et al. 2013). Thus for each TS the rice straw 
+disintegration rate constant (and the values a, b) are lower than the one of food waste. These results 
+are consistent with results previously presented by Liotta et al. (2014), where a linear correlation with 
+r2 = 0.99 was found between the carrot waste disintegration rate constant and TS in the range of wet 
+conditions. 
+	   	   6	   8	  	   	   	   	  
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+The linear correlations (14, 15) describe the slowing-down of the disintegration process with higher 
+values of the TS content caused by the lack of water and the limited transfer of hydrolysis products 
+(and other intermediates) to bacterial sites (Lay et al. 1997a, 1997b; Mora-Naranjo et al. 2004; 
+Pommier et al. 2007). This is in agreement with results presented by Abbassi Guendouz et al. (2012), 
+Pommier et al. (2007) and Liotta et al. (2014), who observed a strong impact of the TS content on 
+biodegradation kinetic rates and maximum methane production in anaerobic digestion of different 
+substrates.  
+Figure 33 shows that for both substrates, a linear and inverse correlation exists between the values of 
+the propionate and acetate kinetic constants and the TS content. In this case, a unique linear function, 
+as reported in (13), can be expressed for acetate and propionate as follows:  
+For food waste: Kac/pro = −0.41⋅TS + 10.35  with r2 > 0.99   (16) 
+For rice straw:  Kac/pro = −0.28⋅TS + 10.71  with r2 > 0.97   (17) 
+The values of parameters c, d in equations (16, 17) are the same for acetate and propionate. This 
+means that the kinetic rate constants for acetate and propionate are equal for each TS content. Thus, it 
+can be concluded that the effect of the water content on propionate and acetate up-take is equal.  
+Also in this case the parameters c, d differ depending on the initial substrate type because of different 
+experimental conditions and biomass involved in the anaerobic degradation of food waste and rice 
+straw. Additionally there are larger differences between the values of Kac/pro for rice straw and food 
+waste with higher TS. Thus, the intrinsic characteristics of the substrate type are more influential on the 
+process development and biomass selection with a lack of water.  
+This study shows that with a higher TS content lower values of Kac/pro are obtained, which determine 
+higher concentrations of acetate and propionate during the whole process (Figures 30-31). This means 
+that a higher TS content can lead to process inhibition due to VFA accumulation, implying lower 
+process efficiency in terms of VS degradation, final methane yield and specific methane production 
+rate. Indeed,  Figures 30-31 show a lower level of inhibition for the experiments under wet digestion 
+conditions (TS = 4.52% for the food waste and TS = 4.85% for the rice straw), compared to the 
+experiments under semi-dry (TS = 12.87% and TS = 14.86%) or dry (TS = 19.2% and TS = 23.4%) 
+anaerobic conditions. This is probably due to a reduction of the water content that implies a lower 
+nutrient content in the media and TVFAs accumulation.  
+Despite the good fitting between simulated and experimental concentrations, showing the capability 
+of the model to simulate the AD process of the two substrates with different initial TS, it is worth 
+69
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+noting that the model fitting is of higher quality for the data obtained during rice straw digestion. For 
+food waste, Figures 30e and 30i show that some points could not be fitted by the simulated curves. 
+This means that an inhibition phenomenon, related to the difficult degradation of propionic acid and 
+consequent formation of propionate isomers during the process not taken into account in the 
+simulation, should be considered in the further development of the kinetic equations of the model. 
+This different behaviour can be related to the nature of the substrate type. Food waste is of complex 
+nature and contains many different compounds that have different degradation kinetics. In contrast, a 
+unique substrate like rice straw, presents a kinetic behaviour easier to be modelled.  
+	  
+Figure 32. Linear correlation between disintegration kinetic constant and TS for rice straw and food 
+waste. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+Figure 33. Linear correlation between propionate and acetate kinetic constants and TS content for rice 
+straw and food waste. 
+ 
+ 
+ 
+	   	   7	   0	  	   	   	   	  
+CHAPTER 5 - ADM1 FOR DRY AND SEMI-DRY ANAEROBIC DIGESTION OF SOLID 
+ORGANIC WASTE 
+5.5 Conclusion  
+• A mathematical model capable of simulating dry anaerobic digestion of selected complex 
+organic substrates such as rice straw and food waste is proposed.  
+• Model calibration resulted in the determination of the disintegration and VFA kinetic 
+constants for different TS contents in the range of 4.5%-23%. 
+• The good fitting of the bio-methanation tests data with the model simulation results for both 
+methane production and VFA concentrations confirms the suitability of the model.  
+• A linear equation that correlates the TS content with the disintegration kinetic constant was 
+proposed and included in the model MADM1. 
+• A linear equation that correlates the TS content with the acetate and propionate kinetic 
+constants was proposed and included in the model MADM1. 
+	  	  
+	   	   7	   1	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+	  	  	  	  
+	  	  	  
+	  	  	  
+CHAPTER 6 
+Literature Review 
+	   
+	  	  	  
+	  	  
+The paragraph 6.1 is the modified version of the article: 
+Flavia Liotta, Patrice Chatellier, Giovanni Esposito, Massimiliano Fabbricino, Eric D. van Hullebusch 
+& Piet N. L. Lens. (2014). Hydrodynamic mathematical modeling of aerobic plug flow and non-ideal 
+flow reactors: a review, Crit. Rev. Env. Technol. DOI:10.1080/10643389.2013.829768 
+ 
+The paragraph 6.2 is the modified version of the article: 
+Flavia Liotta, Patrice Chatellier, Giovanni Esposito, Massimiliano Fabbricino, Eric D. van Hullebusch 
+& Piet N. L. Lens. Current views on hydrodynamic models of non-ideal flow anaerobic reactors, 
+submitted to Crit. Rev. Env. Technol. (under review). 
+	   	   7	   2	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+6.1 Mathematical modelling of aerobic plug flow reactor and non-ideal flow reactor 
+6.1.1 Introduction 
+Mathematical modelling and dynamic simulation have become important tools for design and 
+operation of wastewater and solid waste treatment plants. However, semi-empiric methods and 
+mathematical models based on ideal assumptions are still used for routine reactor design and 
+operation. For instance, biochemical models for the evaluation of the bioconversion processes 
+prevailing in CSTR, such as the IAWPRC Activated Sludge Model (ASM1) (Henze et al. 1987) and 
+modelling tools to evaluate system design and upgrade options, such as the ATV models (ATV 1991; 
+Benedetti et al. 2008) are widely applied. However, these models do not include the hydrodynamics of 
+the bioreactor. This is a limitation for the model suitability as many authors claim that the efficiency of 
+the pollution removal process depends also on the reactor hydrodynamics (Levin and Gealt 1993; Le 
+Moullec et al. 2008; Makinia and Wells 1999).  
+Several authors in the presented models couple the hydrodynamic processes with biochemical 
+processes and consider in the model the effect of one process on another. In particular the biochemical 
+process can be affected by the reactor flow conditions because the biomass, substrates and inhibiting 
+compounds can be distributed in different reactor zones. This implies that the biochemical process can 
+occur with different kinetics depending on hydrodynamic condition. Inhibition could also happen due 
+to the accumulation of some inhibitory compounds in specific reactor zones. In parallel, the biomass 
+type developing in the reactor influences the viscosity of the mixed liquor and thus the hydrodynamics 
+of the reactor. The objective of this literature review is, therefore, to review mathematical models of 
+aerobic reactors going beyond the hypothesis of complete mixing conditions and focusing only on 
+hydrodynamic aspects and on the role of reactor configuration on the process performances. The 
+present research also analyses and compares performance-prediction models referring to the most 
+common aerobic bioreactors configurations, i.e. Activated Sludge Reactors (AS), Fluidized Bed 
+Reactors (FBR), Biofilters (BF) and Trickling Filters (TF), and addresses both plug flow reactors and 
+non-ideal flow reactors. Finally, the chapter illustrates in more detail the differences among the 
+proposed approaches, indicates the adopted solving algorithms and discusses the capacity of the 
+models to fit the experimental data.  
+ 
+	   	   7	   3	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+6.1.2. Design models and performance-prediction models 
+A design model is a model capable of predicting the reactor volume when the desired treatment 
+efficiency and the operational conditions are set. It is typically based on simplified assumptions 
+aiming to make the model easy to apply. For instance, steady-state instead of dynamic conditions are 
+assumed. In the literature, there are few attempts to use steady-state mathematical models to design 
+PFR and non-ideal flow reactors (San 1994) (Table 19). They are often simply modelled in terms of 
+design graph or charts (San 1994). These steady-state models are however beyond the scope of this 
+chapter. In contrast, a performance-prediction model is typically a dynamic model that simulates most 
+of the physical, chemical and biological processes taking place in the reactor. It is aiming to predict 
+the effluent concentrations once the bioreactor volume is known and the operational conditions are 
+set. Table 20 gives some performance-prediction models published in the literature. They are 
+reviewed in detail in this chapter, after a short description of the fundamentals of the adopted 
+approaches. The attempts made by the authors to calibrate or validate these models are described as 
+well. 
+ 
+Table 19. Design model of Activated Sludge and Fluidized Bed Reactor 
+ 
+Reactor  References 
+Activated Sludge   San (1994);   
+ Muslu (2000)  
+ Fluidized Bed Reactor  Shieh et al. (1982) 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   7	   4	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+ 
+Table 20. Performance prediction mathematical models 
+   San (1989); San (1992); 
+ Activated Sludge  Lawrence and McCarty (1980);  Olsson and Andrews (1978);  
+               PFR Fluidized Bed  Shieh et al. (1982);	  
+Biofilter and  Meunier and Williamson (1981);  
+Trickling Filters Baquerizo et al. (2005); Jacob et al. (1996);	  
+ Milbury et al. (1965); 
+       TIS/TIS derived Activated Sludge Braha and Hafner (1985);  
+Muslu (2000a,b). 
+Fluidized Bed  Yu et al. (1999)
+Biofilter and  Fdz-Polanco et al. (1994);	  
+Trickling Filters 
+ Martinov et al. (2010); Mezaoui 
+ (1979); Nyadziehe (1980); 
+         Activated Sludge Sant'Anna (1985); De Clercq et al. 
+  (1999); Turian et al. (1975); Lee et 
+ al. (1999a,b); 
+ Olsson and Andrews (1978); Makinia and Wells (2000); 
+ El-Temtamy et al. (1979a,b);  
+ Muroyama and Fan (1985);  
+                Dispersion  Fluidized Bed  Davidson et al. (1985);
+ Lin (1991);  
+Kim and Kang (1997); 
+Michelsen and Østergaard (1970).	  
+Froment and Bischoff 1990;  
+Biofilter and Trickling Séguret and Racault (1998); Muslu 
+Filters (1990); Muslu (1984); 
+Muslu and San 1990; Séguret et al. (2000)
+ Activated Sludge Le Moullec et al. (2010a,b); Glover 
+ (2006) 
+                 CFD Fluidized Bed  	  
+Biofilter and  Iliuta and Larachi (2005)	  
+Trickling Filters 
+ 
+ 
+	  	  	  
+	   	   7	   5	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+6.1.3 Modeling approaches 
+Hydrodynamic models can be generally divided into two different groups: ideal models, referring to 
+CSTR and PFR conditions, and non ideal models, taking into account the effect of longitudinal 
+mixing neglected by ideal models (Table 21). In the CSTR model, the inlet reactant is assumed to be 
+completely mixed in the reactor so that concentrations are homogeneous in the vessel. 
+The mass-balance equation for a non-reactive tracer in a CSTR is: 
+$$V \frac{dC_{ex}}{dt} = Q \cdot C_{in} - Q \cdot C_{ex} \qquad (18)$$
+where:  
+t = time [T]; 
+V = reactor control volume [L3]; 
+Q = volumetric flow rate [L3T-1]; 
+C = reactant concentration [ML-3]; 
+in = subscript denoting influent;  
+ex = subscript denoting effluent;  
+In the PFR, it is assumed that no longitudinal mixing occurs between adjacent elements of the fluid 
+and each element of the influent reactant remains in the reactor for a time equal to the hydraulic 
+retention time (HRT).  
+The mass-balance for a non-reactive tracer is: 
+$$\frac{\partial C}{\partial t}\, dV = Q \cdot C - Q \cdot \left( C + \frac{\partial C}{\partial x}\, dx \right) \qquad (19)$$
+where: 
+x = spatial variable in the flow direction [L]. 
+Under unsteady-state conditions, equation (19) may be written as: 
+$$\frac{\partial C}{\partial t} = -v \cdot \frac{\partial C}{\partial x} \qquad (20)$$
+where: 
+v = flow velocity [LT-1]. 
+Among non-ideal models, a prominent role is played by the tank-in-series (TIS) model. This model is 
+used to describe the dispersion in PFR. The TIS model describes the flow in a reactor system 
+considering it can be discretized into a series of equal-sized hypothetical CSTRs. This modeling 
+76
+CHAPTER 6 – LITERATURE REVIEW 
+approach was introduced for tracer analyses and one of the earliest descriptions of this theory was 
+given by MacMullin and Weber (1935).  
+If a tracer is distributed uniformly throughout all the compartments of the vessel and then diluted out 
+at a constant rate, the effluent tracer concentration Cex as a function of time is given by (Martin, 2000):  
+$$\frac{C_{ex}}{C_{in}} = \frac{N^N}{(N-1)!} \left( \frac{t}{\tau} \right)^{N-1} e^{-N t/\tau} \qquad (21)$$
+where: 
+N = number of reactor in series.  
+Levenspiel (1972) related the number of reactors in series to the variance number with the following 
+expression: 
+$$\sigma^2 = \frac{1}{N} \qquad (22)$$
+where: 
+σ2 = variance of Residence Time Distribution (RTD) curve from a pulse tracer input.  
+Generally, N = 1 represents a CSTR, whereas N = ∞ means a PFR. 
+With respect to the previous approach, the extended tank-in series model (ETIS) (Murphy and 
+Timpany 1967) presents a small difference, as it introduces the concept of non-integer number of 
+hypothetical tanks in series to remove the quantization problem which occurs as N tends to 1. The 
+ETIS model defines the exit age distribution function, E(t), through the following equations: 
+$$E(t) = \frac{C_{ex}}{C_{in}} = \frac{N^N}{\Gamma(N)} \left( \frac{t}{\tau} \right)^{N-1} e^{-N t/\tau} \qquad (23)$$
+$$\Gamma(N) = \int_0^{\infty} e^{-v} \cdot v^{(N-1)}\, dv \qquad (24)$$
+Consequently, the N parameter loses its physical meaning as a number (positive) of tanks in the ETIS 
+model, but the model acquires a continuous distribution of flow-rate. The ETIS model coincides with 
+the TIS model when the parameter N is an integer number. This model is particularly useful when N is 
+small and a large number of discontinuities occurs in the TIS model due to the discrete nature of the 
+parameter N. A further variation of the TIS model consists in fractionating the reactor in different 
+sections, e.g. a CSTR section, a PFR section and a dead section with by-pass flows or back-mixing 
+flows between the zones. With tracer tests and considering different liquid and gas flow rates, it is 
+possible to define the values of bypass flows and dead sections. 
+	   	   7	   7	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+Apart from the TIS and TIS-derived models, other approaches have been followed to describe the 
+dispersion effect. One of the pioneering and most complete studies on longitudinal mixing in aeration 
+tanks was published by Thomas and McKee (1944). They demonstrated that longitudinal mixing is 
+the effect of various factors as the degree of turbulence, the flow rate, the length of the tank and the 
+number of baffles. The authors set up the dispersion model introducing the differential equation for a 
+tubular reactor with longitudinal diffusion as well as flow (changes in volume were assumed not to 
+occur, so that the mean longitudinal velocity is the same at all cross-sections). The resulting equation 
+is: 
+$$\frac{\partial C}{\partial t} = D \frac{\partial^2 C}{\partial x^2} - v \frac{\partial C}{\partial x} \qquad (25)$$
+where: 
+D = dispersion coefficient [L2T-1].  
+Equation (25) was solved considering as initial boundary conditions that the concentration gradient 
+was equal to the initial concentration and by assuming that the exit gradient was equal to zero at the 
+end of the reactor.  
+The authors calculated the dispersion coefficient as:  
+$$D = \frac{180 \cdot L^2}{\pi^2 \cdot t_{90}} \qquad (26)$$
+where: 
+L = reactor length [L]; 
+t90 = time required for the effluent concentration to attain 90% of its ultimate value [T].  
+The dispersion number, $\bar{D}$, is defined as: 
+$$\bar{D} = \frac{D}{v \cdot L} \qquad (27)$$
+$\bar{D}$ plays an important role in indicating which of the ideal flow models is approached. When $\bar{D}$ is higher 
+than 0.5-4, complete mixing can be assumed (Khudenko and Shpirt 1986; U.S. EPA 1993; Makinia 
+and Wells 1999). Long and narrow tanks, with a dispersion number lower than 0.05-0.2 (Khudenko 
+and Shpirt 1986; U.S. EPA 1993; Eckenfelder et al. 1985; Makinia and Wells 1999) are considered an 
+approximation of plug flow. Typical dispersion numbers in wastewater treatment units are in the range 
+between 0.1 and 4, which suggests that the existing deviations from ideal flow have to be taken into 
+consideration (Makinia and Wells 2005; Makinia and Wells 1999). 
+	   	   7	   8	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+With regard to the integration of the equations, an algebraic solution is possible for simple models 
+based on CSTR or CSTR in series configurations, whereas finite difference techniques or 
+Computational Fluid Dynamics (CFD) are required for more complex models.  
+ 
+Table 21. Modelling approach: PFR, CSTR, TIS, Dispersion model, CFD – basic concept and equation 
+ 
+| Modelling approach | Basic concept | Equation |
+|---|---|---|
+| Ideal PFR | No longitudinal mixing occurs between adjacent elements of fluid. | $\frac{\partial C}{\partial t} = -v \cdot \frac{\partial C}{\partial x}$ |
+| Ideal CSTR | The concentration is assumed to be homogeneous in the reactor. | $\frac{C_{ex}}{C_{in}} = e^{-t/\tau}$ |
+| TIS | The flow is discretized into a series of hypothetical CSTRs. | $\frac{C_{ex}}{C_{in}} = \frac{N^N}{(N-1)!} \left( \frac{t}{\tau} \right)^{N-1} e^{-N t/\tau}$ |
+| Dispersion model | Differential equation that includes longitudinal diffusion and advection terms. | $\frac{\partial C}{\partial t} = D \frac{\partial^2 C}{\partial x^2} - v \frac{\partial C}{\partial x}$ |
+| CFD | A technique applied to solve fluid dynamics models on digital computers. | Discretizes the reactor using a computational grid and includes the fundamental mass, momentum and energy conservation equations. |
+ 
+6.1.4.Mathematical modeling of Activated Sludge plug flow reactors 
+6.1.4.1 Process description 
+The activated sludge process is used for the biological treatment of municipal and industrial 
+wastewaters. The basic activated sludge treatment process (Fig. 34A) consists of the following three 
+components: i) a flocculent slurry of mixed liquor suspended solids (MLSS) utilized in the bioreactor 
+79
+CHAPTER 6 – LITERATURE REVIEW 
+to remove soluble and particulate organic matter from the influent waste stream; ii) a sedimentation 
+tank to separate the MLSS from the treated water and iii) a recycle system to return solids removed 
+from the liquid-solids separation unit back to the bioreactor.  
+The MLSS containing bioreactor is commonly called an aeration basin. It is an open tank equipped 
+with a system to transfer oxygen into solution to provide mixing energy to guarantee suspension of the 
+MLSS. Models taking into account the hydrodynamics of the plug flow aeration basin, that could 
+affect key parameters of the process such as treatment efficiency or settling properties of the activated 
+sludge, are described below. 
+ 
+6.1.5. Model development 
+6.1.5.1 Ideal PFR and CSTR in series 
+The ideal plug-flow model has been frequently applied to plug flow activated sludge systems (Fig. 
+34B). Lawrence and McCarty (1970), assuming steady-state conditions, proposed the following 
+equation for processes that occur in the aeration basin based on the hypothesis of constant biomass 
+concentration in the reactor, valid as long as the SRT/HRT ratio is higher than 5: 
+$$\frac{dC}{dt} = -\mu \cdot \frac{C \cdot \bar{X}}{k_s + C} \qquad (28)$$
+where: 
+$\bar{X}$ = time averaged biomass concentration [ML-3]; 
+ks = saturation coefficient [ML-3]; 
+µ = maximum specific growth rate [T-1]. 
+San (1989, 1992) considered the same mass balance equation proposed by Lawrence and McCarty 
+(1970) for the reactant at steady-state conditions. Taking also into account the time variation of the 
+biomass concentration in the reactor and introducing the settler in the process configuration, they 
+obtained the following differential equations: 
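+$$\frac{dC}{dt} = -\mu \cdot \frac{1}{Y} \cdot \frac{C \cdot X}{k_s + C} \cdot \left( \frac{1}{1 + R} \right) \qquad (29)$$
+$$-\frac{dX}{dt} = Y \cdot \frac{dC}{dt} + \frac{k_d \cdot X}{1 + R} \qquad (30)$$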
+where:  
+X = biomass concentration [ML-3]; 
+80
+CHAPTER 6 – LITERATURE REVIEW 
+ks = saturation coefficient [ML-3];  
+R = sludge recycle ratio;  
+µ = maximum specific growth rate [T-1]; 
+Y= yield coefficient; 
+kd = decay coefficient [T-1].  
+Equations (29) and (30) were solved by San (1989, 1992) using the following boundary conditions, 
+obtained from the mass balances of substrate and biomass concentration at the mixing point of fresh 
+feed and recycled flow (Fig. 34B), also proposed by Tuček et al. (1971): 
+$$C_{mix} = \frac{C_{in} + R \cdot C}{1 + R} \qquad (31)$$
+$$X_{mix} = \frac{X_{in} + R \cdot X_r}{1 + R} \qquad (32)$$
+where:  
+r = subscript denoting the return flow; 
+mix = subscript denoting the combined flow entering in aeration basin; 
+in = subscript denoting the inlet flow in the activated sludge system constituted of aeration basin and 
+settler. 
+Another attempt to use the ideal plug flow approach for activated sludge plug flow reactors, was done 
+by Olsson and Andrews (1978) who proposed a model that simulates the substrate, biomass and 
+oxygen concentrations as a function of time and the spatial variable. 
+To the best of our knowledge, one of the first attempts to model a plug flow reactor with a tank in 
+series configuration was done by Milbury et al. (1965). Following this work also Murphy and 
+Timpany (1967); Braha and Hafner (1985) and Muslu (2000a,b) modeled the plug flow reactor as a 
+multiple tanks in series configuration. In particular Muslu (2000a,b) applied the old work of Milbury 
+et al. (1965), removing some hypotheses of their proposed model. In particular they changed the 
+biochemical model and proposed a new modeling approach where the axial change in biomass 
+concentration is considered by writing two mass balance equations for biomass and reactant and 
+considering a series of equal-sized, completely mixed reactors (Fig. 34 C) to represent the PFR 
+reactor.  
+A steady state mass balance is considered for the biomass and substrate. The resulting equations that 
+represent the effluent concentration of substrate and biomass from each reactor in dimensionless form 
+are: 
+	   	   8	   1	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
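+$$\bar{C}_{ex} = \frac{C_{ex}}{k_S} = \frac{1 + \dfrac{k_d \cdot \tau}{N} - \dfrac{X_{in}}{X_{ex}}}{\dfrac{(\mu - k_d) \cdot \tau}{N} - 1 + \dfrac{X_{in}}{X_{ex}}} \qquad (33)$$
+$$\bar{X}_{ex} = \frac{X_{ex}}{Y \cdot k_S} = \frac{\bar{X}_{in} + \bar{C}_{in} - \bar{C}_{ex}}{1 + \dfrac{k_d \cdot \tau}{N}} \qquad (34)$$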
+These equations have to be solved using trial and error procedures.  
+(1+R)Q  C          C+ΔC  (1+R)Q
+              X                   X+ΔX
+influent effluent Q C
+ o            Ci            Q1, C1 Q-Qww
+Q  C Q0 Cex  Xo                  Xi0 in Plug              X1
+flow Aeration
+Tank
+Qr+Qw       Qw,C
+sludge Qr,C                    Xw
+recycle
+          Xr Xr,C
+A. Schematic configuration of an activated sludge system B. Representation of plug flow model for activated sludge system
+            Q  C              Ci              Ce              C Q0-Q4Q  C 1 i 20 in
+              X              Xi              Xe              X C2 X5X iin 2       
+Q3+Q4
+Q3,C3 C2 X3
+          X3                  Q4
+C. Reactor in series with sludge return
+                                      Figure 34. Schematic representation of activated sludge reactor. 
+ 
+    
+6.1.5.2 Non ideal flow reactor models 
+In the plug flow aeration basin of the activated sludge process, high aeration rates, high transverse 
+velocities and irregular air distribution can cause high transverse and axial mixing. Therefore, it is not possible to 
+describe the process with ideal plug flow equations. Thus several authors (San 1989; Lee et al. 1999a; 
+Wehner and Wilhelm 1956) described non-ideal conditions, caused by axial mixing, with the 
+following advective-diffusive equation including a reaction term: 
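+$$\frac{\partial C}{\partial t} + \frac{\partial (v \cdot C)}{\partial x} = \frac{\partial}{\partial x} \left( D \frac{\partial C}{\partial x} \right) + R_C \qquad (34)$$
+82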
+CHAPTER 6 – LITERATURE REVIEW 
+where:  
+RC = reaction term [ML-3T-1]. 
+In particular, Khudenko and Shpirt (1986) did not introduce the reaction term in the equation (34), but 
+coupled this equation to the oxygen mass transfer equation to find the optimal sizes to the aeration 
+tank and aeration system. 
+San (1992) developed an analytical solution for the differential equations of dispersed plug flow 
+systems in steady-state conditions, including a reaction term based on Monod kinetics. Lately the 
+same author (San 1994) introduced the following differential equations to simulate the effect of feed 
+and outlet channels: 
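+$$\frac{1}{Pe} \frac{d^2 C}{dx^2} - \frac{dC}{dx} = 0 \qquad x \notin [0, 1] \qquad (35)$$
+$$\frac{1}{Pe} \frac{d^2 C}{dx^2} - \frac{dC}{dx} - \frac{\tau \cdot \mu \cdot X}{Y \cdot k_S} \cdot \frac{C}{1 + C} = 0 \qquad x \in [0, 1] \qquad (36)$$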
+where: 
+Pe = Peclet number. 
+Equations (35) and (36) were solved using boundary conditions introduced by Wehner and Wilhelm 
+(1956), resulting from the conservation of reactants at the exit and entrance of the reactor, taking into 
+account flow and diffusion, and from the intuitive argument that the concentrations should be 
+continuous between the reactor entrance and exit sections in steady-state conditions. 
+Turian et al. (1975), Lee et al. (1999a, 1999b) and Makinia and Wells (2000a,b) incorporated a more 
+comprehensive chain of biological reactions into the dispersion flow reactor model in unsteady state 
+conditions. Olivet et al. (2005) proposed tanks in series model to simulate the hydrodynamic 
+behaviour of a full scale plant. In particular a four tank in series model was developed. The authors 
+also included a dead zone to simulate the reactor zone with diffusers. Furthermore, the hydraulic 
+model includes the external recycle from the secondary settler. RTD tests were done to find the model 
+that better describes the reactor hydraulic behaviour. Also Potier et al. (2005) simulated full scale 
+aerated channels treating wastewater by applying a tanks in series model with back-mixing. The 
+authors considered in the model the variations of the wastewater characteristics (concentration and 
+composition of polluted influent, flow-rate, etc.). They also demonstrated that it is possible to simulate 
+easily the variations of the axial dispersion coefficient with the flow-rate through this model with a 
+maximal fixed number of mixing cells and a variable backflow rate. The authors also found several 
+	   	   8	   3	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+correlations of the dispersion coefficient with reactor width, reactor length and gas flow-rate as 
+reported below:  
+$$D = 0.2032 \cdot H \cdot \left( \frac{Q_G}{L} \right)^{0.5} \qquad (37)$$
+where:  
+QG = gas flow-rate [ML-3]. 
+In another paper, Fall and Loaiza-Navia (2007) modelled with AQUASIM Software a full-scale 
+activated sludge reactor by applying the CSTR in series model. The authors also validated the model 
+by operating tracer tests. Lately, Ramin et al. (2011) modelled the activated sludge reactor also 
+including a settling tank. The authors also performed a sensitivity analysis with the Monte Carlo 
+method and uncertainty method and applied the convection-dispersion model. 
+6.1.5.3 Computational fluid dynamics model development 
+All the models described above are called “systemic models”, because they emphasize the functional 
+aspects of the reactor, without detailing the localization of the phenomena inside the reactor. Thus, 
+they give quite rapidly and with moderate efforts a first approximation of the reactor behavior. These 
+models have a good robustness in the range of experimental and size conditions for which they have 
+been developed (Le Moullec 2010b). However, they could remain unsatisfactory to consider local 
+phenomena and to model the influence of the reactor geometry (length/width ratio, presence of 
+baffles, effluent inlet device), the aeration process (sparging device, gas fraction field) and the 
+resulting local mixing (Le Moullec 2010a).  
+In the last few years some attempts were made to model the activated sludge reactor using a new 
+approach: a Computational Fluid Dynamics (CFD) model. It is a powerful tool which allows studying 
+the influences of the operating parameters and the hydrodynamic phenomena at local scale (Le 
+Moullec 2010b). With a structural approach a CFD model discretizes the reactor using a 
+computational grid, formulates and solves the fundamental mass, momentum, and energy 
+conservation equations in space (Huang et al. 2005). CFD simulations can define the flow patterns and 
+the retention time distribution to characterize the reactor hydraulic behavior. This information 
+provides a hint to the role of possible hydraulic problems related to the bad plant performance.  
+	   	   8	   4	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+Alex et al. (2002) were among the first authors in the literature to use the CFD approach to generate 
+an appropriate model structure to simulate the biological processes in CSTR activated sludge 
+compartments. The first authors who implemented the ASM1 into the CFD code through the use of 
+classical convective scalar transport equations were Glover et al. (2006). The obtained model, 
+subsequently called CFD-ASM1, was then analysed at different levels and was validated with an 
+experimental study and two numerical studies of an SBR-oxidation ditch (Vermande 2005). Glover et 
+al. (2006) demonstrated that the classical biological modeling can take advantages of CFD results in 
+order to obtain the local oxygen concentration and transfer and the hydraulic structure (recycling rate 
+and number of perfect mixed reactors) of the system.  
+However, despite numerous developments and improvements, this approach still remains difficult to 
+handle for reactors involving complex and coupled local hydrodynamics, heat and mass transfer and 
+chemical reactions because of the high computational requirements. 
+Le Moullec et al. (2011) coupled CFD with the ASM model and compartmental approach. The 
+authors considered also the dispersion model and found a correlation between the axial dispersion 
+coefficient, the gas and liquid flow-rates and the reactor geometry. Such studies should allow to 
+improve the detailed design of aerated reactors in wastewater treatment plants (gas distribution 
+system, baffles location). In another study, Zima et al. (2009) proposed CFD for predicting the 
+behaviour of reactive pollutants  in the aerobic zone of a full scale bioreactor. The one-dimensional 
+advection-dispersion equation was combined with simple biokinetic models incorporating the Monod-
+type expressions. 
+Even in single-phase reactors, chemical reactions are described by non-linear terms that often cause 
+numerical instabilities. The high data quantity required is often prohibitive, while the complexity of 
+the problems that arises from coupling the fluid dynamics with the bio-chemical phenomena means 
+that the systems have to be treated with attention case by case (Rigopoulos and Jones 2003). In fact a lot of 
+parameters are involved in both the biochemical (kinetic and stoichiometric) and hydrodynamic 
+(dispersion) models. Furthermore, it is difficult to solve together two systems of linear and non-linear 
+equations represented by Navier-Stokes equations and differential equations. These models also 
+assume that the bio-chemical model does not impact on the hydrodynamic model and vice versa. This 
+assumption is possible by neglecting the effect of biochemical processes on hydrodynamics but it is a 
+big assumption for the effect of hydrodynamic conditions on biochemical processes. In fact the 
+biochemical process can be affected by the reactor flow conditions because the biomass, substrates 
+85
+CHAPTER 6 – LITERATURE REVIEW 
+and inhibiting compounds can be distributed in different reactor zones. This implies that the 
+biochemical process can occur with different kinetics depending on the hydrodynamic condition. 
+Recently, “hybrid” approaches have emerged as an alternative. In these cases CFD is employed only 
+for the hydrodynamic simulations, while the bio-chemical phenomena are resolved with 
+compartmental modeling (Rigopoulos and Jones 2003). The latter describes the reactor as a network 
+of functional compartments spatially localized. It is based on CFD and on the determination of 
+volumes in which physico-chemical processes occur. 
+6.1.5.4 Models comparisons  
+The models proposed by Lawrence and McCarty (1970), San (1989, 1992) and Milbury (1965) are old 
+and simple to apply but the results can present a large degree of uncertainty. More complete models 
+taking into account the dispersion related to reactor configuration and aeration are the ones proposed 
+by Khudenko and Shpirt (1986) and San (1992). But the best models are those proposed by Turian et 
+al. (1975), Lee et al. (1999a, 1999b), Olivet et al. (2005), Potier et al. (2005) and Makinia and Wells 
+(2000a,b), who considered both biochemical reactions and dispersion flow. Finally it is also 
+useful to apply CFD models that are more complex than the previous models but describe the 
+hydrodynamic phenomena more in detail, considering the local process that happens in the reactor. 
+6.1.6. Mathematical modeling of fluidized bed reactors 
+6.1.6.1 Process description 
+In biological Fluidized Bed Reactors (FBR), the liquid to be treated is pumped through a bed of inert 
+particles (sand, pumice, activated coal) at a velocity sufficient to cause fluidization. Particles in a 
+fluidized state provide a large specific area for attached biomass growth; this feature enables long 
+solids residence times and low suspended solid concentrations. Usually aeration occurs through the 
+liquid recirculation from the reactor to an oxygenator in which air or oxygen is bubbled (Fig. 35). It is 
+also possible to have a three-phase fluidized bed reactor, by insufflating the oxygen directly into the 
+reactor (Wisecaver and Fan 1989; Hirata et al. 1986; Trinet et al. 1991; Fan et al. 1987). 
+	   	   8	   6	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	   	  Figure 35. Schematic representation of fluidized bed reactor. 
+ 
+6.1.6.2 Model development 
+6.1.6.2.1 Ideal flow reactor models 
+The liquid phase transport of a reactant through an FBR encompasses molecular diffusion, turbulent 
+diffusion, and convective diffusion caused by a non-uniform velocity distribution; the axial dispersion 
+is insignificant under normal operating conditions. Thus, FBRs have usually been modeled using ideal 
+flow patterns, such as CSTR or PFR (Shieh et al. 1982; Mulcahy et al. 1980; Mulcahy et al. 1981; 
+Rittmann 1982; Park et al. 1984) conditions. Due to the high recirculation rates, many mathematical 
+models that were developed as CSTRs did not consider the spatial gradients of the substrates and 
+products along the height of the reactor. 
+Rittmann (1982) stated that FBR can achieve a better performance compared to complete-mix because 
+the biofilm is evenly distributed throughout the reactor while the liquid regime is still “plug flow”. 
+Adding an effluent recycle, making the liquid phase more homogeneous, can change this 
+hydrodynamic behaviour. That dilutes the feed and makes the performance approaching a complete 
+mixing unit, which implies a lower removal efficiency than under plug-flow conditions (Rittmann 
+1982). Shieh et al. (1982) tried to apply the PFR model to an FBR assuming that macroscopic radial 
+	   	   8	   7	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+gradients do not occur inside the reactor and pseudo-steady-state conditions prevail. The adopted 
+continuity plug flow equation is: 
+$$u \frac{dC}{dx} + R_v = 0 \qquad (38)$$
+where: 
+u = superficial velocity [LT-1]; 
+Rv = reactant conversion rate per unit fluidized bed volume [ML-3T-1]. 
+The authors included the following elements in their model: i) external and internal biofilm mass 
+transfer; ii) reactant consumption within the biofilm; and iii) a degree of bed expansion and an 
+expanded bed height under a given set of operating conditions such as flow rate, biofilm thickness, 
+media size, and density. As a result, a general model of an FBR reactor was obtained by combining 
+equation (38) with the reactant conversion rate expression and integrating the resulting equation 
+subject to boundary conditions that considers a bulk-liquid reactant concentration equal to the inlet 
+reactant concentration. The resulting equation describing the reactant concentration profile through 
+the FBR is: 
+0.9
+0.55 x ⎡0.55 3⋅r
+2 ⎤
+C =C − ⋅0.6162 p 0.55 0.45⎢ ⎥ k ⋅D ⋅ x       Φ ≥1.15          (39)  in v 0 0,m⎣⎢ρ ⋅ (r 3 − r 3p m )⋅0.5⎦⎥
+where: 
+k0 = intrinsic zero order rate constant [T-1]; 
+rm = media radius [L]; 
+rp = bioparticle radius [L];  
+ρ = biofilm dry density [ML-3]; 
+Φ0,m  = Thiele modulus. 
+ 
+6.1.6.2.2 Non ideal flow reactor models 
+A three-phase fluidized bed reactor cannot always be described using simple models such as ideal 
+plug flow, because appreciable back-mixing may occur in the liquid phase (Muroyama and Fan 1985). 
+This back-mixing is caused by the rising of coalesced gas bubbles, in particular for beds of fine 
+particles (Muroyama and Fan 1985). Thus, Yu et al. (1999) proposed a tank-in-series model, applying 
+equation (21), to describe the flow pattern of an FBR that considers the reactor to be a combination of 
+88
+CHAPTER 6 – LITERATURE REVIEW 
+two ideal CSTR reactors. Many other investigations on the flow pattern in an FBR suggest that an 
+axial dispersed plug flow model can also be used to simulate the hydrodynamics of the process 
+(Østergaard 1968; El-Temtamy et al. 1979a; Muroyama and Fan 1985; Davidson et al. 1985; Lin 
+1991; Kim and Kang 1997; Michelsen and Østergaard 1970; El-Temtamy 1979b).  
+Additionally, many authors studied the effect of gas production on the hydrodynamics for the design 
+and scale-up of three-phase fluidized bed reactors. El-Temtamy et al. (1979a,b) described the flow of 
+the gaseous and liquid phases in a three-phase FBR by introducing a radial dispersion coefficient 
+inside the following axially dispersed plug flow equation: 
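+$$\frac{\partial C}{\partial t} + \frac{u}{\varepsilon} \cdot \frac{\partial C}{\partial x} = D \frac{\partial^2 C}{\partial x^2} + D_r \left( \frac{\partial^2 C}{\partial r^2} + \frac{1}{r} \cdot \frac{\partial C}{\partial r} \right) + R_C \qquad (40)$$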
+where: 
+ε = fluidized bed porosity; 
+r = relative radial position [L]; 
+Dr = radial dispersion coefficient [L2T-1]. 
+The authors solved equation (40) using boundary conditions proposed by Danckwerts (1953). 
+The authors also identified an indirect correlation between the Peclet number based on the particle 
+diameter and the gas flow rate and a correlation between axial mixing in the liquid phase, the presence 
+and motion of bubbles and the radial velocity profile (El-Temtamy et al. 1979a; Mulcahy and La 
+Motta 1978).  
+Lin (1991) applied an axial dispersion model for the bulk phase considering reactant diffusion and 
+consumption inside the biofilm and imposing Danckwerts (1953) boundary conditions to solve the 
+proposed equations. Additionally, the author compared the experimental data obtained by Mulcahy 
+and La Motta (1978) and Jeris (1977) with the model results and a high value of the Peclet number 
+was also found that enables a simplification based on plug flow conditions. Thus, neglecting the 
+dispersion term, the substrate in the bulk phase was modelled using the axial dispersion equation:  
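+$$\frac{\partial\left(C/C_{in}\right)}{\partial t} = -\frac{\partial\left(C/C_{in}\right)}{\partial x} - \frac{A_b \cdot k_S \cdot H}{\varepsilon \cdot u}\cdot\left(\frac{C}{C_{in}} - \frac{C_f}{C_{in}}\right) \qquad (41)$$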
+where: 
+Cf  = reactant concentration in the biofilm phase [ML-3]; 
+Ab = specific surface area of coated particle [L2]; 
+H = height of fluidized bed [L]. 
+89
+CHAPTER 6 – LITERATURE REVIEW 
+In this case, the authors imposed an initial boundary condition for the value of the initial reactant 
+concentration in the bulk phase.  
+ 
+6.1.6.2.3 Models comparisons  
+The models proposed by Rittmann (1982) and Shieh et al. (1982) are plug flow and steady-state 
+models that are easy to apply, but their results are not accurate. In contrast, more accurate models also 
+consider the effect of gas production on hydrodynamic behaviour (Lin 1991; El-Temtamy 1979a,b). 
+6.1.7 Mathematical modeling of biofilter reactors 
+6.1.7.1 Process description 
+Aerobic biofilters (Fig. 36) are rectangular or circular packed beds used for the bio-oxidation of 
+domestic or industrial wastewater. It is possible to schematize the reactors as a three-phase system 
+where the liquid phase passes through the bed in contact with both the microbial film and a counter-
+current air stream rising by natural convection. Trickling filters have characteristics similar to 
+biological aerated filters, except they are not submerged.  
+EFFLUENT
+LIQUID
+RECIRCULATION
+PFR OXYGENATOR
+FBR
+INFLUENT
+	  
+Figure 36. Schematic representation of up-flow biofilter reactor design. 
+	  	  
+	  
+	   9	   0	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+6.1.7.2 Model development 
+6.1.7.2.1 Ideal flow reactor model 
+Many models assume ideal plug flow conditions in biofilter; however, non-ideal conditions may occur 
+with increased mixing and dispersion at a high flow rate. Rittmann (1982), Chang and Rittmann 
+(1987), Oleszkiewicz (1981), Costa Reis and Sant’Anna (1985) proposed a complete bioreactor model 
+that includes the biofilm and CSTR flow for the liquid phase.  
+In particular, Rittmann (1982) stated that the biofilter hydrodynamics are related to the recycle ratio, 
+in fact the reactor can achieve complete mixing conditions when the recycle ratio exceeds 10. 
+However, some researchers have found that aerobic biofilters act as plug flow systems due to either 
+channelling or backmixing (Särner 1978; Gray and Learner 1984; Vandevenne 1986; Muslu 1986; 
+Meunier and Williamson 1981). In particular, Meunier and Williamson (1981) modelled the reactor 
+considering a plug flow regime but neglected the back-mixing effect from rising bubbles of biogas. 
+Baquerizo et al. (2005) proposed a mathematical model for the biofilter based on the mass balance 
+equations, and considering four phases in the system: gas, liquid, biofilm, and solid. A plug flow 
+pattern is considered for both the liquid and gas phases, resulting in the proposed equations:  
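+$$\frac{\partial C_g}{\partial t} = -v_g\cdot\frac{\partial C_g}{\partial x} - \frac{a_b}{\varepsilon}\cdot F_{g-l} \qquad (42)$$
+$$\frac{\partial C_l}{\partial t} = v_l\cdot\frac{\partial C_l}{\partial x} + \frac{a_b}{h}\cdot F_{g-l} - \frac{a_b}{h}\cdot F_{l-b} \qquad (43)$$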
+where: 
+g = subscript referred to the gas phase; 
+l =  subscript referred to the liquid phase; 
+v  = interstitial velocity [LT−1]; 
+ab = biofilm surface area per unit volume of biofilter bed [L2L−3];  
+Fg−l = mass flux from the gas phase to the liquid phase [ML−2T−1]; 
+Fl−b = mass flux from the liquid phase to the biofilm phase [ML−2T−1]; 
+h = dynamic hold-up coefficient [ad.]. 
+In addition to the presented equations, the authors proposed a mass balance for the biofilm and the 
+solid phase. Jacob et al. (1996) developed a complete dynamic model and applied it to an aerobic
+91
+CHAPTER 6 – LITERATURE REVIEW 
+biofilter assuming ideal plug flow conditions. The authors accounted for filter clogging and described 
+a progressive reduction of the liquid space caused by biomass growth and suspended particle 
+retention. 
+ 
+ 6.1.7.2.2 Non-ideal flow reactor model 
+Fdz-Polanco et al. (1994) performed a tracer test at a pilot scale plant and obtained different hydraulic 
+reactor models by fitting experimental data with the theoretical model. These authors achieved a 
+Standard Relative Deviation (SRD) value below 20% only when applying a CSTR reactor and a dead 
+zone model. They also performed tracer tests for several design parameters (the length/particle 
+diameter ratio and the porosity) and operational parameters (liquid and gas superficial velocity). These 
+tests approached the plug flow for porous bed reactors, low bed porosity, low liquid and/or gas 
+velocity. However, different authors demonstrated that back-mixing could occur in such reactors 
+depending on the bed length, size of the packing particles and liquid phase velocity (Martinov et al. 
+2010; Froment and Bischoff 1990). Martinov et al. (2010) modelled a fibrous fixed bed reactor using 
+recycle with a tank-in-series model, which is advantageous since it can model the large void fraction 
+of the fixed bed and it is independent of the boundary conditions. Furthermore to account for a 
+deviation from ideal flow, they proposed a schematic model with recirculation.  
+Sanchez et al. (2005) proposed a model based on two-mixed reactors of different sizes and included in 
+the model the biofilm and gas liquid transfer. The proposed equations that describe the two mixed 
+reactors of different size are reported below in dimensionless form: 
+$$E'(\theta') = \frac{\exp\left(-\dfrac{\theta'}{a}\right) - \exp\left(-\dfrac{\theta'}{1-a}\right)}{2\cdot a - 1} \qquad (44)$$
+$$a = \frac{V_{R2}}{V_{R1} + V_{R2}} \qquad (45)$$
+where: 
+VR1 = volume of the first reactor [L3]; 
+VR2 = volume of the second reactor [L3]; 
+E’ = dimensionless residence time distribution function [ad.]; 
+θ’ = dimensionless time [ad.]. 
+	   	   9	   2	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+ 
+Also Pérez et al. (2005) proposed a model based on the tanks in series model for nitrifying fixed bed 
+bioreactors. This model was used to provide a detailed description of the biomass, ammonium, nitrite 
+and nitrate concentrations along the reactor vertical axis. This flow model is useful to describe in a 
+simple way the biofilm thickness gradient along the bed as experimentally observed. 
+The tanks in series description was complemented with a back-mixing flow-rate to describe the effect 
+of the aeration flow-rate on the liquid phase mixing. Physically, rising gas bubbles generate a liquid 
+down-flow, which is taken into account in the mathematical description of the flow model. 
+The reactor was then divided into three parts: the bottom represented by one stirred tank, the fixed bed 
+represented by 5 identical stirred tanks in series, and the top represented by one stirred tank. To 
+complete the hydrodynamic equations, a gas–liquid mass transfer term and a liquid-biofilm transfer 
+term were added. 
+Froment and Bischoff (1990) focused on packed bed axial dispersion, using a low Reynolds number 
+range (between 1 and 10) and the axial dispersion model. They demonstrated that the Peclet number 
+of non-aerated granular beds varies within the range 1.4-2. Similar studies in a 0.2 m diameter packed 
+bed bubble column with high porosity packing and a vertical co-current up-flow of gas and liquid 
+have been reported by Bhatia et al. (2004). Séguret and Racault (1998) applied the residence time 
+distribution method to define the effect of the mixing pattern on the process performance in a full-
+scale nitrifying biofilter. They demonstrated that the floating filter bed itself behaves as a dispersed 
+plug flow reactor. Additionally, they identified a direct correlation between the dispersion and the 
+flow rate, and a variation of the dispersion coefficient and the residence time distribution along the 
+reactor height. They also applied a theoretical nitrifying model that accounts for the observed 
+hydrodynamic behavior. One limit of the mechanistic models is the large number of variables 
+requiring experimental confirmation. Thus, empirical models that are simpler to implement and solve 
+are of interest, such as the model proposed by Mann and Stephenson (1997). 
+With regard to Trickling filters (TF), many authors studied residence time distribution in TFs (Sinkoff 
+et al. 1959; Kshirsagar et al. 1972; Tariq 1975; Särner 1978; Gray and Learner 1984; Vandevenne 
+1986). In most works on the hydrodynamic behavior of TF, the RTD profile is a function of the media 
+used, the hydraulic loading, and the amount of biomass. TF are modeled in most studies as a series of 
+perfect mixers with a dead zone (Mezaoui 1979; Nyadziehe 1980; Sant' Anna 1980). While in the 
+model proposed by De Clercq et al. (1999) the influence of the heterogeneous film structure was
+93
+CHAPTER 6 – LITERATURE REVIEW 
+considered, which consisted of a biofilm, a free flowing and a captured liquid film. The authors 
+modelled the diffusion effect with the tanks in a parallel configuration and the free flowing liquid with 
+CSTR series configuration linked to the diffusion block (De Clercq et al. 1999). Other model 
+approaches are also described in the literature, such as the axial dispersed plug flow model proposed 
+by Séguret and Racault (1998). The authors proposed a bio-diffusion model which considers the TF as 
+a vertical tube that includes the reactor filling, an immobile phase, and a liquid film. The flow in the 
+liquid is postulated to be an axially dispersed plug flow, and the governing equation is:  
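+$$\frac{\partial C}{\partial t} = D\cdot\frac{\partial^{2} C}{\partial x^{2}} - u\cdot\frac{\partial C}{\partial x} + \frac{1}{\varepsilon\,\beta_m}\cdot a_e\cdot J_E(x) \qquad (46)$$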
+where:  
+ae = specific surface area available for exchange per volume of filter [L2L-3]; 
+βm = mobile volume fraction; 
+JE(x) = flux of reactant at the interface between the main flow and the immobile phase [ML-2T-1]. 
+ 
+To solve this equation, the authors applied Danckwerts boundary conditions for the dispersion of flow 
+at the flow entrance, and the cessation of dispersion at the output (Séguret et al. 2000). In the 
+immobile zone it is assumed that the tracer is subject to diffusion. One particular case of equation (46) 
+is when a slice dz is considered to be perpendicular to the flow direction; in this case the mass balance 
+becomes: 
+$$\frac{\partial C}{\partial t} = D_m\cdot\frac{\partial^{2} C}{\partial z^{2}} \qquad (47)$$
+where:  
+Dm= molecular diffusion coefficient of reactant inside the biomass in the immobile phase [L2T-1].  
+Additionally the following boundary conditions at the liquid/biomass interface are also defined: 
+$$C(z = 0) = C(X) \qquad (48)$$
+$$\left(\frac{\partial C}{\partial z}\right)_{z=e} = 0 \qquad (49)$$
+where: 
+e = thickness of biomass [L]. 
+Muslu (1990, 1984), Muslu and San (1990) conducted a tracer test on inclined plane trickling filters. 
+The result was used to determine the following expression that correlates the dispersion coefficient for 
+conserved tracer substances in flow over porous media and the flow rate:
+94
+CHAPTER 6 – LITERATURE REVIEW 
+$$D = \frac{\varphi}{L}\, q^{4/3} \qquad (50)$$
+where: 
+φ = coefficient function of viscosity, molecular diffusion, localization of the flow path [ad.];  
+q = flow rate per unit of width [ML-2]; 
+L = length of axial travel in the reactor [L]. 
+The authors identified the hydraulic reactor model considering different flow patterns that could occur 
+inside the reactor. With high hydraulic loadings the flow pattern is a dispersed plug flow, thus the 
+authors applied the axial dispersion equation. While with lower hydraulic loading rates the authors 
+assumed a complete mix flow pattern. A transition zone in the flow regime indicates other mixing 
+conditions.  
+Iliuta and Larachi (2005) modelled TF reactors using a two-dimensional two-fluid dynamic model. 
+The complete model describes two-phase flow and the space-time evolution of biological clogging 
+and physical plugging. It is based on the macroscopic volume-averaged mass and momentum balance 
+equations, the continuity equation for the solid phase, the species balance equation for the fine 
+particles and the volume-averaged species balance equations at the reactor level. The model is coupled 
+with the simultaneous transport and consumption of phenol and oxygen within the biofilm and the 
+simultaneous diffusion of both phenol and oxygen and the adsorption of phenol within the activated 
+carbon particles. Using equations that account for the reactor hydrodynamics, the authors applied the 
+axial dispersion model to describe the species balance in the fluid phase for oxygen and the substrate, 
+	  while plug flow was assumed in the gas phase. 
+6.1.7.2.3 Models comparisons  
+Meunier and Williamson (1981), Baquerizo et al. (2005) and Jacob et al. (1996) proposed a plug flow 
+model neglecting the back-mixing effect. Other models proposed by Fdz-Polanco et al. (1994), 
+Martinov et al. (2010), Pérez et al. (2005) and Sanchez et al. (2005) also included the back-mixing 
+conditions with tank-in-series configurations. Séguret and Racault (1998), Froment and Bischoff 
+(1990), Muslu (1984, 1990) and Muslu and San (1990) also considered the effect of dispersion in the model 
+by applying the dispersion equation, obtaining a more detailed model. More recently, a CFD model was proposed 
+by Iliuta and Larachi (2005). This is the most complete model because it describes a two-phase flow 
+and the space-time evolution of physical and biological phenomena.
+95
+CHAPTER 6 – LITERATURE REVIEW 
+6.1.8 Model comparisons and validation and calibration 
+6.1.8.1 Models comparisons 
+The models presented above for activated sludge reactor, fluidized bed reactor and biofilter reactor 
+have different advantages and disadvantages. Furthermore, some models can be useful 
+in some situations and not in others. Table 22 lists all the models reported, indicating for each one the 
+advantages and disadvantages and when it can be used. 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   9	   6	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+Table 22. Models comparisons 
+ 
+Author Advantages Disadvantages When can be 
+used 
+Van der Meer and Heertjes, 1983; Bolle et Introduce the model of CSTR Without calibration and For initial simulation 
+al., 1986a,b; Costello et al.,1991a,b, Ojha in series model for UASB validation, simple to understand the 
+and Singh (2002) and Singh (2005). UASB reactor model with a lot of general reactor 
+assumption behaviour 
+Wu and Hickey (1997), Singhal (1998) Consider dispersion in the Without calibration and For initial simulation 
+and Zang et al. (2005). But the best models reactor validation, simple to understand the 
+are those proposed by Kalyuzhnyi et al., model with a lot of general reactor 
+(2006), Batstone et al. (2005), Mu et al. assumption behaviour 
+(2008) and Penã et al. (2006). UASB 
+Ren et al. (2009).  Use the CFD model, describe Without calibration and To study the process  
+UASB the process with  validation in detail and focalize 
+local phenomena also on local 
+phenomena in the 
+reactor 
+Young and McCarty (1968), Young and Apply the simple model of Do not model the gas For initial simulation 
+Young (1988).  AFBR CSTR in series in AFBR phase in the reactor to understand the 
+reactor general reactor 
+behaviour 
+Escudié et al. (2005), Huang and Jih Consider the presence of Without calibration and For initial simulation 
+(1997) and Smith (1996). AFBR biofilm validation and to understand the 
+biofilm growth 
+Bonnet et al. (1997) Introduce the model of plug Without calibration and For initial simulation 
+BAF flow. validation, simple to understand the 
+model with a lot of general reactor 
+assumption behaviour 
+Seok and Komisar (2003), Otton et Consider dispersion in the Without calibration and For initial simulation 
+al.(2000), Buffière et al. (1998a,b), reactor validation, simple to understand the 
+Schwarz et al.(1996-1997) and Diez and model with a lot of general reactor 
+Blanco (1995). BAF assumption behaviour 
+Buffière et al. (1998a,b). Apply the dispersion model Without model For initial simulation 
+BAF and consider also the gas- calibration and to understand the 
+phase behaviour validation general reactor 
+behaviour 
+Monteith and Stephenson (1981), Apply the simple model of Do not model the gas For initial simulation 
+Mendoza and Sharratt (1998, 1999), Smith CSTR in series in AFBR phase in the reactor to understand the 
+et al. (1993) and Keshtkar et al. (2003). reactor general reactor 
+CSTR behaviour 
+Vavilin et al. (2001, 2003). CSTR Consider dispersion in the Without calibration and For initial simulation 
+reactor validation, simple to understand the 
+	   model with a lot of general reactor assumption behaviour 
+	   	   9	   7	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+6.1.8.2 Activated sludge reactor 
+6.1.8.2.1 Ideal PFR and CSTR in series 
+Lawrence and McCarty (1970) first solved the proposed differential equations and obtained an 
+algebraic solution. This solution was approximate because they assumed that the biomass 
+concentration in the reactor remains nearly constant at least as long as the ratio of the solid retention 
+time to the hydraulic retention time (SRT/HRT) exceeded 5. With this assumption, they demonstrated 
+that the difference between PFR and CSTR is not too significant with regard to the evaluation of the 
+biomass concentration. San (1989) solved the same equations with a finite difference method, 
+avoiding any assumptions that could become restrictive in the case of wastewater with high solids 
+concentrations. The author described a numerical method to determine the mean residence time and 
+the effect of the kinetic coefficients on the mean solids residence times, but did not calibrate and 
+validate the model with experimental data for the field conditions.  
+As a first attempt to model a plug flow reactor with a CSTR in series model, Milbury et al. (1965) 
+defined the effective number of compartments for different detention times. Therefore they compared 
+the effluent tracer concentration of a rectangular laboratory aeration vessel with the model results. 
+Another model was developed by Muslu (2000a) and compared to the CSTR model results obtained 
+with the approximate model developed by Lawrence and McCarty (1970). Experimental data reported 
+by Lovett et al. (1984) were used to validate the model. The author obtained larger differences 
+between the real and simulated data when the mean solids residence times were small. In particular for 
+some industrial wastewater applications, there may be a considerable difference between the results of 
+the Muslu model and the approximate analytical solution of Lawrence and McCarty that neglects the 
+existence of a longitudinal biomass concentration gradient.  
+Among the models cited above, only San (1989, 1992) solved the proposed equations using a finite 
+difference technique; the other authors (Lawrence and McCarty 1970; Milbury et al. 1965) proposed 
+algebraic solutions of the equations by introducing some simplifications.  
+Many authors performed tracer experiments that estimate the hydraulic parameters and characterize 
+the hydraulic reactor model. These parameters include the real HRT value, the dispersion coefficient 
+(for a dispersion model), the number of reactors in series (for a tank-in-series model), and back-
+mixing flows or dead zone volume. It is possible to obtain these parameters from the RTD curve that 
+describes the exit concentration with time. The AWWA guide (Teefy 1996) gives several pieces of advice
+98
+CHAPTER 6 – LITERATURE REVIEW 
+regarding the achievement of tracer tests in water and wastewater treatment plants particularly with 
+respect to the selection of suitable tracer. Murphy and Timpany (1967) made a comparison between 
+reactor model and lab-scale reactor hydrodynamics using experimental points obtained from a tracer 
+test conducted with a laboratory tank. The authors showed that the two extremes of PFR and CSTR 
+are inadequate and that the dispersion model fits the experimental data significantly better than equal 
+size CSTRs in series or the unequal size CSTR in series model.  
+6.1.8.2.2 Non ideal flow reactor models 
+San (1994) compared his method with a method using the same boundary conditions (Wehner and 
+Wilhelm 1956) but with a first order reaction instead of a Monod type reaction. The author 
+implemented the proposed equation and obtained a graph that can be used to design a plug flow 
+reactor, in particular it gives a correlation between reaction rate, Peclet number and biological 
+efficiency. Makinia and Wells (2000b) verified the flow pattern effects of their model on the one-
+dimensional unsteady advection-dispersion equation using data from a full-scale plant and introducing 
+the model parameters developed from previous experiments (Makinia and Wells 2000a) and data 
+from the literature. With dynamic conditions, the authors compared the predicted concentration of 
+ammonia nitrogen and dissolved oxygen with the experimental data, and showed that, in all cases, the 
+errors between the model predictions and the data were lower for the advection-dispersion model than 
+for the tank-in-series model. In fact, even in the case of five mixed zones of equal size that was found 
+as the best fitting tank-in-series model, the predicted peak concentrations were lower by 
+approximately 12–17% and delayed by approximately 30–60 min compared with the actual peaks. 
+The dispersion model was solved in unsteady conditions with a computational algorithm proposed by 
+Lee et al. (1999a, 1999b). The results were compared with results obtained by the proposed model-
+collocation with a tank-in-series model using experimental data (Lee et al. 1999b). The authors 
+applied the model to pilot-scale activated sludge process data presented in a previous study (Nogita et 
+al. 1983), and showed that with simulated dynamics of the reactant at the outlet of the pilot plant, the 
+proposed algorithm provides a superior prediction than the tank-in-series model. They demonstrated 
+the feasibility of improving the accuracy of the results by optimizing the Peclet number.  
+Lee et al. (1999a) also validated the model using different numerical techniques - the orthogonal 
+collocation method (MOC), the line method (ML), and the internal collocation and four elements 
+	   	   9	   9	  	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+method (OCFE) and experimental data related to the hydraulics of a Surface Flow System (SSF) 
+constructed wetland process presented by King and Forster (1990).  
+For all of these methods there is a good agreement between the experimental data and the model 
+results, but these validations suggest that the OCFE technique is superior to ML and MOC in terms of 
+numerical stability and the accuracy of the solution. Furthermore, all simulated RTD curves show a 
+slower rise time and a faster tail than the experimental data, which indicates a plant-model mismatch. 
+It is important to note that the experimental tracer curves at various points across the gravel bed of the 
+SSF describe different peak concentrations and response times, which implies that there is a 
+channelling phenomenon to a certain extent which is not accounted for in the axial dispersion model.  
+The authors also calibrated the model with simulations using different values of the Peclet number, 
+and they demonstrated that with an appropriate value it is possible to predict the process time delay 
+using either technique (preferably OCFE or ML).  
+Glover et al. (2006) calibrated and validated a CFD-ASM1 model using experimental data from a 
+laboratory scale reactor. Le Moullec et al. (2010b) applied a CFD model to an activated sludge reactor 
+and compared systemic, CFD, and compartmental models for a biological reactor used in wastewater 
+treatment in a theoretical case, without reference to experiments. In this model, the author considered 
+a gas-liquid reactor with oxygen transfer and complex kinetics and showed that all three models 
+follow the same main trends; in particular, the compartmental model provided results very similar to 
+the CFD model. A discrepancy was observed between the CFD and compartmental models due to the 
+more realistic introduction of effluent in the CFD model. In the case of a particulate biodegradable 
+substrate, significant differences are noted between a systemic model and a CFD-based model (Le 
+Moullec et al. 2010b); this is due to the calculated hydrolysis process, which is affected by the in-
+homogeneity of the particulate compounds concentration on a section of the reactor (Le Moullec et al. 
+2010b). This in-homogeneity is not taken into account in systemic models.  
+ 
+6.1.8.3 Fluidized Bed Reactors 
+Shieh et al. (1982) performed a sensitivity analysis of the proposed model parameters using reported 
+numerical values. These authors studied the effects of media size and biofilm thickness on FBR 
+performance in terms of the reactant conversion rate and biomass concentration. They found that these 
+are the two most important parameters that affect the FBR performance, but they did not include the
+100
+CHAPTER 6 – LITERATURE REVIEW 
+effects of the hydrodynamic parameters on the process. The authors additionally proposed an iterative 
+procedure that is applied to the model for design purposes.  
+Yu et al. (1999) performed tracer experiments using a laboratory scale fluidized bed reactor to study 
+the mixing and flow patterns of tap water. The author introduced a pulse input of a dye solution and 
+demonstrated that the flow pattern can be described with a model of two CSTRs in series. This result 
+was obtained by calculating, from the tracer concentration, the residence time distribution curves and 
+their variance correlated to the number of CSTR reactors. The author also demonstrated that this 
+approach improved the fit to the experimental data at low gas velocities and was equivalent to the 
+axially dispersed plug flow model at higher gas velocities. Lin (1991) presented graphs that compared 
+experimental data from the literature for biological fluidized bed de-nitrification and predicted values 
+of the model. The graphs only enable qualitative agreement to be observed between experimental data 
+and model predictions. El-Temtamy et al. (1979b) performed tracer tests on a laboratory scale reactor 
+and correlated the radial concentration profile to the radius by varying the superficial gas velocity. 
+The authors obtained different values of the radial dispersion coefficient and found that this parameter 
+does not change with particle size as the fluid flow rates vary.  
+ 
+6.1.8.4 Biofilter reactors 
+Considering the ideal reactor model previously proposed, Jacob et al. (1996) solved the proposed 
+system of eight differential equations, using two methods to reduce the distributed parameter model to 
+a differential algebraic equation (DAE) system: the method of lines and orthogonal collocation. The 
+experiments were performed on synthetic wastewater to simulate the nitrification and denitrification 
+process. In the nitrification process, the experimental data was compared for nitrites and carbon 
+concentrations, and a very good agreement was found between the experimental and the model 
+results. In the denitrification process, the nitrate, nitrite, and carbon concentration were compared to 
+the experimental data and found to be in good agreement. It should be emphasized that the simulations 
+were performed without a real estimation of all parameters involved; in fact most of the parameters 
+were taken from the literature or measured experimentally. Thus, this model lacks a rigorous 
+parameters estimation procedure. De Clercq et al. (1999) performed a tracer test using a full-scale 
+reactor and obtained improved fitting of the model performance to the measured lithium effluent 
+concentration with a two-tank-in-series configuration. This did not include the diffusion effect as they
+101
+CHAPTER 6 – LITERATURE REVIEW 
+stated that this phenomenon does not influence the residence time distribution. Séguret and Racault 
+(1998) performed a tracer test in order to obtain an experimental RTD curve and to estimate the 
+immobile and mobile volume and the first moment of the proposed bio-diffusion model. The mobile 
+volume from the bio-diffusion model and the first order moment were compared to the free draining 
+volume and the mean retention time obtained experimentally. The authors determined that the mean 
+residence time is overestimated compared with the first order of the bio-diffusion model. The reason 
+may be an inaccurate fit of a decreasing exponential used to extend the RTD towards the infinite. It 
+should be noted that the authors proposed to implement the hydrodynamic model using a kinetic 
+biofilm model but did not demonstrate its applicability. To determine the range of validity of their 
+models, Muslu (1990) performed some experiments using data collected by Lamb and Owen (1970). 
+In particular, the predicted and measured reactant removal efficiency, defined using the measured inlet 
+and outlet COD concentrations, were compared to flow rate values. Good agreement was found 
+between the experimental data and model results, with a determination coefficient equal to 0.98. 
+Baquerizo et al. (2005) performed a sensitivity analysis of the model parameters and a model 
+validation that compared the model results and experimental data referring only to the ammonia 
+concentration along the reactor height. They only reported graphs to describe the gas concentration 
+profiles along the biofilter bed for a low and a high ammonia inlet concentration, without giving a 
+correlation index. Iliuta and Larachi (2005) performed a parameter estimation and model validation 
+using experimental data, but they did not estimate the dispersion number because the extent of back-
+mixing in the liquid phase was quantified by a comprehensive Bodenstein number correlation (Piché 
+et al. 2002). Additionally, the authors found good correspondence between the model results and the 
+experimental data reported in the literature (Wisecaver and Fan 1989; Hirata et al. 1986). This 
+agreement reflects the validity of the model over a wide range of biofilm thicknesses and ascertains 
+the contribution of biological clogging in the hydrodynamic model. Table 23 lists all the models 
+previously described and compares the calibration and validation procedures adopted for each. 
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   1	   02	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+Table 23. Model Calibration (C) and Validation (V): AS, FBR, BF, AF estimated parameters 
+Reactor C V Estimated Parameters Authors 
+- - - Lawrence and McCarty (1980); 
+- - - San (1989); 
+X X Kinetic parameters Muslu (2000a); 
+- - - San (1992); 
+- - -         
+AS X X Dispersion 
+  coefficient, kinetic  
+  and stoichiometric Makinia and Wells (2000a,b) 
+  parameters  
+     
+X X Peclet number Lee et al. (1999a,b) 
+X X Kinetic parameters (m, Y) Glover et al. (2006) 
+ - - - Le Moullec et al. (2010a,b) 
+FBR - - - Shieh et al. (1982) 
+- - - El-Temtamy et al. (1979a,b) 
+Kinetic parameters, 
+ X X external mass transfer coefficient, dispersion Lin (1991) 
+number 
+ - X     - Jacob (1996) 
+    
+X  - Number of reactor in series Fdz-Polanco (1994) 
+BF/TF X X Kinetic parameters Muslu (1990) 
+Kinetic and 
+X X stoichiometric Baquerizo et al. (2005) 
+parameters 
+-  X  Iliuta and Larachi (2005) 
+ 
+ 
+	  	  
+	   	   1	   03	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+ 6.2 Mathematical modelling of anaerobic plug flow reactor and non-ideal flow reactor 
+6.2.1 Introduction 
+Anaerobic biological processes are widely applied for wastewater and organic waste treatment. 
+Pioneering applications, not yet abandoned, were mainly based on low rate reactors using non-
+attached growth (McCarty and Smith, 1986). More recently, high rate anaerobic reactors using 
+biofilms and bioflocs to increase the mean cell residence time, have been also proposed and 
+successfully applied (Annachhatre, 1996). The growing interest towards anaerobic treatments can be 
+explained considering the advantages of these processes, which can be summarized as: i) positive 
+energy balance due to methane production; ii) no energy spending for aeration; iii) low biomass yield, 
+leading to reduced sludge production; iv) reduced requirement of nutrients, which allows the 
+treatment of many different substrates; v) low maintenance costs and little or no odour problems. Of 
+course the process has also some disadvantages such as the long start-up time, the sensitivity to toxic 
+compounds, the need to control alkalinity conditions and higher investment costs (Tchobanoglous et 
+al. 2003; Gavrilescu 2000). To study the sensitivity of anaerobic processes to various operational 
+conditions and to optimize the design of anaerobic reactors, several performance-prediction models 
+have been proposed, dealing with kinetic expressions that describe the degradation and the production 
+of organic and inorganic substrates inside the reactor. In some cases, these models have been coupled 
+with the hydrodynamic description of the process to take into account the variability existing among 
+the various configurations that certainly affect the overall performances of the treatment (Levin and 
+Gealt 1993; Le Moullec et al. 2008). 
+6.2.2 Mathematical modelling of UASB Reactors 
+UASB reactors were developed in the late 1970s in the Netherlands by Lettinga et al. (1980) and are 
+still widely used for wastewater treatment. The process is based on the development of a sludge bed, 
+localized at the bottom of the reactor, formed by the natural self-immobilization of anaerobic bacteria. 
+Above that bed a zone of finely suspended particles called sludge blanket is formed. A clear zone over 
+the sludge blanket constitutes the settling zone. The influent wastewater is distributed at the bottom of 
+the reactor and flows upward (Fig. 37a). 
+	   	   1	   04	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+	  
+	  	  	  	  	  	  	  
+	  	  	  	  	  	  	  	  	   	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  
+	  
+   a) UASB reactor 
+	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	   	  b) Anaerobic biofilter reactor 
+	   	   1	   05	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	  	   	  
+	   c) Anaerobic Fluidized Bed Reactor 
+Figure 37. Schematic representation of a) UASB reactor, b) Anaerobic Biofilter, c) Anaerobic 
+Fluidized Bed Reactor 
+ 
+6.2.2.1 Hydrodynamic based models 
+Mathematical models of UASB reactors generally distinguish the three above-mentioned zones and the 
+reactor is described by Tank in Series derived models, usually named multi-compartment models 
+(Van der Meer and Heertjes, 1983; Bolle et al. 1986a,b; Costello et al.1991a,b; Wu and Hickey, 1997; 
+Narnoli and Indu, 1997). 
+Both Heertjes et al. (1978, 1982) and Bolle et al. (1986a,b) divided the reactor into three 
+compartments simulating the hydrodynamic conditions in the sludge bed and in the sludge blanket 
+using a CSTR model, and the hydrodynamic conditions in the settling zone using a PFR model. 
+Particularly Heertjes et al. (1978) assumed a by-pass flow between the inlet section and the second 
+reactor, a dead zone in the first reactor, and a return flow between the second and the first reactor (Fig. 
+38a), obtaining the following equation set: 
+$V_1 \dfrac{dC_1}{dt} = Q_0 \cdot C_0 + Q_2 \cdot C_2 - Q_1 \cdot C_1$                       (51) 
+$V_2 \dfrac{dC_2}{dt} = Q_1 \cdot C_1 + Q_k \cdot C_0 - Q_2 \cdot C_2 - Q \cdot C_2$                                  (52) 
+with:  
+	   	   1	   06	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+Q =Qk +Q0                                                                                        (53) 
+Q1 =Q0 +Q2                                                  (54) 
+V=V1 +V2 +V3 +Vd                                                 (55) 
+where: 
+Q = influent flow [L3T-1]; 
+Qk = by-pass flow [L3T-1]; 
+Q0 = flow entering the sludge bed [L3T-1]; 
+Q1 = flow entering the sludge blanket [L3T-1]; 
+Q2 = return flow [L3T-1]; 
+V1 = ideally mixed region in the sludge bed volume [L3]; 
+Vd = dead space volume [L3]; 
+V2 = sludge blanket volume [L3]; 
+V3 = plug-flow region volume [L3]; 
+C1 = substrate concentration in the sludge bed [ML-3]; 
+C2 = substrate concentration in the sludge blanket [ML-3]. 
+ 
+Bolle et al. (1986 a, b) introduced two main variations to the configuration assumed by the multi-
+compartment model proposed by Heertjes et al. (1978). They neglected the return flow between the first 
+and the second reactor, and added a by-pass between the inlet section and the third reactor (Fig. 38b). 
+The resulting equation set obtained by Bolle et al. (1986a) is therefore:  
+$V_1 \dfrac{dC_1}{dt} = (1 - SF_1) \cdot Q \cdot C_0 - (1 - SF_1) \cdot Q \cdot C_1$                             (56) 
+$V_2 \dfrac{dC_2}{dt} = (1 - SF_1) \cdot Q \cdot C_1 - (SF_1 - SF_2) \cdot Q \cdot C_0 - (1 - SF_2) \cdot Q \cdot C_2$               (57) 
+where: 
+SF1 = fraction of flow by-passing the sludge bed; 
+SF2 = fraction of flow by-passing the sludge blanket. 
+ 
+	  	  
+	   	   1	   07	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+ 
+Vd
+Q1
+0
+Q C0 Q0 Q Q0
+0 0 Q2 V3C3 0
+0 V2 C2
+V1C1
+Qk
+0
+ 
+a. Block diagram proposed by Heertjes et  b. Block diagram proposed by Bolle et al.1986a,b 
+al. 1978a, b. 
+         
+Figure 38. Block diagram proposed by Heertjes et al. (1978 a,b) and Bolle et al. (1986a,b).  
+ 
+Ojha and Singh (2002) completed the previous models by developing and testing a theory based on 
+the flow resistance. They found that increasing the flow resistance in the reactor increases the 
+magnitude of short-circuiting flows in the sludge bed. Successively, assuming the same 
+schematization proposed by the previous authors, Singh et al. (2006) calculated the by-pass flow and 
+the dead-zone in steady-state conditions, using the following mass-balance equation: 
+                       (58) 
+where:  
+Ce = the exit concentration [ML-3];  
+re = the effective fraction of flow expressed as re=1-(Qb /Qi); 
+Qb = the by-pass flow [L3T-1]; 
+Qi = the influent flow [L3T-1]; 
+fe = the active space for flow expressed as fe = (1-Vd )/(Vd +Vr). 
+ 
+Wu and Hickey (1997), instead, modeled the sludge bed and the sludge blanket as a CSTR with a 
+dead volume, and the settling zone as a PFR with lateral dispersion (Fig. 39a), developing the 
+following equations:                  
+ V dC	   =V ⋅C0 (t) −Q ⋅C(t)
+                            (59) 
+dt 	   1	   08	   	   	   	   	  
+EFFLUENT
+INFLUENT
+CHAPTER 6 – LITERATURE REVIEW 
+$\dfrac{\partial C}{\partial t} = \dfrac{D}{L} \dfrac{\partial^2 C}{\partial z^2} - \dfrac{u}{L} \dfrac{\partial C}{\partial z}$                                 (60) 
+where: 
+V = CSTR working volume [L3]; 
+C0(t) = influent concentration [ML-3]; 
+Q = flow entering the working volume [L3T-1]; 
+z = axial coordinate [L]; 
+u = flow velocity within the PFR [LT-1]; 
+L = reactor length [L].   
+Assumed initial and boundary conditions were:  
+C(0,t) = C(t)      (61.a) 
+C(z,0) = C0       (61.b) 
+To avoid the need to evaluate too many parameters, Singhal et al. (1998) developed a simpler block 
+diagram to simulate the reactor, composed by two reactors in series, each characterized by an axial 
+dispersion (D1, D2), assuming that part of the liquid flow by-passes the first zone and enters directly 
+into the second one (Fig. 39b). The authors applied the following dispersion equation in dimensionless 
+form to both model's compartments. 
+$\dfrac{\partial G}{\partial \theta} = \dfrac{1}{Pe} \dfrac{\partial^2 G}{\partial \eta^2} - \dfrac{\partial G}{\partial \eta}$                                     (62)  
+where: 
+θ = t/τ, dimensionless time; 
+η = z/L, dimensionless axial coordinate;  
+Pe = Peclet number;  
+G = C/C0, dimensionless concentration. 
+	   	   1	   09	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+Assumed initial condition for the first reactor was:      
+    C = 0 for η>0                                                     (62) 
+ 
+For the first zone of the model the equation (62) was solved analytically following the procedure 
+proposed by Smith (1981). The response of the second zone was evaluated by using the Crank-
+Nicolson method and applying the following boundary conditions:  
+1 ⎛ ∂C ⎞ S +QC
+− ⎜ ⎟ + (C) = 1(θ )⎜ ⎟ η>0 η = 0,θ ≥ 0
+     Pe ⎝ ∂η ⎠η 0 (S +Q)>                     (63.a) 
+$\left( \dfrac{\partial C}{\partial \eta} \right) = 0, \quad \eta = 1,\ \theta \ge 0$                                                      (63.b) 
+  
+The model proposed by Wu and Hickey (1997) was later reconsidered by Zeng et al. (2005). The 
+authors added to the previous equations the following expression of the dispersion coefficient, 
+obtained from a non reactive tracer test:  
+ 
+D = D +ua +bη0                                              (64) 
+where:  
+a, b and Do = empirical parameters; 
+u = flow velocity [LT-1]. 	  
+Vd
+ 
+Q CSTR Dispersed   
+flow V1 D1 V2D2
+Zone 2  
+Zone 1
+Qr  
+ 
+a) Wu and Hickey (1997)                                                  b) Singhal et al. (1998)  
+ 
+Figure 39. Block diagrams of UASB reactor proposed by a) Wu and Hickey 
+(1997), b) Singhal et al. (1998). 
+ 	  
+	   	   1	   10	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+ 
+ 6.2.2.2 Models coupling hydrodynamic with anaerobic digestion conversions 
+In the literature there are also several attempts to model these reactors considering both the hydraulic 
+and biochemical behavior. One attempt was done by Batstone et al. (2005) and Mu et al. (2008), who 
+introduced reaction terms into dispersion equation using the biochemical model ADM1 proposed by 
+Anaerobic digestion I.W.A. working group (Batstone et al. 2002). Similarly Kalyuzhnyi et al. (1997, 
+1998) introduced the following equation to simulate the biochemical process, that was solved under 
+steady-state conditions, using the Danckwerts boundary conditions:    
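+$\dfrac{\partial C(z,t)}{\partial t} = \dfrac{\partial}{\partial z}\left[ D(z,t) \cdot \dfrac{\partial C(z,t)}{\partial z} \right] - \dfrac{\partial}{\partial z}\left[ u(z,t) \cdot C(z,t) \right] + r(z,t) - M(z,t)$                      (65) 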
+where:  
+r(z,t) = reaction term; 
+M(z,t) = gas transfer coefficient. 
+Later the authors developed a more complete model combining the granular sludge dynamics, the 
+solid-liquid-gas interactions, hydrodynamics with the biological conversions and the liquid phase 
+equilibrium chemistry (Kalyuzhnyi et al., 2006). They introduced the following expression for the 
+vertical velocity of sludge aggregates: 
+$u(z,t) = \dfrac{V_R}{T \cdot C_S} - W_S$                                                         (66) 
+where: 
+VR = the reactor liquid volume [L3]; 
+T = the retention time [T]; 
+CS = the reactor cross section [L2]; 
+WS = the settling velocity for sludge solids [LT-1]. 
+ 
+They also used the dispersion coefficient expression for sludge aggregates, developed by Narnoli and 
+Indu (1997):  
+$D(z,t) = A_2 \cdot \left[ q(z,t) \cdot \left( 1 - \exp\left( \dfrac{-A_3}{q(z,t)} \right) \right) \right]^2$                                                       (67) 
+where: 
+	  A2, A3 = empirical parameters [ad.]; 	   1	   11	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+q(z, t) = surface gas production [L3T-1]. 
+The resulting equation system was solved under unsteady-state conditions. Danckwerts boundary 
+conditions were used only for the soluble substrates while, for the biomass, the authors took into 
+account the wash-out in the last compartment, assumed to be equal to the upward liquid velocity: 
+$u(0) \cdot X_i(0,t) = D(0,t) \dfrac{dX_i(0,t)}{dz}, \quad z = 0$                                                  (68.a) 
+$u(H) \cdot X_i(H,t) = D(H,t) \dfrac{dX_i(H,t)}{dz}, \quad z = H$                                                 (68.b) 
+where:  
+Xi (0, t) = biomass concentration at reactor inlet [ML-3]; 
+Xi (H, t) = biomass concentration at reactor outlet [ML-3]. 
+ 
+Batstone et al. (2005) and Peña et al. (2006) used only one advective-diffusive equation to describe 
+the entire reactor. Particularly the model proposed by Batstone et al. (2005) combines the internal 
+recycle proposed by Bolle et al. (1986a,b) with the internal bypass proposed by Singhal et al. (1998). 
+The authors considered the internal flow bidirectional, assuming either a recycle flow from the 
+beginning of the second half of the reactor length to the influent section, or a by-pass from the influent 
+section to the second half of the reactor length. Finally, Ren et al. (2009) developed the first 3-D 
+transient CFD model to elucidate the hydrodynamics of the three-phase (gas-liquid-solid) UASB 
+reactor. In the CFD simulation, a multiphase control volume, composed of one continuous 
+(wastewater) and two dispersed (gas bubbles and microbial granules) phases, was analysed with the 
+Eulerian-model (Dìez et al. 2007). 
+ 
+6.2.2.3 Models comparisons  
+The models proposed by Van der Meer and Heertjes (1983), Bolle et al. (1986a,b), Costello et al. 
+(1991a,b), Ojha and Singh (2002) and Singh et al. (2006) are CSTR-in-series models. They rely on many 
+assumptions but are simple to apply; their results can carry a large degree of uncertainty. More 
+complete models, which take into account the dispersion related to the reactor configuration, are those 
+proposed by Wu and Hickey (1997), Singhal et al. (1998) and Zeng et al. (2005). However, the best models are 
+those proposed by Kalyuzhnyi et al. (2006), Batstone et al. (2005), Mu et al. (2008) and Peña et al. 
+	   	   1	   12	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+(2006), who considered both biochemical reactions and dispersed flow, integrating the ADM1 model into 
+the dispersion model. Finally, it is also useful to apply CFD models, which are more complex than the 
+previous models but describe the hydrodynamic phenomena in more detail by considering the local 
+processes occurring in the reactor; one such attempt was made by Ren et al. (2009). 
+6.2.3.  Mathematical modelling of Anaerobic Biofilters 
+ABFs are anaerobic packed-bed reactors, characterized by the formation of a biofilm responsible for 
+the development of the anaerobic degradation of the influent substrate (Fig. 37 b). The influent flow 
+can travel along the reactor both in the upflow mode (UAF configuration) or in the downflow mode 
+(DAF configuration), although the first configuration is most widely applied (Fig. 37 b). The 
+advantages of ABFs are the operational simplicity, elimination of mixing devices, better capability to 
+withstand large toxic shock loads and the absence of a secondary clarifier. The major disadvantages are 
+related to the cost of the packing material and to the possibility of packing clogging caused by the 
+solids and biomass accumulation in the packing media (Gavrilescu, 2000; Rajeshwari et al., 2000). 
+To define the hydraulic behavior of ABFs it is important to take into account: i) the nature of the 
+anaerobic processes occurring within the reactor; ii) the production of biogas and iii) the accumulation 
+of biological solids.  
+One of the earliest attempts to model hydraulic behavior of such reactors was done by Young and 
+McCarty (1968) who proposed one of the first models for ABFs, based on reactors in series. They 
+developed a model of the process based on the premises of an ideal plug flow condition, making some 
+adjustments to take into account the effect of solids accumulation, the consequence of mixing due to 
+gas production and the existence of a diffusion gradient between the bulk liquid and the biological 
+solids surfaces. Young and Young (1988) proposed a new model as a combination of ideal systems, 
+composed by: a first CSTR, representing the inlet zone; an ideal plug-flow reactor with a dead zone, 
+representing the central part of the reactor and a second CSTR representing the outlet zone (Fig. 40a). 
+The dead-space region was introduced to take into account the physical configuration of the vessel,  
+the formation of stagnant eddies near the discontinuities such as corners, baffles and contact points of 
+the packing material, and the formation of stagnant areas adjacent to the surface. 
+Escudié et al. (2005) modeled the reactor considering two interconnected regions: a completely mixed 
+one representing the mixed liquid and a dead zone representing the biofilm (Fig. 40b). The resulting 
+	  mass balances were:  	   1	   13	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+$V_1 \dfrac{dC_1}{dt} = (Q_1 \cdot C_{in} + Q_2 \cdot C_2) - (Q_1 \cdot C_1 + Q_2 \cdot C_1)$                                         (69) 
+$V_2 \dfrac{dC_2}{dt} = (Q_2 \cdot C_1 - Q_2 \cdot C_2)$                                                                (70) 
+where: 
+ 
+V1 = ideal Continuous Stirred Tank Reactor ("CSTR1"), which represents the easily mixed liquid in the reactor [L3]; 
+V2 = ideal Continuous Stirred Tank Reactor ("CSTR2"), which represents the biofilm zone [L3]; 
+C2 = the tracer concentration within the biofilm [ML-3]; 
+C1 = the tracer concentration within the CSTR1 [ML-3]; 
+Cin = inlet tracer concentration [ML-3]; 
+Q1 = inlet liquid flow rate [L3T-1]; 
+Q2 = liquid flow rate between the two theoretical CSTRs [L3T-1]. 
+Assuming:  
+$C_1(0) = \dfrac{M}{V}$   (71) 
+C2 (0) = 0   (72) 
+A different configuration, composed by a CSTR with a dead zone, followed by a plug flow reactor, 
+and including a by-pass of the first reactor (Fig. 40c) was proposed by Smith et al. (1996). The authors 
+assumed that the flow through the mixed zone and the plug flow zones was sequential and localized in 
+correspondence of the biofilter bed, while the dead zone (Vd) was assumed to be parallel to the mixed 
+zone with a transfer flow between them, characterized by a transfer rate proportional to the difference 
+in concentration between the two zones.  
+  
+  
+  
+  
+ 
+ 
+ 
+ 
+ 
+ 
+	   	   1	   14	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+ 
+ 
+ Q1
+ 
+ V1 V2S1 S2
+ 
+  
+a. b. 
+ 
+ 
+c.   
+ 
+Figure 40. Modelling schemes of anaerobic biofilters proposed by a)Young and Young (1988), b) 
+Escudié et al. (2005) and c) Smith et al. (1996). 
+ 
+Finally Huang and Jih (1997) coupled a dispersion model with a deep-biofilm kinetic neglecting the 
+radial dispersion and the substrate removed by dispersed cells. They obtained the following equation:   
+$\varepsilon \dfrac{\partial S}{\partial t} + u \dfrac{\partial S}{\partial Y} = D \left( \dfrac{\partial^2 S}{\partial Y^2} \right) - aJ$                                    (73) 
+where: 
+S = the substrate concentration in the bulk liquid [ML-3]; 
+Y = the spatial distance [L]; 
+a = the specific biofilm surface area [L-1]; 
+ε = the fraction of reactor volume; 
+J = the substrate flux at biofilm surface [ML-2T-1], assumed equal to: 
+	   	   1	   15	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+$J = \beta \dfrac{\partial S}{\partial t}$                                               (74) 
+where: 
+β  = partition coefficient. 
+Equation (74) was solved considering steady-state conditions and applying the Dirichlet boundary 
+conditions. The authors additionally manipulated the equation normalizing it with reactor height and 
+obtaining the following expression: 
+$\theta \dfrac{\partial S}{\partial t} + \dfrac{\partial S}{\partial Y^*} = \dfrac{1}{Pe} \left( \dfrac{\partial^2 S}{\partial Y^{*2}} \right)$                                                 (75)
+where:  
+$Y^* = \dfrac{Y}{H}$;                                                                             
+$\theta = \dfrac{H (\varepsilon + \beta \cdot \varepsilon)}{u}$ = estimated HRT.                                
+6.2.3.2 Models comparisons  
+ 
+The models proposed by Young and McCarty (1968) and Young and Young (1988) are older CSTR-in-series 
+models; they are simple to apply, but their results can carry a large degree of uncertainty. More complete 
+models, which take into account the dispersion related to the reactor configuration, are those proposed by 
+Escudié et al. (2005), Huang and Jih (1997) and Smith et al. (1996), who introduced a more complete model 
+considering also the effect of biofilm growth.  
+6.2.4 Mathematical modeling of Anaerobic Biological Fluidized Bed Reactors 
+An AFBR is a vertical bed of inert particles (sand, pumice, activated coal) that serve as carrier 
+material for the biofilm development. The liquid to be treated is pumped through the bed at a 
+sufficient velocity to cause fluidization (Fig. 37c). In the fluidized state the carrier material provides a 
+large specific surface for attached biomass growth. This feature makes it possible to attain a long solids 
+residence time for the development of the biological reactions and a low concentration of suspended 
+solids. Mathematical reactor models for AFBRs have been developed as CSTR (Worden and 
+Donaldson 1987) or PFR (Bonnet et al. 1997). Models for AFBRs generally consist of three parts 
+	   	   1	   16	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+(Saravanan and Sreekrishnan, 2006): i) a bed fluidization model which describes the effect and the 
+feature of inert particles; ii) a biofilm model which describes the rate of substrate conversion per 
+individual granule and iii) a reactor flow model, which links the biofilm and the bed fluidization 
+models to yield the substrate concentration as a function of the axial position within the AFBR. 
+Many investigations suggested also that an axial dispersed plug flow model can be successfully used 
+to simulate the hydrodynamic processes occurring in AFBRs (Seok and Komisar 2003; Otton et al. 
+2000; Buffière et al. 1998 a, b; Schwarz et al. 1996-1997; Diez and Blanco 1995). 
+Bonnet et al. (1997) assumed that no dispersion occurs in AFBR reactors. The authors extended the 
+PFR model considering un-steady state conditions and taking into account many components involved 
+in the process such as: organic matter, VFA, methane, carbon dioxide, acidogenic and methanogenic 
+bacteria. The dynamic model was developed considering the liquid and solid phase separately to 
+compute the mass balance for all the process components and the momentum equation to link the 
+solid and the liquid velocities. The authors used the model to study the effect of different parameters, 
+including hydraulic and biological variables. 
+Buffière et al. (1998a, b) stated that the liquid mixing is well represented by an axially dispersed PFR 
+model. Studying the effect of gas production on the hydrodynamic behavior of an AFBR, the authors 
+demonstrated that this production is able to modify the axial mixing degree, which is responsible for 
+the establishment of a concentration gradient in the reactor. In contrast Diez and Blanco (1995) stated 
+that it is possible to study the AFBR as a solid-liquid fluidized bed neglecting the effect of biogas on 
+the hydrodynamic behavior. The authors also described the important role of the biofilm growth on 
+the hydrodynamic behavior showing that the biofilm produces significant effects on the relationship 
+between the up-flow velocity and the bed expansion.  
+Turan and Ozturk (1996) studied the effect of the anaerobic biomass concentration on the hydraulic 
+retention time and the dispersion coefficient. The authors applied the axial dispersion equation and 
+defined the values of the Peclet number using the equation proposed by Van der Laan et al. (1957):  
+$\sigma^2(\theta) = 2Pe^{-1} - 2Pe^{-2}\left[ 1 - \exp(-Pe) \right]$                          (76) 
+where: 
+σ2 (θ) = the variance of the theoretical response curve for closed reactor.  
+Similarly, Seok and Komisar (2003) developed an axial-dispersion model to simulate the behaviour of 
+AFBRs, neglecting the effect of the gas formation on the hydrodynamic behaviour. They applied their 
+model to quasi-steady state conditions, considering no external mass transfer resistance due to good 
+	   	   1	   17	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+local mixing and small external boundary layers (Buffière et al. 1998c; Schwarz et al. 1996), 
+obtaining the following mass balance equation: 
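+$\dfrac{\partial C_i(z,t)}{\partial t} = -\dfrac{u}{\varepsilon} \dfrac{\partial C_i(z,t)}{\partial z} + D \dfrac{\partial^2 C_i(z,t)}{\partial z^2} + \Pi_i(z,t) + M_{w,i} C_i(z,t)$                             (77) 
+$\dfrac{\partial C_j(z,t)}{\partial t} = -\dfrac{u}{\varepsilon} \dfrac{\partial C_j(z,t)}{\partial z} + D \dfrac{\partial^2 C_j(z,t)}{\partial z^2} + \Pi_j(z,t) + r_{w,j}(z,t) + T_j(z,t)$                 (78) 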
+where: 
+Ci = concentration of the suspended microbial species i in the bulk liquid [ML-3]; 
+Cj = concentration of substrate j in the bulk liquid [ML-3]; 
+u = superficial liquid velocity [LT-1];  
+ε = bed porosity;  
+D = axial dispersion coefficient [L2T-1];  
+Πi = exchange rate of microbial species i between bulk liquid and bio-particle [ML-3T-1]; 
+Mw,i = net growth rate of microbial species i in the bulk liquid [T-1]; 
+Πj =  transport rate of substrate j from the bulk liquid into the biofilm [ML-3T-1]; 
+rw,j = net formation rate of substrate j in the bulk liquid [ML-3T-1]. 
+ 
+The authors rearranged equations (77-78) introducing moving boundaries conditions and a system of 
+normalized time-dependent spatial coordinates to simulate the bed expansion, the segregation along 
+the reactor height and the microbial population distribution both along the reactor height and inside the 
+biofilm. They paid particular attention to the bio-particle segregation phenomena associated with the 
+biofilm exchange processes observed in the experimental study, but they partly neglected the 
+theoretical interpretation of the hydrodynamics. 
+ 
+6.2.4.1 Models comparisons  
+The model proposed by Bonnet et al. (1997) is a plug-flow model, simple to apply but the results can 
+present a big degree of uncertainty. More complete models taking into account the dispersion related 
+to reactor configuration are the ones proposed by Seok and Komisar (2003), Otton et al. (2000), 
+Buffière et al. (1998 a, b), Schwarz et al. (1996-1997) and Diez and Blanco (1995). More complete 
+models are the ones where also the gas production is taken into account, such as the models proposed 
+	  by Buffière et al. (1998a, b). 	   1	   18	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+6.2.5. Mathematical modeling of wet and dry digesters treating bio-solids 
+The term digester usually refers to anaerobic reactors used for the treatment of OFMSW or 
+sewage sludge. The process is termed low-solids, or wet, whenever the TS in the feed is below 10%, and 
+high-solids, or dry, whenever the TS is higher than 20%. Wet processes take place in closed reactors 
+equipped with mixing systems aimed at minimizing the in-homogeneities in the treated fluid. 
+Nonetheless RTD studies carried out on full-scale digesters have shown that actively mixed volumes 
+are generally as low as 23% of the total volume (Monteith and Stephenson, 1981), and therefore, 
+together with traditional models assuming CSTR conditions, different approaches able to take into 
+account the effect of non-ideal mixing conditions have also been proposed. Dry processes, instead, 
+take place in different reactors working in batch or continuous conditions. They have been rarely 
+modelled in terms of hydrodynamic conditions. One attempt was done by Zaher and Chen (2006) who 
+built mathematical models for industrial scale plug flow reactors (Dranco, Kompogas and Valorga 
+designs). The authors used both ADM1 and Aquasim® software (Reichert, 1998) as a simulation 
+platform. All different designs were modelled imposing CSTR in series configuration and introducing 
+bifurcations to take into account recycling effects. One of the earliest attempts to model non-ideal 
+mixing conditions of wet digesters was done by Smith et al. (1993). The authors proposed the same 
+approach used to model the ABFs, considering three zones: a small initial mixed zone, a large main 
+mixed zone and a dead zone. A dispersion coefficient was also used to describe the cross boundary 
+movement of the substrate from the mixed zones into the dead zone. Mendoza and Sharratt (1999) 
+proposed a compartment model with a confined-gas mixing (Fig. 41). The authors assumed that the 
+circulation around the uptake tube can be represented by an ideally mixed compartment. Moreover 
+they assumed that the fluid circulation, down the tank and back to the draft tube inlet, can be 
+represented by a number of equally sized tanks-in-series (Fig. 41). The mass balances resulted in the 
+following set of linear first-order ordinary differential equations:  
+dCm ⎛C1,1 −Cm ⎞ Cb −C= ⎜ ⎟+ m
+dt ⎜⎝ αt ⎟r ⎠ αtc                                               (79) 
+dC1,1 N (C0 −C1,1) N (Cm −C= + 1,1
+)
+dt (1−α)tr 2(1−α)tc                                      (80) 
+dC1,3 N(C= 1,1
+−C1,2 )                                                     (81) 
+dt 2(1−α)tc
+	   	   1	   19	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+$\dfrac{dC_b}{dt} = \dfrac{N (C_{1,3} - C_b)}{2(1-\alpha) t_r} + \dfrac{N (C_{2,3} - C_b)}{2(1-\alpha) t_c}$                                     (82) 
+where: 
+C = non-reactive substrate concentration [ML-3]; 
+m = index of components inside mixed volume Vm; 
+b = index of components inside mixed volume Vb; 
+1, 2, 3 = index of components inside mixed volumes V1, V2, V3 respectively; 
+tr = the mean retention time in the vessel [T]; 
+tc = the circulation time [T]; 
+N = the number of reactors in series; 
+	  α  =  the ratio of ideally mixed volume to the total liquid volume. 
+	   	  	  
+Figure 41. Flow reactor scheme of anaerobic digester proposed by Mendoza and Sharratt  (1999), 
+where m = index of components inside mixed volume Vm , n = the number of reactors in series, Q = 
+flow-rate. 
+ 
+Another simple two region model was proposed by Mendoza and Sharratt (1998) (Fig.42). This model 
+assumes that the whole volume can be divided into two sections, called, respectively, flow-through 
+region and retention region. Both regions are assumed to be perfectly mixed but the transfer of 
+material between them is limited, as the retention region behaves like a stagnant zone. Different levels 
+of mixing are accomplished by adjusting the relative volume of the flow-through region and the 
+exchange rate between regions expressed as the turnover time of material in the vessel. The mass 
+	   	   1	   20	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+balance for a generic component j (Fig. 42) yields to a set of ordinary differential equations which can 
+be summarized: 
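+$$\frac{dC_{1,j}}{dt} = \frac{C_{0,j} - C_{1,j}}{\alpha \tau} + \frac{C_{2,j} - C_{1,j}}{\alpha \theta} \pm R(C_{1,j}) \tag{83}$$
+$$\frac{dC_{2,j}}{dt} = \frac{C_{1,j} - C_{2,j}}{(1-\alpha)\theta} \pm R(C_{2,j}) \tag{84}$$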
+where: 
+j = index of different components involved in mass balance: degradable portion of viable activated 
+sludge microorganism, particulate solids requiring hydrolysis, soluble substrates for acid formers, 
+degradable portion of acidogenic biomass, VFA for methanogens, methanogenic biomass, methane; 
+θ = V/Qexch is the turnover time [T]; 
+Qexch = flow exchange between zones [L3T-1]; 
+α  = ratio of the volume in flow-through region to the total reactor volume [ad.]; 
+(1-α)  =  relative volume of the retention region [ad.]. 
+ 
+In the set of the presented equations, equation (83) with odd numbers, applies to the flow-through 
+zone whereas equation (84), with even numbers, applies to the retention zone. 
+ 
+Figure 42. Reactor flow model of anaerobic digesters proposed by Mendoza and Sharratt (1998), 
+where the subscript: 1= flow-through region; 2 = retention region; exch = exchange between zones; α 
+= ratio of the volume in flow-through region to the total reactor volume; S1, S2 = soluble substrate 
+COD concentration; P1, P2 = degradable particulate COD concentration; X1, X2 = biomass 
+concentration. 
+Later, Keshtkar et al. (2003) proposed the same mathematical model as Mendoza and Sharratt (1998) 
+combining the two-region mixing model with a proper structured kinetic model. 
+121
+CHAPTER 6 – LITERATURE REVIEW 
+Vavilin et al. (2001, 2003) introduced a system of parabolic partial differential equations in a 2D 
+reactor imposing cylindrical symmetry.  The proposed system describes the VFA and methanogenic 
+biomass concentration profiles along the reactor height at different times. In more detail, the authors 
+tried to simulate anaerobic reactors which treat solid waste by applying a distributed model that includes 
+diffusion and advection of VFA and methanogenic biomass. 
+Vesvikar and Al-Dahhan (2005) carried out 3-D steady-state Computational Fluid Dynamics (CFD) 
+simulations of anaerobic digesters to visualize the flow patterns, obtaining the hydrodynamic 
+parameters of the reactors. Another attempt to develop a mathematical model with CFD simulations 
+was done by Wu and Chen (2008) who conducted a numerical simulation of the flow field to 
+qualitatively and quantitatively characterize the mixing and dead zones. The CFD model developed 
+was based on continuity and momentum equations and on the standard semi-empirical turbulence 
+model proposed by Launder and Spalding (1974). 
+Terashima et al. (2009) proposed a homogeneous single-phase, laminar flow CFD model and selected 
+a momentum equation for simulating the flow patterns in the digester. The authors introduced the 
+following Uniformity Index (UI), using as statistical parameter Relative Mean Deviation (RMD), that 
+characterizes the mixing inside the anaerobic reactor: 
+$$V = \sum_{i=1}^{m} V_i \tag{85}$$
+$$C' = \frac{\sum_{i=1}^{m} C_i \cdot V_i}{V} \tag{86}$$
+$$UI = \frac{\sum_{i=1}^{m} \left| C_i - C' \right| \cdot V_i}{V \cdot C'} \tag{87}$$
+where: 
+V = the volume of digester [L3]; 
+Vi  = the partial volume for numerical calculation [L3]; 
+Ci = the local tracer substrate concentration [ML-3];  
+C’ = the average tracer concentration in the digester [ML-3]. 
+ 
+	   	   1	   22	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+6.2.5.1 Models comparisons  
+The models proposed by Monteith and Stephenson (1981), Mendoza and Sharratt (1998, 1999), Smith 
+et al. (1993) and Keshtkar et al. (2003) are CSTR in series models, simple to apply but the results can 
+present a big degree of uncertainty. More complete models taking into account the dispersion related 
+to reactor configuration are the ones proposed by Vavilin et al. (2001, 2003). Finally it is also useful 
+to apply CFD models that are more complex than the previous models but describe the hydrodynamic 
+phenomena more in detail, considering the local process that happens in the reactor, these attempts 
+were done by Terashima et al. (2009), Wu and Chen (2008) and Vesvikar and Al-Dahhan (2005). 
+6.2.6. Model comparisons and validation and calibration 
+6.2.6.1 Models comparisons 
+The models presented above for UASB, fluidized bed reactor, biofilter reactor and anaerobic digester 
+treating bio-solids have different advantages and disadvantages. Furthermore there are some models 
+which can be useful in some situation and not in others.  
+ 
+6.2.6.2 UASB reactor model validation and calibration 
+Tracer experiments (performed with non reactive substrate) were carried out to validate the multi-
+compartment models proposed for UASB reactors (Ojha and Singh, 2002; Bolle et al. 1986a,b; Wu 
+and Hickey, 1997). Some of them were used to calibrate the model’s parameters. Ojha and Singh 
+(2002) estimated each of the hydraulic parameters of the models proposed by Bolle et al. (1986a,b) 
+and Wu and Hickey (1997), obtaining always good values of the determination coefficient, defined as:  
+$$R^2 = \frac{\sum_{i=1}^{n} (x_i - \bar{x})^2}{n}.$$
+Batstone et al. (2005) compared the multi-compartment models with the axial-dispersion model and 
+obtained the best fitting between the experimental data of tracer tests operated at laboratory scale and 
+the model's results in case of a multi-compartment model with eight tanks. The authors also used lab-
+scale experimental data to calibrate their model, estimating the dispersion number as well as the 
+123
+CHAPTER 6 – LITERATURE REVIEW 
+governing biochemical kinetic parameters such as the maximum uptake rate and the half-saturation 
+concentration.  
+The CSTR model proposed by Singh et al. (2006) was tested at different temperatures, fixing the HRT 
+= 10 hours. The data fit was satisfactory for temperature values higher than 22°C, with a 
+determination coefficient varying between 0.98 and 0.94, supporting the assumption that a complete 
+mix flow pattern exists inside the reactor at elevated temperatures. At lower temperatures, instead, the 
+model was proven to be inadequate to describe the data sets, probably because of the reduced biogas 
+production.  
+Because of the important role of biogas production on the reactor hydrodynamic behavior Wu and 
+Hickey (1997) carried out a calibration of their model at bench scale, varying the gas production rate. 
+Lately Singhal et al. (1998) demonstrated that a simple two-compartment axial-dispersion model was 
+adequate to explain the fluid flow characteristics without sacrificing the accuracy of the predictions. 
+They found a good fitting between the model predictions and the response of an UASB reactor to an 
+impulsive input of a non-reactive tracer. Zeng et al. (2005) developed a parameter estimation 
+procedure to yield acceptable agreement between measured and calculated tracer trajectories and 
+obtained a correlation between the dispersion number and the up-flow velocity for different reactor 
+heights. Wu and Hickey (1997) observed the responses of an UASB reactor to an influent step 
+increase, predicting the working volume, the dead volume and the plug-flow reactor volume which 
+resulted in a close agreement with the total reactor volume. The authors performed also a sensitivity 
+analysis on the major factors influencing the reactor performances and found that the distribution of 
+the tracer within the reactor was largely dependent on diffusion processes. Kalyuzhnyi et al. 
+(1997,1998) made a comparison between the experimental data of Alphenaar et al. (1993) and the 
+model predictions, obtaining a determination coefficient >0.99. The authors demonstrated that the 
+dispersed plug-flow model was able to describe adequately a sufficiently big pool of experimental 
+data but also revealed some deficiencies in its conceptual structure. In particular they showed that 
+the model overestimates the effluent substrate concentration and the amount of volatile suspended 
+solids in the reactor. Lately Kalyuzhnyi et al. (2006) compared model's predictions and experimental 
+data recorded by Yan et al. (1989, 1993). Although they did not report the obtained values of the 
+determination coefficient or any other statistical index, it is possible from the presented diagrams to 
+appreciate a close trend between the experimental data and the simulated ones, especially in terms of 
+COD reduction.  
+	   	   1	   24	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+Mu et al. (2008) used the ADM1 as a basis for the development of a comprehensive distributed 
+parameter model, named ADM1d, that used a hyperbolic tangent function to describe the biomass 
+distribution within a one compartment model. The authors made a comparison of ADM1 and ADM1d 
+outputs and showed that ADM1d was better suited for modeling anaerobic reactors with limited 
+mixing and high organic load, such as UASB reactors. The model was also validated by Tartakovsky 
+et al. (2008), using the experimental results obtained at laboratory scale. They found that ADM1d 
+gives a good description of biogas flow rates, methane concentration, COD effluent concentrations 
+and VFA under different organic loads and recirculation rates. Additionally the authors demonstrated 
+that the model was able to simulate COD and VFA gradients along the reactor height. Batstone et al. 
+(2005) performed also tracer tests at full scale and demonstrated that the best fitting of experimental 
+tracer tests was achieved with the two-CSTR model. Peña et al. (2006) and Peña (2002) demonstrated 
+that the ideal flow pattern occurs only when the operational conditions are close to the design 
+scenario, with a particular reference to the HRT design value. They showed that when the reactor is 
+under-loaded, there is a hydrodynamically dispersed flow pattern with the coexistence of a well-mixed 
+fraction, stagnant zones and short-circuiting flows. The authors obtained a correlation between the 
+dispersion number, the effluent concentrations of COD and the effluent concentration of total 
+suspended solids revealing that the optimal hydrodynamic condition occurs somewhere in between the 
+two ideal flow extremes (i.e., plug flow and complete mixing). Ren et al. (2009) performed a 3-D 
+unsteady CFD model to visualize the phase holdup and obtained their flow patterns in a UASB 
+reactor. The simulation results further confirmed the discontinuity in the mixing behavior throughout 
+the UASB reactor and the key role of the dispersion coefficient, that decreases along the axis of the 
+reactor. In order to better describe the hydrodynamic behavior of the reactor they successfully 
+introduced the Increasing-sized CSTRs (ISC) model and made a comparison with a CSTR in series 
+model demonstrating that the results of the first one match the measured non-reactive substrate 
+trajectories better than the results of the second one.  
+ 
+6.2.6.3 Anaerobic Biofilters model validation and calibration 
+Young and Young (1988) performed tracer experiments in order to define the dead space volume and 
+the mixing ratio as a function of Reynolds number for the model proposed to simulate ABFs hydraulic 
+behavior. The authors demonstrated that the plug flow and the dead space increase with the specific 
+	   	   1	   25	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+surface area of the media. Although the authors recognized the interference between the hydrodynamic 
+and the biological process they did not present a complete model to simulate both. 
+Escudié et al. (2005) validated the proposed model and estimated the following key parameters from a 
+tracer curve analysis: the volume of the first theoretical CSTR, the volume of the dead zone and the 
+value of the exchange flow between the two reactors. The values were obtained by minimizing the 
+difference between the experimental data and the model results.  
+Smith et al. (1993) carried out hydrodynamic studies to define scale-up strategies, obtaining a 
+correlation between laboratory scale reactor tracer tests and the volume of plug flow and mixed zone 
+of full-scale reactors. Varying the impeller power, the authors defined with tracer tests and 
+computational methods, the values of the dispersion coefficients, the volumes of the dead zone, the 
+initial mixed zone and the large main zone. The authors also investigated through tracer studies the 
+effect of liquid up-flow velocity and biogas production on the degree of reactor mixing. Thus they 
+obtained different values of hydrodynamic parameters with different operating conditions and media 
+types inside the reactor. 
+Tay et al. (1996) performed tracer tests to define the hydraulic characteristics of ABFs. The study 
+revealed that the behavior of ABF reactors reflects more closely a plug-flow system with a certain 
+degree of dispersion: this is clearly shown by the obtained values of the dispersion number, ranging 
+from 0.0022 to 0.0045 for an HRT varying from 24 h to 6 h. Additionally the study demonstrated that 
+the hydrodynamics and the extent of mixing can regulate the mass transfer and can have an important 
+influence on the degree of contacts between the substrate and the bacteria, therefore affecting the 
+whole ABF efficiency. In a second study, Tay and Show (1998) performed tracer tests considering 
+dirty-bed and clean-bed conditions. They observed with clean bed conditions hydraulic flow patterns 
+closer to a plug-flow system with a relatively large amount of dispersion, while in the case of dirty-
+bed conditions the flow pattern was found to be more similar to completely mixed flow conditions 
+with high value of the dead-space (from 43-51%).  
+Huang and Jih (1997) made tracer experiments with a laboratory scale reactor to study the diffusion 
+inside the reactor and thus defining the value of the Peclet number. Estimated values ranged from 0.01 
+to 1.5, reflecting that back-mixing occurs in biofilters due to the rising bubbles of biogas. Additionally 
+the authors compared the experimental data and simulation results with reference to COD removal 
+efficiency, obtaining a standard deviation of +/- 5%. The calculated COD removal efficiency using the 
+CSTR model was found to be close to or lower than that using the axial dispersion model. They also 
+126
+CHAPTER 6 – LITERATURE REVIEW 
+studied the VFA profile along the reactor and claimed that the flow pattern in the liquid phase was 
+completely mixed. 
+6.2.6.4 Anaerobic Fluidized Bed Reactor model validation and calibration 
+Buffière et al. (1996) performed tracer experiments on an AFBR at very low gas flow rates and 
+observed that the axially dispersed plug-flow model was not accurate enough to simulate the 
+experimental data. In fact the tracer response curves were characterized by secondary peaks, 
+suggesting the presence of an internal recycle current. The tank in series model led to a better fitting 
+of the experimental data at low gas velocities. However, the model performance was equivalent to the 
+performance of the axially dispersed plug flow model at higher gas velocities. The authors Buffière et 
+al. (1998a,b) correlated the degree of mixing in the bioreactor to the Peclet number, showing that the 
+mixing conditions of the liquid phase have a slight influence on the reactor performances. 
+Buffière et al. (1998a,b) stated that for modeling purpose of AFBRs it is necessary to know the 
+variations of the Peclet number and of the axial dispersion coefficient. The authors tested several 
+correlations to fit the experimental determination of the dispersion number, and found that the most 
+appropriate one was the expression proposed by Muroyama and Fan (1985), which corresponds to the 
+expression of a modified Peclet number, calculated with the column diameter as space length 
+parameter: 
+$$\frac{D_c U_1}{\varepsilon \cdot z} = 1.01\, U_1^{0.738}\, U_g^{-0.167}\, D_c^{-0.583} \tag{88}$$
+where: 
+U1 = liquid velocities [LT-1]; 
+Ug = gas velocities [LT-1]; 
+Dc = column diameter [L]; 
+z = column length [L]. 
+ 
+Turan and Ozturk (1996) obtained a correlation between the biological growth concentration and the 
+ratio between Peclet and Reynolds numbers with a determination coefficient equal to 0.569. Assuming 
+clean media, they also obtained a correlation between the HRT, Peclet and Reynolds numbers ratio: 
+$$t = 26.6 \left(\frac{Pe}{Re}\right)^{0.312}, \qquad r^2 = 0.54 \tag{89}$$
+	   	   1	   27	   	   	   	   	  
+CHAPTER 6 – LITERATURE REVIEW 
+ 
+Otton et al. (2000) performed tracer tests using a simple tubular reactor to calibrate and validate the 
+proposed hydrodynamic model. They quantified the recycling effect as a plug flow with a variable 
+delay and the fluidization effect as an axial dispersion phenomenon. The authors only qualitatively 
+discussed the validation; the presented graphs indicate a satisfactory agreement between all 
+experimental data and the model simulation, but the model could not describe small variations of the 
+operating parameters that occurred inside the reactor. 
+ 
+6.2.6.5 Wet and dry digesters model validation and calibration 
+Mendoza and Sharratt (1999) carried out tracer experiments at different flow rates to define the 
+number of tanks-in series able to better simulate non-ideal flow in wet digesters. The authors obtained 
+experimental results making tracer tests and demonstrated a good fitting between compartment model 
+results and experimental tests. In the previous work, Mendoza and Sharratt (1998) did not perform 
+any model calibration and validation but made an evaluation of the impact of the mixing parameters 
+and showed that the relative volume of the flow-through region has a more significant effect than the 
+turnover time (θ). The authors demonstrated that the degree of the liquid mixing affects the residence 
+time distribution and the distribution of the components inside the reactor, influencing the kinetic rates 
+of the anaerobic process. 
+Keshtkar et al. (2003) compared preliminary simulations with sequencing batch experimental runs, 
+measuring methane yield at various organic loading rates for an HRT = 3 days, to determine the most 
+appropriate set of mixing model parameters. 
+In the context of CFD models, Wu and Chen (2008) operated model's validation by comparing the 
+predicted velocities with the experimental data proposed by Pinho and Whitelaw (1990). Finally, 
+Terashima et al. (2009) made a comparison between experimental and CFD tracer response curve, 
+finding a reasonably good fitting and analyzed the progress of mixing in the digester by defining a 
+new parameter of uniformity index (UI). The developed model could be a useful tool to define the 
+required time for complete mixing in a full-scale digester at different solid concentrations and 
+different mixing rate. Also Vesvikar and Al-Dahhan (2005) carried out 3D steady-state CFD 
+simulations considering different digester configurations. The authors performed CFD simulation in 
+terms of overall flow pattern, location of circulation cells and stagnant regions, trends of liquid 
+128
+CHAPTER 6 – LITERATURE REVIEW 
+velocity profiles, and volume of dead zones. The results showed good qualitative comparison with the 
+experimental data in terms of flow pattern, location of dead zones and trends in velocity profile. 
+6.2.7. Conclusion 
+Development of high-rate reactors has made anaerobic treatment an attractive option to treat 
+wastewaters and bio-solids. In this chapter, mathematical models to simulate plug flow and dispersed 
+plug flow of four specific anaerobic bioreactor configurations, i.e. Upflow Anaerobic Sludge Blanket 
+Reactors, Anaerobic Fluidized Bed Reactors, Anaerobic Biofilters, wet and dry Digesters are 
+reviewed. This review details the effect of hydrodynamics/flow pattern on the reactor performance. 
+Most models are based on CSTR in series and axial dispersion equations to simulate the 
+hydrodynamics of plug flow reactors. They mainly differ by the numerical techniques and the 
+boundary conditions used to solve the mathematical equations. Model calibration is often aimed at 
+assessing the key hydrodynamic parameters, i.e. the dispersion number or the Peclet number, by 
+operating tracer test. When the model includes both a hydrodynamic module of the reactor and a 
+biochemical module to simulate the biochemical reactions, model calibration is also aimed at 
+assessing the kinetic constants. The research also describes the attempts to validate the proposed 
+models, illustrating the models capability to fit the experimental data. In all reported models 
+reasonably good fitting was found between model results and experimental data.  
+Most of the models described in this chapter are useful tools for operational optimization of waste and 
+wastewater treatment plants but there are still only few attempts to apply the proposed models for 
+optimum design and scale-up of these bioreactors. This indicates that further research efforts should 
+be focused on such design models to provide a mathematical tool for bioreactor sizing purposes.
+ 
+ 
+ 
+ 
+	   	   1	   29	   	   	   	   	  
+CHAPTER 7– DISCUSSION AND CONCLUSIONS 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+CHAPTER 7 
+Discussion and Conclusions 
+ 
+	  	  
+ 
+	  	  
+	  	  
+	  
+	  	  
+	  	  
+	   	   1	   30	   	   	   	   	  
+CHAPTER 7– DISCUSSION AND CONCLUSIONS 
+7.1 Discussion and Conclusions 
+ 
+In the present research, the effect of TS content on dry and wet AD of different complex organic 
+substrates was studied. The results indicate that water plays in both conditions an essential role on the 
+specific methane production rate and VS degradation. In terms of final methane production yield, a 
+different behaviour between wet and dry AD conditions was found. In particular in wet AD of carrot 
+waste the same value of the final methane production yield, i.e. 450 mL/gVS with a standard deviation 
+of 14.23 was found. This is not in agreement with the results obtained in both dry and semidry 
+conditions with both rice straw and food waste. In these cases a higher final methane production yield 
+was found with lower TS values. This last finding is in agreement with previous tests performed by 
+Abbassi-Guendouz et al. (2012), Fernández et al. (2008) and Dong et al. (2010).  
+It is worth mentioning the existence of a linear relationship obtained in the case of carrot waste and 
+food waste between TS content and initial methane production rate (Fig. 43). Such relationship was 
+also observed by Lay et al. (1997b) on AD of selected dry organic waste (e.g. sludge cake, meat, 
+carrot, rice, potato and cabbage), Le Hyaric et al. (2012) on AD of cellulose, Abbassi-Guendouz et al. 
+(2012) on AD of cardboard, Mora-Naranjo et al. (2004) for waste samples excavated from landfill and 
+Pommier et al. (2007) for paper waste. The presented results confirm that the TS content, also in wet 
+AD, has a strong effect on the kinetic rates. At lower TS, due to the increasing water content and 
+better transport and mass transfer conditions, it seems to be plausible that the microorganisms are 
+better sustained with soluble substrates (Mora-Naranjo et al. 2004). This was not confirmed by the 
+tests carried out on rice straw (Fig. 43). This can be due to the different substrate composition and to 
+the complex nature of lignocellulosic compounds and difficult bio-availability of cellulose (Sambusiti, 
+2013). Further tests have to be done to explain this behaviour in detail. In particular a larger range of 
+TS have to be investigated to understand in detail the correlation between TS content and initial 
+methane production rate.  
+	   	   1	   31	   	   	   	   	  
+CHAPTER 7– DISCUSSION AND CONCLUSIONS 
+ 
+Figure 43. Linear correlation between initial methane production rate and TS for anaerobic digestion 
+of carrot waste, food waste and rice straw. 
+ 
+Inhibition tests were carried out to investigate the specific inhibition processes that take place with 
+complex organic compounds. A different behaviour in terms of VFAs concentration was found. In wet 
+AD of carrot waste no VFAs accumulation was observed, and all the concentrations were lower than 
+the inhibition threshold values, while in dry and semidry digestion acid accumulation was found. This 
+means that inhibition occurs with lack of water and this inhibition is the cause of the lower final 
+methane production yield with higher TS contents. However, in the specific case of rice straw, it was 
+noticed a similar value of the final specific methane production yield in the case of dry and semi–dry 
+conditions but a significant difference in terms of VFAs concentrations between these two different 
+tests. This might be due to another inhibition mechanism that occurs beyond a threshold value of TS 
+content, that can explain the similar value of final methane production at different TS contents. Thus, 
+the soluble phenols were analysed to better understand the process inhibition with higher TS content. 
+An accumulation of free phenolic compounds in the liquid bulk of the digesting mixture was found 
+and can explain the inhibition problems observed over TS content of 15%. This can be related to the 
+effect of the hydrolysis of lignocellulosic material that is composing the rice straw. Thus, there is a 
+transfer of phenolic matter from the solid matrix of the digestate to the liquid matrix. In reactors with 
+TS content of 23.4 %, due to the lack of water, for the same release of phenolics, the hydrolysis leads to 
+higher concentrations that are probably above the methanation inhibition limit. This could explain the 
+specific methane production kinetics as well as the VFA accumulation due to the inhibition of the 
+methanogenesis step. 
+132
+CHAPTER 7– DISCUSSION AND CONCLUSIONS 
+Further studies were also done to compare the process performances also in terms of VS and COD 
+degradation. For both substrates, rice straw and food waste, the better performances were observed at a 
+lower TS content. This finding is in agreement with the measured final methane production yield.  
+It has to be stressed that the higher TS content in the batch reactor without mixing implies 
+heterogeneous conditions inside the reactor and possible accumulations of inhibitory compounds 
+inside specific reactor zones are likely to occur. In full-scale reactor the accumulation of inhibitory 
+compound in a specific reactor zone could imply operating problems and reactor acidification. Thus it 
+is important for each specific reactor configuration to monitor the process and identify specific 
+conditions that could determine such inhibition problems.  	  
+In particular, further studies have to be done to identify the highest TS content that can be accepted 
+in an anaerobic reactor, above which acidification phenomena occur, i.e. the maximum TS value before 
+complete process inhibition. On this topic, only one study has been carried out so far, by Abbassi-Guendouz 
+et al. (2012), who found a threshold concentration of 30% TS that determines an inhibitory effect in 
+high solids anaerobic digestion. This threshold could correspond to an inhibition of anaerobic 
+digestion at high solids content due to accumulation of metabolic by-products, such as volatile fatty 
+acids. 
+Moreover further research is needed to define the optimal TS of anaerobic digestion of food waste and 
+rice straw. In the present work the wet digestion was individuated as the best option to maximize the 
+specific final methane yield, but there is a need to make also an economical balance taking into 
+account different process costs. In particular for a specific full-scale reactor, it has to be done a 
+balance between the economical return related to higher specific methane production and the 
+additional costs of water use, digestate production and pre-treatments needed. However this study is 
+beyond the scope of this research and it has to be treated case by case considering a specific reactor 
+configuration and waste type to be treated. 
+Another instrument useful for full-scale reactor operation can be a complete mathematical model of 
+the anaerobic digestion process considering dry and wet conditions. This model can simulate the 
+effect of TS content on the process performances. In this thesis a mathematical model was proposed 
+and the model calibration was done only using the data obtained from batch experiments. The 
+proposed model can be applied to simulate full-scale application, and also can be calibrated by using 
+the data of full-scale plant considering the nature and quantity of the substrate to be treated and the 
+specific reactor configuration. 
+	   	   1	   33	   	   	   	   	  
+CHAPTER 7– DISCUSSION AND CONCLUSIONS 
+Considering all the results obtained in the present work, considerable effort is still required to 
+understand the dry anaerobic digestion process in depth. In particular, the following research gaps and 
+needs should be considered: 
+•  increase the understanding of the effect of the reactor configuration, optimizing the operating 
+conditions; 
+•  increase the understanding of the dry anaerobic digestion processes through the comprehensive 
+analysis of the roles of phase separation, microbial community distribution patterns, hydrogen ion 
+partial pressure and accumulation of toxic compounds;   
+• understand the different effect of specific process inhibitors such as (Heavy Metals) HMs on 
+different TS anaerobic digestion processes; 
+• define optimized reactor configurations in terms of mixing conditions for different TS contents in 
+the reactor. This can be addressed performing hydrodynamic tests aimed at assessing the mixing effect 
+and the degree of dispersion in the reactor in order to define a configuration capable to reduce the 
+dispersion and short-circuiting problems. 
+Hydrodynamic experiments on plug flow laboratory scale reactor can be conducted with water and 
+tracer, to understand how the hydrodynamic is influenced by flow-rate variations and reactor 
+configurations (length, diameter, presence of impellers) and individuate the degree of dispersion with 
+different flow-rate values. Hydrodynamic experiments should be conducted also in anaerobic 
+conditions with inoculum and substrate to assess the effect of the substrate amount in the reactor and 
+TS content on the degree of dispersion. Further efforts have to be done also to study full-scale reactor 
+hydrodynamics and to model the AD process considering dispersion conditions. 
+	   	   1	   34	   	   	   	   	  
+REFERENCES 
+	  
+References 
+ 
+Ábalos, M., Bayona, J., Pawliszyn, J., (2000). Development of a headspace solid-phase 
+microextraction procedure for the determination of free volatile fatty acids in waste waters. J. of 
+Chromatogr A, 873, 107-115. 
+ 
+Abbassi-Guendouz, A., Brockmann, D., Trably, E., Dumas, C., Delgenès, J.P., Steyer, J.-P. & Escudié 
+R. (2012) Total solids content drives high solid anaerobic digestion via mass transfer limitation. 
+Bioresour. Technol., 111, 55–61. 
+ 
+Ahring, B.K., Sandberg, M., Angelidaki, I., (1995). Volatile fatty acids as indicators of process 
+imbalance in anaerobic digestors. Appl. Microbiol. Biot., 43, 559-565. 
+ 
+Alex, J., Kolisch, G., and Krause, K. (2002). Model structure identification for wastewater treatment 
+simulation based on computational fluid dynamics. Water Sci. Technol. 45(4-5), 325-334. 
+ 
+Alphenaar, P.A., Visser, A. and Lettinga, G. (1993). The effect of liquid upward velocity and 
+hydraulic retention time on granulation in UASB reactors treating waste water with a high sulphate 
+content. Bioresour. Technol., 43, 249–258. 
+ 
+Amani, T., Nosrati, M., Sreekrishnan, T.R., (2010). Anaerobic digestion from the viewpoint of 
+microbiological, chemical, and operational aspects - a review. Environ. Rev. 18, 255–278. 
+ 
+Annachhatre, A.P. (1996). Anaerobic treatment of industrial wastewaters. Resour. Conserv. 
+Recycl., 16, 161-66. 
+ 
+	   	   1	   35	   	   	   	   	  
+REFERENCES 
+APHA. (1998) Standard Methods for the Examination of Water and Wastewater, 20th ed., United 
+Book Press, Inc., Baltimore, Maryland. 
+ 
+ATV. (1991). Bemessung von einstufigen Belebungsanlagen ab 5000 Einwohnerwerten. Arbeitsblatt 
+A 131, ATV, St. Augustin, BRD.            
+ 
+Baquerizo, G., Maestre, J.P., Sakuma, T., Deshusses, M.A., Gamisans, X., Gabriel, D. and Lafuente, 
+J.A. (2005). Detailed model of a biofilter for ammonia removal: model parameters analysis and model 
+validation. Chem. Eng. J. 113 (2-3), 205-214. 
+ 
+Batstone, D.J., Hernandez, J.L.A. and Schmidt, J.E. (2005). Hydraulics of laboratory and full-scale 
+upflow anaerobic sludge blanket (UASB) reactors. Biotech. and Bioeng. 91 (3), 387–391. 
+ 
+Batstone, D. J., Keller, J., Angelidaki, I., Kalyuzhnyi, S.V., Pavlostathis, S.V., Rozzi, A., Sanders, 
+W.T.M., Siegrist, H. & Vavilin, V.A. (2002) Anaerobic digestion model no.1. Sci. Tech. Rep. No. 13, 
+IWA Publishing, London. 
+ 
+Benedetti, L., Bixio, D., Claeys, F. and Vanrolleghem, P.A. (2008). Tools to support a model-based 
+methodology for emission/immission and benefit/cost/risk analysis of wastewater systems that 
+considers uncertainties. Environ. Modell. Softw. 23(8), 1082-1091. 
+ 
+Bhatia, B., Nigam, K.D.P., Auban, D. and Hebrard, G. (2004). Effect of a new high porosity packing 
+on hydrodynamics and mass transfer in bubble columns. Chem. Eng. Process. 43 (11), 1371-1380. 
+ 
+Bolle, W.L., van Breugel, J., van Eybergen, G.C., Kossen, N.W.F., van Gils, W. (1986a). An integral 
+dynamic model for the UASB reactor. Biotechnol. Bioeng. 28(11), 1621-1636. 
+ 
+Bolle, W.L., van Breugel, J., van Eybergen, G.C., Kossen, N.W.F., Zoetemeyer, R.J. (1986b). 
+Modeling the liquid flow in up-flow anaerobic sludge blanket reactors. Biotechnol. Bioeng. 28(11), 
+1615-1620. 
+	   	   1	   36	   	   	   	   	  
+REFERENCES 
+ 
+Bollon, J., Le-Hyaric, R., Benbelkacem, H., Buffière, P., (2011). Development of a kinetic model for 
+anaerobic dry digestion processes: Focus on acetate degradation and moisture content. Biochem. Eng. 
+J. 56, 212-218.  
+ 
+Bollon, J., Benbelkacem, H., Gourdon, R., Buffière, P., (2013) Measurement of diffusion coefficients 
+in dry anaerobic digestion media. Chemical Engineering Science, 89, 115-119 
+ 
+Bolzonella, D., Innocenti, L., Pavan, P., Traverso, P., Cecchi, F. (2003). Semi-dry thermophilic 
+anaerobic digestion of the organic fraction of municipal solid waste: focusing on the start-up phase. 
+Bioresour. Technol. 86, 123-129. 
+ 
+Bonnet, B., Dochain, D., Steyer, J.P. (1997). Dynamical modelling of an anaerobic digestion fluidized 
+bed reactor. Water Sci Technol., 36, 285–292 
+ 
+Braha, A. and Hafner, F. (1985). Use of Monod kinetics on multi stage bio reactors. Water Res. 19, 
+1217-1227.  
+ 
+Brown, D., Shi, J., Li, Y. (2012). Comparison of solid-state to liquid anaerobic digestion of 
+lignocellulosic feedstocks for biogas production. Bioresour. Technol. 124, 379–386. 
+ 
+Brown, D. and Yebo, L. (2013). Solid state anaerobic co-digestion of yard waste and food waste for 
+biogas production. Bioresour. Technol. 127, 275-280. 
+ 
+Bryers, J.D. (1985) Structured modelling of the anaerobic digestion of biomass particulates. 
+Biotechnol. Bioeng. 27, 638–649 
+ 
+Buffière, P. (1996). Modeling and experiments on the influence of hydrodynamics on the performance 
+of an anaerobic fluidized bed reactor, Ph.D Thesis, INSA Toulouse No. 410. 
+	   	   1	   37	   	   	   	   	  
+REFERENCES 
+ 
+Buffière, P., Fonade, C. and Moletta, R. (1998a). Liquid mixing and phase hold-ups in gas producing 
+fluidized bed bioreactors. Chem. Eng. Sci. 53 (4), 617-627. 
+ 
+Buffière, P., Fonade, C. and Moletta, R. (1998b). Mixing and phase hold-ups variations due to gas 
+production in anaerobic fluidized-bed digesters: Influence on reactor performance. Biotechnol. 
+Bioeng. 60(1), 36-43. 
+ 
+Buffière, P., Steyer, J., Fonade, C and Moletta, R. (1998c). Modeling and experiments on the 
+influence of biofilm size and mass transfer in a fluidized bed reactor for anaerobic digestion. Water 
+Res., 32(3), 657–668. 
+ 
+Buffière, P., Loisel, D., Bernet, N. & Delgenes, J.P. (2006). Towards new indicators for the prediction 
+of solid waste anaerobic digestion properties. Water Sci. Technol., 53, 233-241 
+ 
+Chang, H.T. and Rittmann, B.E. (1987). Mathematical modeling of biofilm on activated carbon. 
+Environ Sci. Technol. 21(3), 273-280. 
+ 
+Charles, W., Walker, L., & Cord-Ruwisch, R. (2009). Effect of pre-aeration and inoculum on the 
+start-up of batch thermophilic anaerobic digestion of municipal solid waste. Bioresour. Technol., 100, 
+2329-2335. 
+ 
+Costa Reis, L.G and Sant’Anna, G.L. (1985). Aerobic treatment of concentrated wastewater in a 
+submerged bed reactor. Water Res., 19, 1341-1345. 
+ 
+Costello, D.J., Greenfield, P.F., Lee, P.L. (1991a). Dynamic modelling of a single-stage high-rate 
+anaerobic reactor-I. Model Derivation. Water Res. 25, 847-858. 
+ 
+	   	   1	   38	   	   	   	   	  
+REFERENCES 
+Costello, D.J., Greenfield, P.F., Lee, P.L. (1991b). Dynamic modelling of a single-stage high-rate 
+anaerobic reactor-II. Model verification. Water Res., 25, 859-871 
+ 
+Dai, X., Duan, N., Dong, B., Dai, L. (2013). High-solids anaerobic co-digestion of sewage sludge and 
+food waste in comparison with mono digestions: Stability and performance. Waste Manage., 33, 308-
+316. 
+ 
+Danckwerts, PV. (1953) Continuous flow systems, distributions of residence times. Chem. Eng. Sci. 
+2,1-13.                                                                                                                                            
+ 
+Davidson, J. F., Clift, R. and Harrison, D. (1985) Fluidization. Pergamon Press. Oxford. 
+ 
+De Baere, L., Mattheeuws, B., Velghe, F. (2010). State of the art of anaerobic digestion in Europe, In: 
+Twelfth International Congress on Anaerobic Digestion. IWA, Guadalajara, Mexico. 
+ 
+De Clercq, B., Coen, F., Vanderhaegen, B. and Vanrolleghem, P.A. (1999). Calibrating simple models 
+for mixing and flow propagation in wastewater treatment plants. Water. Sci. Technol., 39, 61-69.  
+ 
+Diez-Blanco, R., Garcia-Encina, V., Fernandez-Polanco, P.A., (1995). Effect of biofilm growth, gas 
+and liquid upflow velocities on the expansion of an anaerobic fluidized bed reactor (AFBR). Water 
+Res., 29, 1649–1654. 
+ 
+Díez, L., Zima, B.E., Kowalczyk, W., Delgado, A. (2007). Investigation of multi-phase flow in  
+sequencing batch reactor (SBR) by means of hybrid methods. Chem. Eng. Sci. 62, 1803-1813.  
+ 
+Dong, L., Zhenhong, Y. & Yongming, S. (2010) Semi-dry mesophilic anaerobic digestion of water 
+sorted organic fraction of municipal solid waste (WS-OFMSW). Bioresour. Technol.,101, 2722-2728. 
+ 
+Edelmann, W. (2003) Biomethanization of the Organic Fraction of Municipal Solid Wastes. In: Mata-
+Alvarez, J. (Ed.). IWA Publishing, London, 265–301. 
+	   	   1	   39	   	   	   	   	  
+REFERENCES 
+ 
+Elefsiniotis, P., Wareham, D., Smith, M. (2004). Use of volatile fatty acids from an acid-phase 
+digester for denitrification. J. of Biotechnol., 114, 289-297 
+ 
+Escudié, T., Conte, J.P., Steyer, J.P., Delgenès. (2005). Hydrodynamic and biokinetic models of an 
+anaerobic fixed-bed reactor. Proc. Bioch. 40, 2311-2323. 
+ 
+Esposito, G., Frunzo, L., Panico, A, d’Antonio, G. (2008). Mathematical modelling of disintegration – 
+limited co-digestion of OFMSW and sewage sludge. Water Sci. Technol. 58, 1513–1519. 
+ 
+Esposito, G., Frunzo, L., Panico, A., Pirozzi, F. (2011a). Modelling the effect of the OLR and OFMSW 
+particle size on the performances of an anaerobic co-digestion reactor. Process Biochem. 46, 557–565. 
+ 
+Esposito, G., Frunzo, L., Panico, A., Pirozzi F. (2011b). Model calibration and validation for OFMSW 
+and sewage sludge co-digestion reactors. Waste Manage. 31, 2527–2535. 
+ 
+Esposito, G., Frunzo, L., Liotta F., Panico, A., Pirozzi, F. (2012a). Bio-methane potential tests to 
+measure the biogas production from the digestion and co-digestion of complex organic substrates. 
+Open Environ. Engine J. 5, 1–8. 
+ 
+Esposito, G., Frunzo, L., Giordano, A., Liotta, F., Panico, A., Pirozzi, F. (2012b). Anaerobic co-
+digestion of organic wastes. Rev. Environ. Sci. Biotechnol. 11, 325–341. 
+ 
+Esposito, G., Frunzo, L., Panico, A., Pirozzi, F. (2012c). Enhanced bio-methane production from co-
+digestion of different organic wastes. Env. Technol., 33, 2733-2740 
+ 
+Eckenfelder, W.W., Goronszy, M.C. and Watkin, A.T. (1985). Comprehensive Activated Sludge 
+Design. Developments in Environmental Modeling No. 7 Mathematical Models in Biological Waste 
+Water Treatment, S.E. Jorgensen and M.J. Gromiec, eds. Amsterdam, 95-132.    
+ 
+	   	   1	   40	   	   	   	   	  
+REFERENCES 
+El-Temtamy, S.A., El-Sharnoub, Y.D. and El Halwagi, M.M. (1979a). Liquid dispersion in gas-liquid 
+fluidized beds: Part I: Axial and radial dispersion. The dispersed plug-flow model. Chem. Eng. J. 18, 
+161-168. 
+ 
+El-Temtamy, S.A., El-Sharnoub, Y.D. and El Halwagi, M.M. (1979b). Liquid dispersion in gas-liquid 
+fluidized beds: Part II: Axial dispersion. The axially dispersed plug-flow model. Chem. Eng.  
+J. 18, 151-159. 
+ 
+Esposito, G., Fabbricino, M., & Pirozzi, F. (2003). Four-substrate design model for single sludge 
+predenitrification system. J. of Env. Eng., 129, 394-401. 
+ 
+Fall, C. and Loaiza-Navia, J.L. (2007). Design of a tracer test experience and dynamic calibration of 
+the hydraulic model for a full-scale wastewater treatment plant by use of AQUASIM. Water. Env. 
+Res., 79, 893-900 
+ 
+Fan, L.S., Kigie, K., Long, T.R. and Tang, W.T. (1987). Characteristics of a draft-tube gas-liquid 
+solid fluidized bed reactor for phenol-degradation. Biotechnol. Bioeng. 30, 498-504. 
+ 
+Fernández, J., Perez, M., Romero, L. (2008). Effect of substrate concentration on dry mesophilic 
+anaerobic digestion of organic fraction of municipal solid waste (OFMSW). Bioresour. Technol. 99, 
+6075–6080. 
+ 
+Fernández, J., Pérez, M., Romero, L.I. (2010). Kinetics of mesophilic anaerobic digestion of the 
+organic fraction of municipal solid waste: Influence of initial total solid concentration. Bioresour. 
+Technol., 101, 6322–6328. 
+ 
+Fdez-Güelfo, L. A., Álvarez-Gallego, C., Sales, D. and Romero García, L.I. (2012). Dry-thermophilic 
+anaerobic digestion of organic fraction of municipal solid waste: Methane production modeling. Waste 
+Manage. 32, 382-388. 
+ 
+Fdz-Polanco, F., Garcìa, P. and Santiago, V. (1994). Influence of Design and Operation Parameters on 
+the Flow Pattern of Submerged Filters. J. Chem. Technol. Biot. 61, 153-158. 
+	   	   1	   41	   	   	   	   	  
+REFERENCES 
+Forster-Carneiro, T., Pérez, M., Romero, L.I. and Sales, D. (2007). Dry-thermophilic anaerobic 
+digestion of organic fraction of the municipal solid waste: focusing on the inoculum sources. Bioresour. 
+Technol. 98, 3195–3203. 
+ 
+Forster-Carneiro, T., Pérez, M., Romero, L. (2008). Influence of total solid and inoculum contents on 
+performance of anaerobic reactors treating food waste. Bioresour. Technol. 99, 6994–7002. 
+ 
+Froment, G.F., Bischoff, K.B. (1990). Chemical Reactor Analysis and Design, 2nd ed. John Wiley & 
+Sons, New York. 
+ 
+Gavrilescu, M. (2002). Engineering concerns and new developments in anaerobic waste-water treatment. 
+Clean. Technol. Envir. 3, 346-362. 
+ 
+Gerardi, M.H. (2003). The Microbiology of Anaerobic Digesters. Wiley, John & Sons, New York. 
+ 
+Ghosh, S. (1985). Solid-phase methane fermentation of solid waste. J. of Ener. Res. Technol., 107, 
+402-405. 
+ 
+Glover, G.C., Printemps, C., Essemiani, K. and Meinhold, J. (2006). Modelling of wastewater 
+treatment plants - How far shall we go with sophisticated modelling tools? Water Sci. Technol. 53, 
+79-89. 
+ 
+Graef, S.P. and Andrews, J.F. (1974). Stability and control of anaerobic digestion. J. of Water Poll. 
+Cont. Fed., 666-683. 
+ 
+Gray, N.F., Learner, MA. (1984). Comparative pilot scale investigation into upgrading the 
+performance of percolating filters by partial medium replacement. Water Res., 18, 409-422. 
+ 
+Guendouz, J., Buffière, P., Cacho, J., Carrere, M., Delgenes, J.P. (2010). Dry anaerobic digestion in 
+	   	   1	   42	   	   	   	   	  
+REFERENCES 
+batch mode: design and operation of a laboratory-scale, completely mixed reactor. Waste Manag. 30, 
+1768–1771. 
+ 
+Gustavsson, J., Cederberg, C., Sonesson, U., van Otterdijk, R., Meybeck, A. (2011). Global food 
+losses and food waste. Rome: Food and Agriculture Organization of the United Nations (FAO). 
+ 
+Hanaki, K., Hirunmasuwan, S., & Matsuo, T. (1994). Selective use of microorganisms in anaerobic 
+treatment processes by application of immobilization. Water Res. 28, 993-996. 
+ 
+Henze, M., Grady, C. P.L., Gujer, W., Marais, G.V.R., Matsuo, T. (1987). Activated Sludge Model 
+No. 1. Scientific and Technical Report No. 1, IAWQ, London. 
+ 
+Heertjes, P.M. and Van Der Meer, R.R. (1978). Dynamics of liquid flow in an up-flow reactor-used 
+for anaerobic treatment of wastewater. Biotechnol. Bioeng., 20, 1577-1594. 
+ 
+Heertjes, P.M., Kujivenhoven, L.I and van der Meer, R.R. (1982). Fluid flow pattern in upflow 
+reactors for anaerobic treatment of beet sugar factory wastewater. Biotechnol. Bioeng., 24, 443-459. 
+ 
+Hill, D.T. (1982). A comprehensive dynamic model for animal waste methanogenesis. Trans. ASAE 
+25, 1374–1380 
+ 
+Hills, D.J. and Nakano, K. (1984). Effects of particle size on anaerobic digestion of tomato solid 
+wastes. Agricul. Wastes, 10, 285–295 
+ 
+ Hills, D. J. and Roberts, D.W. (1981). Anaerobic digestion of dairy manure and field crop residues. 
+ Agri. Wastes, 3, 179-89. 
+ 
+	   	   1	   43	   	   	   	   	  
+REFERENCES 
+Hirata, A., Hosaka, Y. and Umezawa, H. (1986). Biological treatment of water and wastewater in 
+three-phase fluidized bed. Proc. of the Third World Congress in Chemical Engineering, vol. III, 
+Tokyo, 3, 556.  
+ 
+Huang, J-S. and Jih, C-G. (1997). Deep-biofilm kinetics of substrate utilization in anaerobic filters. 
+Wat. Res. 31, 2309-2317. 
+Huang, W., Wu, C., Xia, B. and Xia, W. (2005). Computational Fluid Dynamic Approach for 
+Biological System Modeling. arXiv:q-bio/0508006v1 [q-bio.QM].  
+ 
+Jacob, J., Pingaud, H., Le Lann, J.M., Bourrel, S., Babary, J.P. and Capdeville, B. (1996). Dynamic 
+simulation of bioﬁlters. Simulat. Pract. Theory. 4, 335-348. 
+ 
+ Janssen, P.H.M. and Heuberger, P.S.C. (1995). Calibration of process-oriented models. Ecol. Model.  
+83, 55–66. 
+ 
+ Jha, A. K., Li, J., Nies, L. and Zhang, L. (2013). Research advances in dry anaerobic digestion process  
+of solid organic wastes. Afr. J. Biotechnol., 10, 14242-14253. 
+ 
+Jeris J.S. (1977). Biological fluidized bed for BOD and nitrogen removal. J. Water Pollut. Control 
+Fed. 49, 816-831. 
+ 
+Jin, B., Wilén, B. M. and Lant, P., (2004). Impacts of morphological, physical and chemical properties 
+of sludge flocs on dewaterability of activated sludge. Chem. Eng. J., 98, 115-126. 
+ 
+Kalyuzhnyi, S., Federovich, V., Lens, P., Pol, H. and Lettinga, G. (1998). Mathematical modelling as 
+a tool to study population dynamics between sulfate reducing and methanogenic bacteria. 
+Biodegradation. 9, 187-199. 
+ 
+	   	   1	   44	   	   	   	   	  
+REFERENCES 
+Kalyuzhnyi, S., Federovich, V. (1997). Integrated Mathematical Model of UASB Reactor for 
+Competition between sulphate reduction and methanogenesis. Wat. Sci. Tech., 36, 201-208. 
+ 
+Kalyuzhnyi, S., Vyacheslav, V., Federovich, V. and Lens, P. (2006). Dispersed plug flow model for 
+upflow anaerobic sludge bed reactors with focus on granular sludge dynamics. J. Ind. Microbiol. Biot. 
+33, 221-237. 
+ 
+Karthikeyan, O.P. and Visvanathan, C., (2012). Bio-energy recovery from high-solid organic 
+substrates by dry anaerobic bio-conversion processes: a review. Rev. Env. Sci. Biotechnol., 12, 257-
+284. 
+ 
+Keshtkar, A., Meyssami, B., Abolhamd, G., Ghaforian, H., Khalagi Asadi, M. (2003). Mathematical 
+modeling of non-ideal mixing continuous flow reactors for anaerobic digestion of cattle manure. 
+Bioresour. Technol. 87, 113-124. 
+ 
+Khudenko, B.M. and Shpirt, E. (1986). Hydrodynamic parameters of diffused air systems. Water Res. 
+20, 905-915.  
+ 
+Kim, S.D. and Kang, Y. (1997). Heat and Mass transfer in three-phase fluidized bed reactors-an  
+overview. Chem. Eng. Sci. 52, 3639-3660.  
+ 
+Kim, D.-H. and Oh, S.E., (2011). Continuous high-solids anaerobic co-digestion of organic solid 
+wastes under mesophilic conditions. Waste Manage., 31, 1943-1948. 
+ 
+King, R.O. and Forster, C.F. (1990). Effects of sonication on activated sludge. Enzyme Microb. Tech. 
+12, 109-115. 
+ 
+Kshirsagar, S.R., Phadke, N.S. and Tipnis, S.S. (1972). Detention time studies in trickling ﬁlter. 
+Indian J. Environ. Hlth. 14, 95-104. 
+	   	   1	   45	   	   	   	   	  
+REFERENCES 
+Kyoto, P., (1997). United Nations framework convention on climate change. Kyoto Protocol, Kyoto. 
+ 
+Iliuta, I. and Larachi, F. (2005). Modeling simultaneous biological clogging and physical plugging in 
+trickle-bed bioreactors for wastewater treatment. Chem. Eng. Sci. 60, 1477-1489. 
+ 
+Lamb, R. and Owen, S.G.H. (1970). A suggested formula for the process of biological filtration. 
+Water Pollut. Control., 69, 209-220. 
+ 
+Launder B.E. and Spalding, B.P. (1974). The numerical computation of turbulent flows. Comput. 
+Method Appl. M. 3, 269-289. 
+ 
+Lawrence, A.W. and McCarty, P.L. (1970). Unified basis for biological treatment design and 
+operation.  J. San. Eng., 96, 757-778.  
+ 
+Lay, JJ., Li YY. & Noike, T. (1997a) Influences of pH and moisture content on the methane 
+production in high-solids sludge digestion. Water Res., 31, 1518–1524 
+ 
+Lay, JJ., Li, YY., Noike, T., Endo, J. and Ishimoto, S. (1997b) Analysis of environmental factors 
+affecting methane production from high-solids organic waste. Water Sci. Technol., 36, 493-500. 
+ 
+Lay JJ., Li YY., Noike, T. (1998) Developments of bacterial population and methanogenic activity in 
+a laboratory-scale landfill bioreactor. Water Res. 32, 3673–3679 
+ 
+Lee, T.T., Wang, F. Y., Newell, R.B. (1999a). Dynamic modelling and simulation of activated sludge 
+process using orthogonal collocation approach. Water Res. 33, 73-86. 
+ 
+Lee, T.T., Wang, F.Y., Newell, R.B. (1999b). Dynamic simulation of bioreactor systems using  
+orthogonal collocation on finite elements. Comp. Chem. Eng., 23, 1247-1262. 
+ 
+Le Hyaric, R., Chardin, C., Benbelkacem, H., Bollon, J., Bayard, R., Escudié, R. and Buffière, P. 
+	   	   1	   46	   	   	   	   	  
+REFERENCES 
+(2011). Influence of substrate concentration and moisture content on the specific methanogenic 
+activity of dry mesophilic municipal solid waste digestate spiked with propionate. Bioresour. Technol. 
+102, 822–827. 
+ 
+Le Hyaric, R., Benbelkacem, H., Bollon, J., Bayard, R., Escudiè, R. and Buffière, P. (2012). Influence 
+of moisture content on the specific methanogenic activity of dry mesophilic municipal solid waste 
+digestate. J. of Chem. Techn. Biotechnol., 87, 1032-1035. 
+ 
+Le Moullec, Y., Potier O., Gentric, C. and Leclerc, J.P. (2008). Flow field and residence time 
+distribution simulation of a cross-flow gas–liquid wastewater treatment reactor using CFD. Chem. 
+Eng. Sci., 63, 2436-2449. 
+ 
+Le Moullec, Y., Gentric, C., Potier, O. and Leclerc, J.P. (2010a). CFD simulation of the 
+hydrodynamics and reactions in an activated sludge channel reactor of wastewater treatment. Chem. 
+Eng. Sci., 65, 492-498. 
+ 
+Le Moullec, Y., Gentric, C., Potier, O., Leclerc, J.P. (2010b). Comparison of systemic, compartmental 
+and CFD modelling approaches: application to the simulation of a biological reactor of wastewater 
+treatment. Chem. Eng. Sci., 65, 343-350. 
+ 
+Le Moullec, Y., Potier, O., Gentric, C., & Leclerc, J. P. (2011). Activated sludge pilot plant: 
+Comparison between experimental and predicted concentration profiles using three different 
+modelling approaches. Water Res., 45, 3085-3097.  
+ 
+Levin, M.A. and Gealt M.A. (1993). Overview of biotreatment practices and promises. Levin M.A. 
+and Gealt M.A, eds. Biotreatment of industrial and hazardous waste. McGraw-Hill, Philadelphia (PA), 
+71-72. 
+ 
+Li, Y., Park, S.Y., Zhu, J. (2011). Solid-state anaerobic digestion for methane production from organic 
+waste. Renew. Sust. Energ. Rev., 15, 821-826. 
+	   	   1	   47	   	   	   	   	  
+REFERENCES 
+ Liotta, F., d’Antonio, G., Esposito, G., Fabbricino, M., Frunzo, L., van Hullebusch, E. D., Lens, 
+N.L. and Pirozzi, F. (2014). Effect of moisture on disintegration kinetics during anaerobic 
+digestion of complex organic substrates. Waste Manage. Res. 32, 40-48. 
+Lianhua, L., Dong, L., Yongming, S., Longlong, M., Zhenhong, Y., Xiaoying, K. (2010). Effect of 
+temperature and solid concentration on anaerobic digestion of rice straw in South China. Int. J. 
+Hydrogen. Energ., 35, 7261-7266. 
+ 
+Lin S.H. (1991). A mathematical model for a biological fluidized bed reactor. J. Chem. Technol. 
+Biot., 51, 473-482.  
+ 
+Lissens, G., Vandevivere, P., De Baere, L., Biey, E., Verstraete, W. (2001). Solid waste digestors: 
+process performance and practice for municipal solid waste digestion. Water Sci. Technol., 44, 91-102 
+ 
+Lovett, D.A., Travers S.M. and Davey K.R. (1984). Activated sludge treatment of abattoir 
+wastewater-I: Influence of sludge age and feeding pattern. Water Res., 18, 429-434. 
+ 
+ Lü, F., Hao, L., Zhu, M., Shao, L., He, P. (2012). Initiating methanogenesis of vegetable waste at low 
+inoculum-to-substrate ratio: importance of spatial separation. Bioresour. Technol. 105, 169–173. 
+ 
+Makinia, J. and Wells, SA. (1999). Improvements in modeling dissolved oxygen in activated sludge 
+systems. Proc. of the 8th IAWQ Conference on Design, Operation and Economics of Large 
+Wastewater Treatment Plants, Budapest, 518-525.                    
+ 
+Makinia, J. and Wells, S.A. (2000a). A general model of the activated sludge reactor with dispersive 
+flow-I. model development and parameter estimation. Water. Res., 34, 3987-3996. 
+ 
+Makinia, J. and Wells, S.A. (2000b). A general model of the activated sludge reactor with dispersive 
+flow-II. Model verification and application. Water Res., 34, 3997-4006. 
+ 
+Makinia, J. and Wells, S.A. (2005). Evaluation of empirical formulae for estimation of the 
+longitudinal dispersion in activated sludge reactors. Water Res., 39, 1533-1542. 
+	   	   1	   48	   	   	   	   	  
+REFERENCES 
+ 
+Mann, A.T., Stephenson, T. (1997). Modeling biological Aerated Filters for Wastewater Treatment. 
+Water Res., 31, 2443-2448. 
+ 
+Martin AD. (2000). Interpretation of residence time distribution data. Chem. Eng. Sci., 55, 5907-5917. 
+ 
+Martinov, M., Hadjiev, D. and Vlaev, S.D. (2010). Liquid flow residence time in a fibrous fixed bed 
+reactor with recycle. Bioresour. Technol., 101, 1300-1304. 
+ 
+Mata-Alvarez J., Mace, S. and Llabres, P. (2000). Anaerobic digestion of organic solid wastes. An 
+overview of research achievements and perspectives. Bioresour. Technol. 74, 3–16. 
+ 
+Mendoza R.B. and Sharratt, P.N. (1998). Modelling the effects of imperfect mixing on the performance 
+of anaerobic reactors for sewage sludge treatment. J. Chem. Tech. and Biotech. 71, 121–130. 
+ 
+Mendoza R.B. and Sharratt, P.N. (1999). Analysis of retention time distribution (RTD) curves in an 
+anaerobic digester with confined-gas mixing using a compartment model. Wat. Sci. Techn. 40, 49-56. 
+ 
+Meunier, A.D. and Williamson, K.J. (1981). Packed bed reactors: simplified model. J. Environ. Eng., 
+107, 303-317. 
+ 
+Mezaoui, A. (1979). Etude de l'épuration biologique sur lits bactériens à remplissage plastique. Ph.D. 
+thesis, University of Montpellier, Montpellier, France. 
+ 
+Michelsen, M.L. and Østergaard K. (1970). Hold-up and fluid mixing in gas-liquid fluidised beds. 
+Chem. Eng. J., 1, 37-46. 
+                                                                                                                                 
+Milbury, W.F., Pipes, W.O. and Grieves, R.B. (1965). Compartmentalization of aeration tanks. J. San. 
+Eng., 91 (SA3), 45-61. 
+ 
+Moletta, R., Verrier, D. and Albagnac, G. (1986). Dynamic modelling of anaerobic digestion. Water 
+Res. 20, 427–434. 
+	   	   1	   49	   	   	   	   	  
+REFERENCES 
+  
+ Monteith, H. D. and Stephenson, J.P. (1981). Mixing efficiencies in full-scale anaerobic digesters by 
+ tracer methods. J. WPCF. 53, 78-84. 
+ 
+Mora-Naranjo N., Meima J.A., Haarstrick A. & Hempel DC. (2004). Modelling and experimental 
+investigation of environmental influences on the acetate and methane formation in solid waste. Waste 
+Manage., 24, 763–773. 
+ 
+Motte, J. C., Escudié, R., Bernet, N., Delgenes, J. P., Steyer, J. P., Dumas, C. (2013). Dynamic effect 
+of total solid content, low substrate/inoculum ratio and particle size on solid-state anaerobic digestion. 
+Bioresour. Technol., 144, 141-148. 
+ 
+Mulcahy, L.T. and La Motta, E.J. (1978). Mathematical model of the fluidized bed biofilm reactor. 
+Proc. of 51st Annual Conference, Water Pollution Control Federation, Anaheim, CA; 
+ 
+Mulcahy, L.T., Shieh W.K., LaMotta, E.J. (1980). Kinetic model of biological denitrification in a 
+fluidized bed biofilm reactor (FBBR). Progr. Water. Technol., 12, 143-157.  
+ 
+Mulcahy, L.T., Shieh, W.K. and LaMotta, E.J. (1981). Simplified Mathematic Models for a Fluidized-
+Bed Biofilm Reactor. AIChE Symp. Boston, Portland; Chicago, 273-285.  
+ 
+Muroyama, K. and Fan, L.S. (1985). Fundamentals of gas–liquid–solid fluidization. AIChE Journal., 
+31, 1-34. 
+ 
+Muslu, Y. (1984). Dispersion in granular media trickling filters. J. Environ. Eng. ASCE, 110, 961-
+976.  
+ 
+Muslu, Y. (1986). Distribution of retention times in model biological filters containing packed 
+spheres. Water Res., 20, 259-265. 
+ 
+Muslu, Y. (1990). Use of dispersed flow models in design of biofilm reactors. Water Air Soil Poll., 
+53, 297-314. 
+	   	   1	   50	   	   	   	   	  
+REFERENCES 
+Muslu, Y. and San, A.H. (1990). Mixing characteristics of suspended growth systems. Part 1. The 
+mathematical model. J. Disper. Sci. Technol., 11, 363-378. 
+ 
+Muslu, Y. (2000a). Numerical approach to plug-flow activated sludge reactor kinetics. Comput. Biol. 
+Med., 30, 207-223.    
+ 
+Muslu, Y. (2000b). Application of Monod kinetics on cascade reactors-in series. J. Chem. Technol. 
+Biot., 75, 1151-1159. 
+ 
+Mussoline, W. (2013). Enhanced Methane Production from Pilot-Scale Anaerobic Digester Loaded 
+with Rice Straw. Open Env. Eng. J., 6, 32-39 
+ 
+Mussoline, W., Esposito, G., Lens, P., Garuti, G., Giordano, A. (2012). Design considerations for a 
+farm-scale biogas plant based on pilot-scale anaerobic digesters loaded with rice straw and piggery 
+wastewater. Biomass. Bioenerg., 46, 469-478 
+ 
+Nogita, S., Saito, Y. and Kuge, T. (1983). A new indicator of the activated sludge process: Nitrous 
+oxide. Water Sci. Technol., 13, 199-204. 
+ 
+Nyadziehe, K.T. (1980). Réacteur biologique à ruissellement sur garnissage plastique. Ph.D. thesis, 
+University of Montpellier, Montpellier, France. 
+ 
+Oleszkiewicz, J.A. (1981). Aerobic and anaerobic biofiltration of agricultural effluents. Agric. 
+Wastes., 3, 285-296.  
+ 
+Olivet, D., Valls, J., Gordillo, M., Freixo, A. and Sanchez, A. (2005). Application of residence time 
+distribution technique to the study of the hydrodynamic behaviour of a full‐scale wastewater treatment 
+plant plug‐flow bioreactor. J. Chem. Technol. and Biotech., 80, 425-432. 
+ 
+Olsson, G. and Andrews, J.F. (1978). The dissolved oxygen profile-A valuable tool for control of the 
+activated sludge process. Water Res., 12, 985-1004. 
+	   	   1	   51	   	   	   	   	  
+REFERENCES 
+ 
+Ojha, C., Singh, R. (2002). Flow distribution Parameters in Relation to Flow Resistance in an UpFlow 
+Anaerobic Reactor System. J. Environ. Eng., 128, 196-200. 
+ 
+Otton, V., Hihn, J.Y., Béteau, J.F., Delpech, F. and Chéruy, A. (2000). Axial dispersion of liquid in 
+fluidised bed with external recycling: two dynamic modelling approaches with a view to control. 
+Biochem. Eng. J., 4, 129-136. 
+ 
+Park, Y., Davis, M.E. and Wallis, D.A. (1984). Analysis of a Continuous, Aerobic Fixed-Film 
+Bioreactor. I. Steady-State Behavior. Biotechnol. Bioeng., 26, 457-467. 
+ 
+Pavlostathis, S.G. and Giraldo‐Gomez, E. (1991). Kinetics of anaerobic treatment: a critical review. 
+Crit. Rev. Env. Technol., 21, 411-490 
+ 
+Peña, M.R. (2002). Advanced primary treatment of domestic waste-water in tropical countries: 
+development of high-rate anaerobic ponds. Ph.D. Thesis, University of Leeds, Leeds, England. 
+ 
+Peña, M.R., Mara, D.D. and Avella, G.P. (2006). Dispersion and treatment performance analysis of an 
+UASB reactor under different hydraulic loading rates. Water Res., 40, 445-452. 
+ 
+Pérez, J., Poughon, L., Dussap, C. G., Montesinos, J. L. and Gòdia, F. (2005). Dynamics and steady 
+state operation of a nitrifying fixed bed biofilm reactor: mathematical model based description. Pro. 
+Biochem., 40, 2359-2369. 
+ 
+Piché, S., Larachi, F., Iliuta, I. and Grandjean, B.P.A. (2002). Improving predictions of liquid back-
+mixing in trickle-bed reactors using a neural network approach. J. Chem. Tech. Biotech., 77, 989-998. 
+ 
+	   	   1	   52	   	   	   	   	  
+REFERENCES 
+Pinho, F.T. and Whitelaw, J.H. (1990). Flow of non-Newtonian fluids in a pipe. J. Non-Newtonian 
+Fluid Mech. 34, 129–144. 
+ 
+Pohl, M., Heeg, K., Mumme, J. (2013). Anaerobic digestion of wheat straw–Performance of 
+continuous solid-state digestion. Bioresour. Technol. 146, 408-415. 
+ 
+Pommier, S., Chenu, D., Quintard, M. and Lefebvre, X. (2007). A logistic model for the prediction of 
+the influence of water on the solid waste methanization in landfills. Biotechnol. Bioeng., 97, 473-482. 
+ 
+Potier, O., Leclerc, J.P. and Pons, M.N. (2005). Influence of geometrical and operational parameters 
+on the axial dispersion in an aerated channel reactor. Water Res., 39, 4454-4462. 
+ 
+Qu, X., Vavilin, V. A., Mazéas, L., Lemunier, M., Duquennoi, C., He, P. J. and Bouchez, T. (2009). 
+Anaerobic biodegradation of cellulosic material: Batch experiments and modelling based on isotopic 
+data and focusing on aceticlastic and non-aceticlastic methanogenesis. Waste Manage., 29, 1828-
+1837. 
+ 
+Ramin, E., Sin, G., Mikkelsen, P. S. and Plósz, B. (2011). Significance of uncertainties derived from 
+settling tank model structure and parameters on predicting WWTP performance-A global sensitivity 
+analysis study. 8th IWA Symposium on Systems Analysis and Integrated Assessment. Watermax, 476-
+483. 
+ 
+Ratkovich, N., Horn, W., Helmus, F.P., Rosenberger, S., Naessens, W., Nopens, I., Bentzen, T.R. 
+(2013). Activated sludge rheology: A critical review on data collection and modelling. Water Res., 42, 
+463-482. 
+ 
+Reith, J.H., Wijffels, R.H., Barten, H. (2003). Bio-methane and Bio-hydrogen: Status and Perspectives 
+of Biological Methane and Hydrogen Production. Dutch Biological Hydrogen Foundation, Petten, 
+Netherlands. 
+	   	   1	   53	   	   	   	   	  
+REFERENCES 
+Rigopoulos, S. and Jones, A. (2003). A hybrid CFD–reaction-engineering framework for multiphase 
+reactor modeling: basic concept and application to bubble column reactors. Chem. Eng. Sci., 58, 
+3077-3089. 
+ 
+Rittmann, B.E. (1982). Comparative Performance of Biofilm Reactor. Biotechnol. Bioeng., 24, 1341-
+1370.  
+ 
+Ren, T.T, Mu, Y.H., Harada B.J., Yu H.Q. (2009). Hydrodynamics of upflow anaerobic sludge 
+blanket reactors. Aiche J., 55, 516-528. 
+ 
+Reichert, P. (1998).  User manual of AQUASIM 2.0 for the identification and simulation of aquatic 
+systems, Swiss Federal Institute for Environmental Science and Technology, Dübendorf, Switzerland. 
+ 
+Sambusiti, C. (2013). Physical, chemical and biological pretreatments to enhance biogas production 
+from lignocellulosic substrates. PhD thesis, Politecnico di Milano, Milano, Italy.  
+ 
+San, H.A. (1989). A kinetic model for ideal plug-flow reactors. Water Res., 23, 647-654. 
+ 
+San, H.A. (1992). Mechanism of biological treatment in plug flow or batch systems. J. Env. Eng. 
+Proc., 118, 614-628. 
+ 
+San, H.A. (1994). Impact of dispersion and reaction kinetics on performance of biological reactors 
+solution by ‘‘S’’ series. Water Res., 28, 1639-1651.   
+ 
+Sánchez, O., Michaud, S., Escudié, R., Delgenès, J. P., & Bernet, N. (2005). Liquid mixing and gas–
+liquid mass transfer in a three-phase inverse turbulent bed reactor. Chem. Eng. J., 114, 1-7. 
+ 
+Sanders, W.T.M., Geerink M., Zeeman G. & Lettinga G. (2000). Anaerobic hydrolysis kinetics of 
+particulate substrates. Water Sci. Technol., 41, 17-24. 
+ 
+	   	   1	   54	   	   	   	   	  
+REFERENCES 
+Sant’Anna, J.R. (1980). Contribution à l'étude de l'hydrodynamique des réacteurs biologiques utilisés 
+en traitement des eaux usées. Ph.D. thesis, INSA Toulouse, Toulouse, France. 
+ 
+Saravanan, V. and Sreekrishnan, T.R. (2006). Modelling anaerobic biofilm reactors-a review. J. 
+Environ. Man., 81, 1-18. 
+ 
+Särner E. (1978). Plastic-packed trickling filters, Bulletin Series Va, No. 21. Lund Institute of 
+Technology, University of Lund, Lund, Sweden.  
+ 
+Schwarz, A., Yahyavi, B., Mosche, M., Burkhardt, C., Jordening, H-J, Buchholz, K., Reuss, M. 
+(1996). Mathematical modelling for supporting scale up of anaerobic wastewater treatment in a 
+fluidized bed reactor. Water. Sci. Technol. 34, 501-508. 
+ 
+Schwarz, A., Yahyavi, B., Mosche, M., Burkhardt, C., Jordening, H-J, Buchholz, K., Reuss, M. (1997). 
+Mathematical modelling and simulation of an industrial scale fluidized bed reactor for anaerobic 
+wastewater treatment-scale-up effect on pH-gradients. Water Sci. Technol. 36, 219-227. 
+ 
+Séguret, F. and Racault, Y. (1998). Hydrodynamic behaviour of full-scale submerged bioﬁlter and its 
+possible influence on performances. Wat. Sci. Tech., 38, 249-256.  
+ 
+Séguret, F., Racault, Y. and Sardin, M. (2000). Hydrodynamic behavior of full-scale trickling ﬁlters. 
+Water Res., 34, 1551-1558.  
+ 
+Seok, J. and Komisar, S. (2003). Integrated Modeling of Anaerobic Fluidized Bed Bioreactor for  
+Deicing Waste Treatment. I.: Model Derivation. J. Environ. Eng. 129,100-109.  
+ 
+Service B.I., Preparatory Study on Food Waste across E.U.-27 for the European Commission, 2010, p. 
+14, http://ec.europa.eu/environment/eussd/pdf/bio_foodwaste_report.pdf, accessed 6 July 2012. 
+ 
+Sharma, S.K., Mishra, I.M., Sharma, M.P. and Saini, J.S. (1988). Effect of particle size on biogas 
+	   	   1	   55	   	   	   	   	  
+REFERENCES 
+generation from biomass residues. Biomass. 17, 251–263. 
+ 
+Shi, L.J., Huang, M., Zhang, W.Y. and Liu, H.F. (2013). Effect of Dry Matter Concentration on Dry 
+Anaerobic Digestion of Animal Manure and Straw. Appl. Mech. and Mat., 253, 897-902. 
+ 
+Shi, J., Xu, F., Wang, Z., Stiverson, J. A., Yu, Z. and Li, Y. (2014). Effects of microbial and 
+non-microbial factors of liquid anaerobic digestion effluent as inoculum for solid-state anaerobic 
+digestion of corn stover. Bioresour. Technol. 157, 188-196. 
+ 
+Shieh, W., Mulcahy, L.T. and LaMotta, E.J. (1982). Mathematical model for the fluidized bed  
+biofilm reactor. Enzyme Microb. Tech., 4, 269-276.   
+ 
+Siegrist, H., Renggli, D. and Gujer, W. (1993). Mathematical modelling of anaerobic mesophilic 
+sewage sludge treatment. Water Sci. Technol. 27, 25–36. 
+ 
+Singh, K., Viraraghavan, T., Bhattacharyya, D. (2006). Sludge Blanket Height and Flow Pattern in 
+UASB Reactor: Temperature effects. J. Environ. Eng. 132, 895-900.  
+ 
+Singhal, A., Gomes, J., Praveen, V.V., Ramachandran, K.B. (1998). Axial Dispersion Model for 
+Upflow Anaerobic Sludge Blanket Reactors. Biotechnol. Prog. 14, 645-648. 
+ 
+Smith, J.M. (1981). Chemical Engineering Kinetics, 3rd ed., McGraw Hill Inc., New York.  
+ 
+Smith, L.C., Elliot, D.J., James, A. (1993). Characterisation of mixing patterns in an anaerobic 
+digester by means of tracer curve analysis. Ecol. Model. 69, 267-285.  
+ 
+Smith, L.C., Elliot, D.J., James, A. (1996). Mixing in upflow anaerobic filters and its influence on 
+performance and scale-up. Water Res. 30, 3061-3073. 
+	   	   1	   56	   	   	   	   	  
+REFERENCES 
+ 
+Smith, P.H., Bordeaux, F. M., Goto, M., Shiralipour, A., Wilkie, A., Andrews, J.F., Ide, S.M. and 
+Barnett, W. (1988). Biological production of methane from biomass. In Methane From Biomass: A 
+Systems Approach, 291-255. Elsevier Applied Science, London.  
+ 
+Tariq M.N. (1975). Retention time in trickling filters. Progr. Water. Technol., 7, 225-234. 
+ 
+Tartakovsky, B., Mu, S.J., Zeng, Y., Lou, S.J., Guiot, S.R. and Wu, P. (2008). Anaerobic digestion 
+model No.1 –based distributed parameter model of an anaerobic reactor: II. Model validation. 
+Bioresour. Technol. 99, 3676-3684.  
+ 
+Tay, J.H., Show, K.Y. and Jeyaseelan, S. (1996). Effects of media characteristics on the performance 
+of upflow anaerobic packed-bed reactors. J. Envir. Engrg. Div., ASCE. 122, 469-476. 
+ 
+Tay, J.H. and Show, K.Y. (1998). Media-Induced Hydraulic Behavior and Performance of Upflow 
+Biofilters. J. Envir. Engrg. Div. ASCE. 124, 720-729. 
+ 
+Tchobanoglous, G., Burton F.L., Stensel, H.D. 2003. Wastewater Engineering Treatment and Reuse, 
+4th Edn. Metcalf and Eddy. Inc. McGraw-Hill Company. 
+ 
+Teefy, S. (1996). Tracer studies in water treatment facilities: A protocol and case studies. AWWA 
+Research Foundation and American Water Works Association, Denver, CO. 
+ 
+Terashima, M., Goel, R., Komatsu, K., Yasui, H., Takahashi, H., Li, Y.Y. and Noike, T. (2009). CFD 
+simulation of mixing in anaerobic digesters. Bioresour. Technol., 100, 2228-2233. 
+ 
+Trinet, F., Heim, R., Amar, D., Chang, H.T. and Rittmann, B.E. (1991). Study of biofilm and 
+fluidization of bioparticles in a three-phase fluidized-bed reactor. Water Sci. Technol., 23, 1347-1354. 
+	   	   1	   57	   	   	   	   	  
+REFERENCES 
+ 
+Tuček, F., Chudoba, J. and Maděra, V. (1971). Unified basis for design of biological aerobic treatment 
+processes. Water Res., 5, 647-680. 
+ 
+Turan, M. and Ozturk, I. (1996). Longitudinal Dispersion and biomass hold-up of anaerobic fluidized 
+bed reactor. Water. Sci. Technol., 43, 461-468. 
+ 
+Turian, R.M., Fox, G.E. and Rice, R.A. (1975). The dispersed flow model for a biological reactor as 
+applied to the activated sludge process. Can. J. Chem. Eng., 53, 431-437.  
+ 
+U.S.E.P.A., (1993). EPA/625/R-93/010. United States Environmental Protection Agency Office of 
+Research and Development, Washington, DC. 
+ 
+U.S.E.P.A., (2001). METHOD 1684 Total, Fixed, and Volatile Solids in Water, Solids, and Biosolids, 
+in: (4303), E.a.A.D. (Ed.), Washington, DC 20460. 
+ 
+Valorgas (2012). Seventh Framework Programme Theme Energy.2009.3.2.2. Biowaste as feedstock for 
+a 2nd generation. University of Southampton (Soton).  
+ 
+Van der Laan (1957). Notes on the diffusion-type model for the longitudinal mixing in flow. Chem. 
+Eng. Sci., 6, 187-191. 
+ 
+Van Der Meer, R.R., Heertjes, P.M. (1983). Mathematical description of anaerobic treatment of 
+wastewater in upflow reactors. Biotechnol. Bioeng., 25, 2531-2556. 
+ 
+Vandevenne, L. (1986). Epuration secondaire par lits bactériens. Final Report, CEBEDEAU-A.S.B.L, 
+Liège, Belgium. 
+ 
+	   	   1	   58	   	   	   	   	  
+REFERENCES 
+Vandevivere, P. (1999). New and broader applications of anaerobic digestion. Critical Rev. Env. Sci. 
+and Technol., 29, 151-173. 
+ 
+Vavilin, V.A., Lokshina, L.Y., Rytov, S.V., Kotsyurbenko, O.R., Nozhevnikova, A.N. and Parshina, 
+S.N. (1997). Modelling methanogenesis during anaerobic conversion of complex organic matter at 
+low temperatures. Water Sci. Technol., 36, 531–538 
+ 
+Vavilin, V.A., Lokshina, L.Y. (1996a). Modeling of volatile fatty acids degradation kinetics and 
+evaluation of microorganism activity. Bioresour. Technol. 57, 69–80. 
+ 
+Vavilin, V.A., Rytov, S.V., Lokshina, L.Y. (1996b). A description of hydrolysis kinetics in anaerobic 
+degradation of particulate organic matter. Bioresour. Technol., 56, 229–237 
+ 
+Vavilin, V.A., Rytov, S.V., Lokshina, L.Y., Pavlostathis, S.G. and Barlaz, M.A. (2003). Distributed 
+model of solid waste anaerobic digestion: Effects of leachate recirculation and pH adjustment. 
+Biotechnol. Bioeng. 81, 66-73 
+ 
+Vavilin, V.A., Rytov, S.V., Lokshina, L.Ya. and Rintala, J.A. (1999). Description of hydrolysis and 
+acetoclastic methanogenesis as the rate-limiting steps during anaerobic conversion of solid waste 
+into methane. In: Mata-Alvarez, J., Tilche, A., Cecchi, F. (Eds.), Proceedings of the Second 
+International Symposium on Anaerobic Digestion of Solid Wastes, Barcelona,1-4 June, 15-18, 
+Barcelona, SP . 
+ 
+Vavilin, V.A., Rytov, S.V., Lokshina, L.Y., Rintala, J. A. and Lyberatos, G. (2001). Simplified 
+hydrolysis models for the optimal design of two-stage anaerobic digestion. Water Res., 35, 4247-4251 
+ 
+Veeken, A. and Hamelers B. (1999). Effect of temperature on hydrolysis rates of selected biowaste 
+components. Bioresour. Technol., 69, 249-254. 
+ 
+	   	   1	   59	   	   	   	   	  
+REFERENCES 
+Vermande, S. (2005). Hydraulics and biological modelling of activated sludge basins. PhD thesis, 
+INSA Toulouse, Toulouse, France.  
+ 
+Vesvikar, M.S. and Al-Dahhan, M. (2005). Flow pattern visualization in a mimic anaerobic digester 
+using CFD. Biotechnol. Bioeng., 89, 719–732.  
+ 
+Wang, Z., Xu, F., Li, Y. (2013). Effects of total ammonia nitrogen concentration on solid-state 
+anaerobic digestion of corn stover. Bioresour. Technol. 144, 281–287. 
+ 
+Ward, A. J., Hobbs, P. J., Holliman, P. J., Jones, D.L. (2008). Optimisation of the anaerobic digestion 
+of agricultural resources. Bioresour. Technol. 99, 7928-7940. 
+ 
+Wisecaver, K.D. and Fan, L.S. (1989). Biological phenol degradation in a gas-liquid-solid fluidized 
+bed reactor. Biotechnol. Bioeng., 33,1029-1038. 
+ 
+Wehner, J.F. and Wilhelm, R.H. (1956). Boundary conditions of flow reactor. Chem. Eng. Sci., 6, 89-
+93.  
+ 
+Worden RM and Donaldson TL. (1987). Dynamics of a biological fixed film for phenol degradation 
+in a fluidized bed reactor. Biotechnol. Bioeng., 30, 398-405. 
+ 
+Wu, M.M. and Hickey, R.F. (1997). Dynamic model for UASB reactor including reactor hydraulics, 
+reaction, and diffusion. J. Environ. Eng. 123, 244–252. 
+ 
+Wu, B. and Chen, S. (2008). CFD simulation of non-Newtonian fluid flow in anaerobic digesters. 
+Biotechnol. Bioeng., 99, 700-711. 
+ 
+Xu, F., Li, Y. (2012). Solid-state co-digestion of expired dog food and corn stover for methane 
+production. Bioresour. Technol. 118, 219–226. 
+ 
+	   	   1	   60	   	   	   	   	  
+REFERENCES 
+Yan, J.Q., Lo, K.V., Liao, P.H. (1989). Anaerobic digestion of cheese whey using up-flow anaerobic 
+sludge blanket reactor. Biol. Wastes. 27, 289–305. 
+ 
+Yan, J.Q., Lo, K.V., Pinder, K.L. (1993). Instability caused by high strength of cheese whey in a 
+UASB reactor. Biotechnol. Bioeng. 41, 700–706. 
+ 
+Young, J. C, and McCarty, P. L. (1968). The anaerobic filter for waste treatment. Tech. Report No. 
+87, Dept. of Civ. Engrg., Stanford Univ., Stanford, Calif. 
+ 
+Yu, J. (1999). A three-phase ﬂuidized bed reactor in the combined anaerobic/aerobic treatment of 
+wastewater. J. Chem. Technol. Biot., 74, 619-62. 
+ 
+Zaher, U. and Chen, S., (2006). Interfacing the IWA anaerobic digestion model no1 (ADM1) with 
+manure and solid waste characteristics. Proc. 79th Annual WEF Conference and Exposition 
+(WEFTEC), October 21–25, Dallas, USA. 
+ 
+Zeng, Y., Mu, S.J., Lou, S.J., Tartakovsky, B., Guiot, S.R. and Wu, P. (2005). Hydraulic modeling 
+and axial dispersion analysis of UASB reactor. Biochem. Eng. J. 25, 113-123. 
+ 
+Zeshan and Annachhatre, A.P. (2012). Dry anaerobic digestion of municipal solid waste and digestate 
+management strategies. Asian Institute of Technology. 
+ 
+Zhang, R., El-Mashad, H. M., Hartman, K., Wang, F., Liu, G., Choate, C., Gamble, P. (2007). 
+Characterization of food waste as feedstock for anaerobic digestion. Bioresour. Technol. 98, 929-935. 
+ 
+Zhang, R. and Zhang, Z. (1999). Biogasification of rice straw with an anaerobic-phased solids digester 
+system. Bioresour. Technol. 68, 235-245. 
+ 
+	   	   1	   61	   	   	   	   	  
+REFERENCES 
+Zhu, J., Zheng, Y., Xu, F., Li, Y. (2014). Solid-state anaerobic co-digestion of hay and soybean   
+processing waste for biogas production. Bioresour. Technol. 154, 240-247. 
+ 
+Zima, P., Makinia, J., Swinarski, M., & Czerwionka, K. (2009). Combining computational fluid 
+dynamics with a biokinetic model for predicting ammonia and phosphate behavior in aeration tanks. 
+Water Env. Res., 81, 2353-2362. 
+ 
+Zupančič, G.D. and Roš, M. (2012). Determination of Chemical Oxygen Demand in Substrates from 
+Anaerobic Treatment of Solid Organic Waste. Waste and Biom. Valor., 3, 89-98. 
+	   	   1	   62	   	   	   	   	  
diff --git a/examples/theses/These_Nathalie_Mitton.pdf b/examples/theses/These_Nathalie_Mitton.pdf
new file mode 100644
index 00000000..e7a491d7
Binary files /dev/null and b/examples/theses/These_Nathalie_Mitton.pdf differ
diff --git a/examples/theses/These_Nathalie_Mitton/fulltext.pdf b/examples/theses/These_Nathalie_Mitton/fulltext.pdf
new file mode 100644
index 00000000..e7a491d7
Binary files /dev/null and b/examples/theses/These_Nathalie_Mitton/fulltext.pdf differ
diff --git a/examples/theses/These_Nathalie_Mitton/fulltext.pdf.txt b/examples/theses/These_Nathalie_Mitton/fulltext.pdf.txt
new file mode 100644
index 00000000..0408604d
--- /dev/null
+++ b/examples/theses/These_Nathalie_Mitton/fulltext.pdf.txt
@@ -0,0 +1,5069 @@
+AUTO-ORGANISATION DES RESEAUX SANS FIL
+MULTI-SAUTS A GRANDE ECHELLE.
+Nathalie Mitton
+To cite this version:
+Nathalie Mitton. AUTO-ORGANISATION DES RESEAUX SANS FIL MULTI-SAUTS A
+GRANDE ECHELLE.. Computer Science. INSA de Lyon, 2006. French. <tel-00599147>
+HAL Id: tel-00599147
+https://tel.archives-ouvertes.fr/tel-00599147
+Submitted on 8 Jun 2011
+HAL is a multi-disciplinary open access
+archive for the deposit and dissemination of sci-
+entific research documents, whether they are pub-
+lished or not. The documents may come from
+teaching and research institutions in France or
+abroad, or from public or private research centers.
+L’archive ouverte pluridisciplinaire HAL, est
+destinée au dépôt et à la diffusion de documents
+scientifiques de niveau recherche, publiés ou non,
+émanant des établissements d’enseignement et de
+recherche français ou étrangers, des laboratoires
+publics ou privés.
+Mémoire
+présenté par
+Nathalie MITTON
+en vue de l’obtention du diplôme
+DOCTORAT EN INFORMATIQUE ET
+RESEAUX
+de l’INSA de Lyon
+AUTO-ORGANISATION DES RÉSEAUX
+SANS FIL MULTI-SAUTS À GRANDE
+ÉCHELLE.
+Soutenue le 27/03/2006.
+Numéro d’ordre : 2006-ISAL-0023.
+Apre`s avis de : Franc¸ois BACCELLI
+Catherine ROSENBERG
+David SIMPLOT-RYL
+Devant la commission d’examen forme´e de :
+Bartlomiej (Bartek) BLASZCZYSZYN
+Charge´ de recherche a` l’INRIA - TREC
+Serge FDIDA
+Professeur a` l’Universite´ Pierre et Marie Curie – Paris VI
+E´ ric FLEURY (Directeur de the`se)
+Professeur a` l’INSA de LYON
+Isabelle GUE´ RIN LASSOUS (Directrice de the`se)
+Charge´e de recherche habilite´e a` l’INRIA - ARES
+David SIMPLOT-RYL (Rapporteur)
+Professeur a` l’Universite´ de Lille
+pour les travaux effectue´s au Centre d’Innovations en Te´le´communications & Inte´gration
+de services de l’INSA de Lyon (CITI) sous la direction du Pr. E´ ric Fleury et du Dr. Isabelle
+Gue´rin-Lassous.
+Table des matie`res
+1 Introduction 7
+1.1 Me´thodologies et notations . . . . . . . . . . . . . . . . . . . . . . . 10
+1.1.1 Mode`le utilise´ dans les analyses stochastiques . . . . . . . . . 10
+1.1.2 Mode`le de simulation . . . . . . . . . . . . . . . . . . . . . . 11
+2 E´ tat de l’art 13
+2.1 Clusters a` 1 saut . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 14
+2.2 Clusters a` k sauts . . . . . . . . . . . . . . . . . . . . . . . . . . . . 18
+2.3 Clusters hie´rarchiques . . . . . . . . . . . . . . . . . . . . . . . . . . 21
+2.4 Conclusion . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 22
+3 Algorithme de clustering 23
+3.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 23
+3.2 La me´trique de densite´ . . . . . . . . . . . . . . . . . . . . . . . . . 24
+3.3 La formation des clusters . . . . . . . . . . . . . . . . . . . . . . . . 24
+3.4 Maintenance de la structure . . . . . . . . . . . . . . . . . . . . . . . 28
+3.5 Analyse de la me´trique . . . . . . . . . . . . . . . . . . . . . . . . . 28
+3.5.1 Recherche de la meilleure k-densite´ . . . . . . . . . . . . . . 28
+3.5.2 Densite´ moyenne . . . . . . . . . . . . . . . . . . . . . . . . 29
+3.5.3 Re´partition des valeurs de densite´ . . . . . . . . . . . . . . . 31
+3.6 Analyse de la structure . . . . . . . . . . . . . . . . . . . . . . . . . 31
+3.6.1 Analyse the´orique du nombre de clusters . . . . . . . . . . . 31
+3.6.2 Caracte´ristiques des clusters . . . . . . . . . . . . . . . . . . 33
+3
+4 TABLE DES MATIE`RES
+3.7 Comparaison a` d’autres heuristiques . . . . . . . . . . . . . . . . . . 36
+3.7.1 Comparaison avec DDR . . . . . . . . . . . . . . . . . . . . 36
+3.7.2 Comparaison avec l’heuristique Max-Min d-cluster . . . . . . 39
+3.8 Analyse de l’auto-stabilisation . . . . . . . . . . . . . . . . . . . . . 42
+3.8.1 Pre´-requis . . . . . . . . . . . . . . . . . . . . . . . . . . . . 43
+3.8.2 Construction d’un DAG de hauteur constante . . . . . . . . . 44
+3.8.3 Analyse de la construction du DAG de couleurs . . . . . . . . 45
+3.8.4 Utilisation des couleurs pour le clustering . . . . . . . . . . . 48
+3.8.5 Validation des proprie´te´s auto-stabilisantes . . . . . . . . . . 50
+3.9 Conclusion . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 52
+3.10 Publications . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 53
+3.11 Annexes . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 54
+3.11.1 Analyse de la densite´ moyenne . . . . . . . . . . . . . . . . . 54
+3.11.2 Calcul analytique du nombre de clusters . . . . . . . . . . . . 56
+3.11.3 Temps de transmission borne´ . . . . . . . . . . . . . . . . . . 58
+4 Diffusion 61
+4.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 61
+4.2 E´ tat de l’art . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 62
+4.3 Analyse the´orique . . . . . . . . . . . . . . . . . . . . . . . . . . . . 64
+4.4 Notre contribution a` la diffusion . . . . . . . . . . . . . . . . . . . . 66
+4.4.1 Se´lection des passerelles . . . . . . . . . . . . . . . . . . . . 66
+4.4.2 L’algorithme de diffusion . . . . . . . . . . . . . . . . . . . . 71
+4.5 Analyses et re´sultats de simulations . . . . . . . . . . . . . . . . . . 72
+4.5.1 E´ lection et utilisation des passerelles . . . . . . . . . . . . . . 72
+4.5.2 Performances de la diffusion . . . . . . . . . . . . . . . . . . 74
+4.5.3 Robustesse de la diffusion . . . . . . . . . . . . . . . . . . . 79
+4.6 Analyse de la se´lection des MPR dans OLSR . . . . . . . . . . . . . 82
+4.6.1 La se´lection des MPR . . . . . . . . . . . . . . . . . . . . . 82
+4.6.2 Analyse . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 84
+4.6.3 Re´sultats nume´riques et simulations . . . . . . . . . . . . . . 88
+4.6.4 Conse´quences . . . . . . . . . . . . . . . . . . . . . . . . . . 90
+4.7 Conclusion et perspectives . . . . . . . . . . . . . . . . . . . . . . . 91
+4.8 Publications . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 92
+4.9 Annexes . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 93
+TABLE DES MATIE`RES 5
+5 Localisation et routage 97
+5.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 97
+5.2 Localisation et routage . . . . . . . . . . . . . . . . . . . . . . . . . 100
+5.2.1 Re´sume´ et analyse de complexite´ . . . . . . . . . . . . . . . 101
+5.3 Notre proposition . . . . . . . . . . . . . . . . . . . . . . . . . . . . 102
+5.3.1 Pre´liminaires . . . . . . . . . . . . . . . . . . . . . . . . . . 102
+5.3.2 Distribution des partitions de l’espace virtuel - ILS . . . . . . 103
+5.3.3 Enregistrement . . . . . . . . . . . . . . . . . . . . . . . . . 104
+5.3.4 De´parts et arrive´es . . . . . . . . . . . . . . . . . . . . . . . 104
+5.3.5 Ajouter de la redondance et de la robustesse . . . . . . . . . . 106
+5.3.6 Ope´ration de look-up . . . . . . . . . . . . . . . . . . . . . . 106
+5.3.7 Routage sur le re´seau physique . . . . . . . . . . . . . . . . . 112
+5.4 Simulations . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 114
+5.4.1 SAFARI . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 114
+5.4.2 Comparaison des structures . . . . . . . . . . . . . . . . . . 116
+5.4.3 Look-up et routage . . . . . . . . . . . . . . . . . . . . . . . 118
+5.5 Conclusion . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 122
+5.6 Publications . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 124
+6 Conclusion et perspectives 125
+6.1 Conclusion . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 125
+6.2 Perspectives . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 126
+6 TABLE DES MATIE`RES
+Chapitre 1
+Introduction
+De nos jours, les gens se de´placent et communiquent de plus en plus. Ils ont de´sormais
+besoin de nouvelles technologies leur permettant de fac¸on simple et rapide de re´cupe´rer
+diverses informations et de communiquer avec des personnes distantes pouvant eˆtre
+n’importe ou` dans le monde. Ces dernie`res anne´es ont vu le de´veloppement technolo-
+gique de nombreux composants et appareils e´lectroniques de toute sorte pour re´pondre
+a` ces nouveaux besoins. Ces appareils communicants sont de plus en plus petits, ont
+des capacite´s de calcul de plus en plus performantes et sont de plus en plus re´pandus.
+On les rencontre partout dans notre quotidien : a` la maison, au bureau, dans les voi-
+tures, etc. Les acce`s a` l’information deviennent omnipre´sents a` travers les te´le´phones
+portables, ordinateurs portables, PDA et les technologies de communications sans fil.
+Cependant, l’apparition et l’expansion de ces phe´nome`nes ont e´galement conduit a`
+une explosion de la complexite´ a` tout niveau, a` un point de´passant les capacite´s hu-
+maines a` controˆler et se´curiser. L’intervention humaine doit eˆtre remplace´e par une
+auto-gestion du syste`me par les machines. C’est ce qu’on appelle l’autonomic compu-
+ting. Afin d’assurer l’ubiquite´ des informations, les entite´s technologiques doivent eˆtre
+mises en re´seau et eˆtre capables de re´pondre aux de´fis suivants :
+Auto-configuration et auto-organisation. Chaque entite´ doit eˆtre capable de se
+configurer elle-meˆme a` partir d’interactions locales avec les autres entite´s afin
+de faire e´merger un comportement global qui assure le bon fonctionnement
+du re´seau. Elle doit s’adapter aux modifications de la topologie du re´seau. Par
+exemple, les entite´s doivent eˆtre capables d’e´tablir des routes pour joindre les
+personnes souhaite´es ou acce´der a` une information donne´e.
+Auto-gue´rison. Lorsqu’une panne se produit, le re´seau doit eˆtre capable de la loca-
+liser, de l’identifier et de l’isoler afin qu’elle ne contamine pas l’ensemble du
+re´seau, et si possible de la corriger.
+Auto-optimisation. Chaque entite´ doit pre´server les ressources globales du re´seau afin
+de lui assurer une dure´e de vie aussi longue que possible, tout en effectuant
+correctement les taˆches qui lui sont alloue´es.
+7
+8 CHAPITRE 1. INTRODUCTION
+Auto-protection. Le re´seau doit eˆtre capable d’apprendre de ses fautes et des at-
+taques exte´rieures qui surviennent. Il doit pouvoir les identifier rapidement et
+se prote´ger contre elles.
+Tous ces de´fis doivent pouvoir eˆtre adresse´s en tenant compte des contraintes
+intrinse`ques des entite´s technologiques et des technologies de communication.
+L’autonomic computing couvre ainsi un tre`s large domaine des re´seaux informatiques,
+tous pre´sentant des contraintes supple´mentaires spe´cifiques. Au sein de ce large spectre
+que repre´sente l’autonomic computing et qui repre´sente un re´el de´fi scientifique pour
+les anne´es a` venir, je me suis oriente´e lors de ma the`se vers le domaine des re´seaux
+sans fil tels que les re´seaux ad hoc ou les re´seaux de capteurs, qui offre l’avantage
+d’eˆtre plus cible´ en termes d’applications, tout en englobant un grand nombre des de´fis
+scientifiques pre´sente´s ci dessus.
+Les re´seaux sans fil multi-sauts sont des re´seaux radio mobiles sans aucune infrastruc-
+ture, ce qui leur permet une implantation rapide. Ils peuvent aussi eˆtre couple´s a` un
+LAN pour e´tendre la couverture d’une infrastructure existante. Les entite´s peuvent
+apparaıˆtre, disparaıˆtre, se de´placer inde´pendamment les unes des autres. La topolo-
+gie du re´seau est e´volutive. Les terminaux peuvent communiquer dans la limite de
+la porte´e de leur communication radio. Un sche´ma de communication multi-sauts est
+ne´cessaire pour permettre a` deux correspondants distants de communiquer. Dans ce
+sche´ma de communication, chaque terminal peut eˆtre utilise´ comme routeur pour re-
+layer les communications d’autres terminaux. La configuration de ces routes multi-
+sauts est re´alise´e par un protocole de routage. Afin d’eˆtre efficaces, ces protocoles
+de routage doivent conside´rer les caracte´ristiques intrinse`ques du re´seau (topologie en
+constante e´volution), des terminaux (taille me´moire et capacite´s de calcul limite´es...)
+et du me´dium de communication (bande passante limite´e, interfe´rences...).
+Il existe aujourd’hui de nombreux protocoles de routage pour de tels re´seaux. Cepen-
+dant, bien qu’efficaces sur des re´seaux peu denses ou de petite ou moyenne taille, aucun
+d’eux ne peut eˆtre utilise´ sur de grandes e´chelles car ils ge´ne´reraient trop de trafic de
+controˆle ou ne´cessiteraient des tables de routage trop importantes. L’une des solutions
+commune´ment propose´es pour le routage sur de grandes e´chelles est d’introduire un
+routage hie´rarchique en regroupant ge´ographiquement des entite´s proches en clusters
+et en utilisant des sche´mas de routage diffe´rents au sein des clusters et entre les clus-
+ters. Une telle approche permet a` chaque entite´ de stocker la totalite´ des informations
+de son cluster et seulement une partie des informations concernant les autres clusters
+et de cette fac¸on, permet une extensibilite´ du re´seau.
+Dans ce document, je pre´sente une solution d’utilisation de re´seau sans fil multi-sauts
+dense. Ce document est organise´ suivant les diffe´rentes e´tapes de cette solution : or-
+ganisation du re´seau, diffusion, localisation et routage. A` chaque e´tape, les re´sultats
+obtenus ont e´te´ analyse´s par simulation, par des e´tudes comparatives avec des solu-
+tions existantes et, lorsque cela e´tait possible par une analyse the´orique. Le premier
+chapitre est la pre´sente introduction, dans laquelle je pre´sente les notations utilise´es au
+cours du document et les mode`les utilise´s pour les e´tudes analytiques et les simula-
+tions. Dans le chapitre 2, les diffe´rentes approches propose´es dans la litte´rature pour
+organiser un re´seau en clusters sont pre´sente´es. Seules les me´thodes qui proposent une
+9
+organisation du réseau sont mentionnées. Il existe également de nombreuses études sur
+l’apport de cette organisation sur la capacite´ du re´seau comme c’est le cas de [37] mais
+cet aspect n’est pas l’objet de cette the`se et ces e´tudes ne sont donc pas pre´sente´es dans
+ce chapitre.
+Le chapitre 3 de´crit notre solution de clustering et en e´tudie les diffe´rentes ca-
+racte´ristiques. L’algorithme de clustering se base sur une nouvelle me´trique qui permet
+de lisser des petits changements de topologie. Les clusters sont construits en s’adap-
+tant a` la topologie sous-jacente, sans contrainte ni parame`tre fixe´ a priori. Une analyse
+the´orique permet de de´gager certaines proprie´te´s comme une borne supe´rieure sur le
+nombre de clusters obtenus sur une surface donne´e. Des simulations de´gagent des ca-
+racte´ristiques de la structure obtenue et comparent ses performances aux structures
+obtenues a` partir d’autres protocoles de clustering existants. Il en ressort que notre
+algorithme construit des clusters qui offrent le meilleur comportement face a` la dy-
+namicite´ des entite´s du re´seau. Dans ce chapitre, nous montrons e´galement que notre
+algorithme est auto-stabilisant localement, ce qui lui confe`re de bonnes proprie´te´s pour
+le passage a` l’e´chelle et la re´sistance aux fautes.
+A` partir des caracte´ristiques de´gage´es de la structure de clusters, nous proposons deux
+grandes applications indispensables a` tout re´seau : une diffusion efficace d’information
+et un processus de routage. Nous construisons donc une seule structure pour diverses
+applications. Le processus de diffusion est pre´sente´ et e´tudie´ dans le chapitre 4. Ce
+protocole de diffusion a pour avantage d’avoir deux de´clinaisons : il peut permettre une
+diffusion globale a` l’ensemble du re´seau et/ou une diffusion limite´e au sein d’un cluster.
+Il ne demande que peu d’e´changes et de calculs. La diffusion ainsi ge´ne´re´e s’ave`re
+solliciter moins d’entite´s que les protocoles de diffusion existants et donc consomme
+moins d’e´nergie, tout en e´tant plus robuste face a` des cassures de liens.
+Le chapitre 5 aborde le processus de routage hie´rarchique applique´ a` la structure. Il
+s’agit d’un protocole de routage indirect (c.a`.d. effectue´ en deux temps) qui pre´sente
+une approche originale, en conside´rant le sche´ma inverse de celui ge´ne´ralement utilise´
+dans la litte´rature. En effet, les caracte´ristiques des clusters ont montre´ qu’un sche´ma
+classique pre´senterait les meˆmes proble`mes d’extensibilite´ rencontre´s dans un re´seau a`
+plat, comme nous le verrons. Ce processus de routage inte`gre un processus de locali-
+sation base´ sur les tables de hachage distribue´es et sur la mise en œuvre d’un routage
+adapte´ aux re´seaux sans fil, comme le routage par intervalle. Le protocole de rou-
+tage fournit des routes proches de l’optimal tout en maintenant O(1) informations sur
+chaque entite´.
+Le dernier chapitre conclut ce document et donne plusieurs perspectives a` l’ensemble
+des travaux mene´s au cours de cette the`se. Ce travail a e´te´ re´alise´ dans le cadre de ma
+the`se effectue´e au sein du laboratoire CITI de l’INSA de Lyon et de l’e´quipe INRIA
+ARES, sous la direction d’E´ ric FLEURY et d’Isabelle GUE´RIN LASSOUS.
+10 CHAPITRE 1. INTRODUCTION
+1.1 Méthodologies et notations adoptées au cours de la
+thèse
+Un réseau sans fil multi-sauts peut être modélisé par un graphe G = (V,E) où V
+représente l’ensemble des terminaux mobiles et E représente les liaisons radios existant
+entre ces stations. Dans notre approche, nous n’avons considéré que des liens radios bi-
+directionnels, c.à.d. qu’un lien e = (u, v) existe si les stations u et v sont à portée de
+communication radio l’une de l’autre.
+Nous notons dist(u, v) la distance euclidienne de u a` v et d(u, v) la distance dans
+le graphe (en nombre de sauts) entre les nœuds u et v. Cette distance correspond au
+nombre de sauts minimum que l’on doit faire pour rejoindre v depuis u. Nous notons
+$\Gamma_k(u)$ le k-voisinage (ou le voisinage à k sauts) du nœud u. Le k-voisinage d’un nœud
+est l’ensemble des nœuds à au plus k sauts de lui : $\Gamma_k(u) = \{v \neq u \mid d(u, v) \leq k\}$. Nous
+notons $\delta_k(u) = |\Gamma_k(u)|$ la cardinalité de cet ensemble. On note généralement $\Gamma(u)$
+pour $\Gamma_1(u)$. On remarquera que u n’appartient pas à $\Gamma_k(u)$ ($\forall k > 0,\ u \notin \Gamma_k(u)$). Par
+définition, $\delta_1(u) = \delta(u) = |\Gamma_1(u)|$ est le degré du nœud u.
+Nous de´signons par C(u) le cluster auquel appartient le nœud u et H(u) son cluster-
+head.
+Nous utilisons $e(u/C)$ pour désigner l’excentricité du nœud u dans un cluster C. L’ex-
+centricité d’un nœud est la plus grande distance entre u et tout autre nœud du même
+cluster C : $e(u/C) = \max_{v \in C(u)} d(u, v)$. Le diamètre d’un cluster C, noté $D(C)$, est
+la plus grande excentricité dans ce cluster : $D(C) = \max_{u \in C} e(u/C)$.
+1.1.1 Mode`le utilise´ dans les analyses stochastiques
+Lors des diffe´rentes analyses the´oriques que nous avons mene´es, nous repre´sentons un
+re´seau sans fil multi-sauts par un processus ponctuel de Poisson d’intensite´ constante
+λ.
+Un processus de Poisson est un processus ponctuel pour lequel la disposition des points
+est comple`tement ale´atoire a` chaque re´alisation. L’une des proprie´te´s caracte´risant le
+processus de Poisson est que le nombre de points dans une zone donne´e est inde´pendant
+des autres points du processus. Le processus de Poisson est le processus repre´sentant
+le mieux la distribution des nœuds du re´seau dans l’espace. Dans cette the`se, nous
+n’avons considéré que des processus de Poisson homogènes (intensité constante dans le
+plan) et isotropes (propriétés invariantes par rotation).
+Pour simuler une re´alisation d’un processus de Poisson homoge`ne d’intensite´ λ dans
+un carre´ de surface S, on de´finit d’abord le nombre de points N du semis en tirant un
+nombre pseudo-aléatoire dans une loi de Poisson de paramètre λ × S. Le nombre de
+points N prend les valeurs k avec la probabilité suivante : $P(N = k) = \frac{(\lambda S)^k}{k!} \exp(-\lambda S)$.
+λ repre´sente alors le nombre moyen de nœuds par unite´ de surface. Pour chaque point
+i, l’abscisse xi et l’ordonne´e yi sont ensuite de´finies par un nombre pseudo-ale´atoire
+tire´ dans une loi uniforme.
+1.1. ME´THODOLOGIES ET NOTATIONS 11
+Si Φ est le processus de Poisson conside´re´, on de´signe par Φ(S) l’ensemble des points
+du processus Φ distribue´s dans la surface S. Nous conside´rons qu’il existe un lien entre
+deux points du processus u et v si dist(u, v) ≤ R ou` R est la porte´e de communication
+radio des nœuds (u et v sont voisins).
+1.1.2 Mode`le de simulation
+1+2R
+1
+           
+           
+           
+           
+           
+w
+           
+           
+           
+            W
+           
+           
+           
+FIG. 1.1 – Seuls les nœuds de w sont conside´re´s pour les mesures simule´es mais le
+processus de point est distribue´ dans W afin d’e´liminer les effets de bord.
+Toutes les simulations mene´es lors de cette the`se suivent le meˆme mode`le. Nous avons
+utilise´ un simulateur que nous avons de´veloppe´. Ce simulateur suppose une couche
+MAC ide´ale, c.a`.d qui ne ge´ne`re aucune collision. Utiliser ce simulateur plutoˆt qu’un
+simulateur re´seau qui prend en compte les collisions et caracte´ristiques des protocoles
+de niveaux infe´rieurs nous permet de focaliser notre e´tude sur le comportement des
+protocoles de niveau 3 uniquement, sans tenir compte des ale´as des protocoles utilise´s
+au niveau des autres couches.
+Les nœuds sont de´ploye´s ale´atoirement suivant un processus de Poisson dans une
+feneˆtre carre´e de (1 + 2R) × (1 + 2R) avec diffe´rentes intensite´s λ. On conside`re
+que deux nœuds u et v sont voisins si dist(u, v) ≤ R ou` R est la porte´e de communi-
+cation radio des nœuds. Dans chaque cas, chaque statistique est la moyenne sur plus de
+1000 simulations. Les mesures ne sont prises en compte que si l’ensemble des nœuds
+forme une composante connexe (aucune entité n’est isolée dans le réseau).
+De fac¸on a` e´liminer les effets de bords de cette feneˆtre, les diffe´rentes mesures ne sont
+calculées que sur les nœuds se trouvant dans une fenêtre centrale w de taille 1 × 1 (voir
+Figure 1.1), l’ensemble des points du processus étant distribués dans la fenêtre W et les
+points de w restant impacte´s par les points en dehors de w. Cette technique est appele´e
+”minus-sampling”. Pour une description plus de´taille´e, se re´fe´rer a` [76] page 132.
+12 CHAPITRE 1. INTRODUCTION
+Chapitre 2
+État de l’art
+Un re´seau ad hoc ne repose sur aucune infrastructure fixe. Les entite´s sont
+inde´pendantes les unes des autres et communiquent entre elles par radio, sans utiliser
+de station de base. Afin de permettre des communications entre deux stations n’e´tant
+pas a` porte´e radio l’une de l’autre, les nœuds interme´diaires doivent relayer le message.
+Afin que le relais des messages soit efficace, il faut e´tablir des routes entre les nœuds,
+de fac¸on a` ce que chaque entite´ sache vers quelle autre station envoyer le message pour
+qu’il puisse atteindre sa destination. C’est le roˆle principal des protocoles de routage.
+Les protocoles de routage classiques standardise´s au sein du groupe de travail MANET
+(Mobile Ad hoc NETwork) de l’IETF¹ se montrent efficaces sur des réseaux de petite
+ou moyenne taille mais passent difficilement a` l’e´chelle [46, 71].
+Il existe classiquement deux grandes familles de protocoles de routage dans la
+litte´rature et au sein du groupe MANET :
+– pro-actif : les routes sont e´tablies et maintenues en permanence sur chaque nœud.
+L’avantage d’un tel processus est qu’une route est disponible imme´diatement quelle
+que soit la destination. Les inconve´nients sont la taille des tables de routage a` main-
+tenir sur chaque nœud (taille en O(n) si n est le nombre de nœuds dans le re´seau) et
+le nombre de messages de controˆle a` envoyer pe´riodiquement pour maintenir a` jour
+les routes qui ne sont pas toujours employe´es.
+– re´actif : les routes sont cherche´es a` la demande. L’avantage d’un tel protocole
+est qu’il permet d’alle´ger en moyenne les tables de routage et de ne pas envoyer
+pe´riodiquement des messages de recherche de route. L’inconve´nient est que lors-
+qu’une route est ne´cessaire, la recherche de route vers le nœud destination peut eˆtre
+tre`s longue, incluant une forte latence et ne´cessitant une inondation du re´seau.
+Ainsi, avec de tels protocoles ”a` plat”, lorsque la taille re´seau grandit, le trafic de
+contrôle a tendance à devenir prédominant, laissant la portion congrue aux communi-
+cations réelles. Cela se traduit également par une augmentation de la latence et/ou
+une explosion de la table de routage. Pour pallier ce problème, une des solutions com-
+¹ http://www.ietf.org/html.charters/manet-charter.html
+13
+14 CHAPITRE 2. E´TAT DE L’ART
+mune´ment propose´es est d’introduire un routage hie´rarchique et d’organiser des nœuds
+en groupes aussi nomme´s clusters.
+Le clustering consiste en un de´coupage virtuel du re´seau en groupes de nœuds proches
+ge´ographiquement. Ces groupes sont appele´s clusters. Ils sont ge´ne´ralement identifie´s
+par un nœud particulier, un chef de groupe aussi nomme´ cluster-head. Dans la plupart
+des algorithmes de clustering, les clusters sont construits a` partir d’une me´trique par-
+ticulie`re qui permet d’assigner un chef a` chaque nœud ; le cluster e´tant alors constitue´
+du cluster-head et de tous les nœuds qui lui sont rattache´s. L’ide´e initiale du routage
+hie´rarchique est de permettre a` chaque entite´ de stocker la totalite´ des informations de
+son cluster et seulement une partie des informations concernant les autres clusters. Cela
+minimise la taille des tables de routage et la quantite´ de trafic ge´ne´re´.
+Outre le fait de rendre le routage plus efficace, le clustering pre´sente e´galement d’autres
+avantages. Il peut faciliter le partage des ressources et/ou la synchronisation au sein
+d’un cluster et permettre une re´-utilisation spatiale des fre´quences radio pour minimiser
+les interfe´rences [50]. Plus important encore, l’organisation d’un re´seau apporte aussi
+plus de stabilite´ [61].
+De nombreuses solutions de clustering ont e´te´ propose´es. La majorite´ d’entre elles pro-
+posent l’utilisation d’une me´trique qui permet aux nœuds de se choisir un chef. Cette
+me´trique peut eˆtre par exemple l’identifiant ou le degre´ des nœuds, une valeur de mobi-
+lite´ des nœuds ou encore une somme ponde´re´e de tous ces e´le´ments. D’autres solutions
+cherchent dans un premier temps a` de´terminer un ensemble dominant connecte´ sur le-
+quel les clusters sont baˆtis. Une grande partie des solutions de clustering construisent
+des clusters a` 1 saut (dits 1-clusters), c.a`.d des clusters ou` chaque nœud est a` un saut
+de son chef de cluster. Les protocoles donnant naissance a` des k-clusters (clusters ou`
+chaque nœud est a` au plus k sauts de son cluster-head) sont plus re´cents et plus rares.
+Dans ce chapitre, nous dressons un e´tat de l’art qui permet de passer en revue les
+principaux types de solutions propose´es dans la litte´rature pour organiser un re´seau ad
+hoc en clusters.
+2.1 Clusters a` 1 saut
+De nombreux algorithmes de clustering produisent des clusters a` 1 saut. L’un des al-
+gorithmes les plus anciens est ”l’algorithme du plus petit ID” ou LCA, propose´ initia-
+lement par Ephremides, Wieselthier et Baker dans [28]. Chaque nœud se de´signe ou
+non cluster-head en se basant sur son identifiant et celui de ses voisins. Un nœud peut
+avoir trois statuts diffe´rents : cluster-head, passerelle ou nœud ordinaire. A` l’origine,
+tous ont un statut de nœud ordinaire. Si un nœud u a le plus petit identifiant parmi les
+nœuds de son voisinage, il se de´clare cluster-head. Sinon, il attend que tous ses voisins
+ayant un identifiant plus petit que le sien aient déclaré leur statut. Si au moins l’un d’eux
+s’est déclaré chef, u déclare à son voisinage son statut de nœud ordinaire. u appartient
+alors à chacun des clusters de ses voisins s’étant déclarés chefs. Si tous les voisins de u
+ayant un identifiant plus petit que celui de u se sont de´clare´s nœuds ordinaires (car ils
+2.1. CLUSTERS A` 1 SAUT 15
+se sont attache´s a` un autre de leur voisin de plus petit ID), u se de´clare cluster-head.
+Une fois que chaque nœud a de´clare´ son statut de nœud ordinaire ou de cluster-head,
+si un nœud entend parmi ses voisins plus d’un cluster-head, il se de´clare passerelle.
+Le protocole LCA est notamment utilise´ par le routage CBRP (Cluster Based Routing
+Protocol) [42], pour la formation des clusters.
+Par la suite, avec le protocole HCC (High Connectivity Clustering), Gerla et Tsai [36]
+ont cherche´ a` apporter plus de stabilite´ a` la structure de clusters forme´s par le LCA, en
+utilisant le degre´ des nœuds plutoˆt que leur identifiant. Le nœud ayant le plus fort degre´
+dans son voisinage se de´clare cluster-head. Si deux voisins ont le meˆme degre´, c’est ce-
+lui de plus petit identifiant qui prend sa de´cision le premier. L’ide´e est que des nœuds
+de fort degre´ sont de bons candidats pour eˆtre cluster-heads car ils couvrent un grand
+nombre de nœuds et le nombre de clusters re´sultant en sera re´duit. Par ailleurs, l’identi-
+fiant d’un nœud e´tant unique, un nœud de faible ID aura tendance a` rester cluster-head
+longtemps, malgre´ la mobilite´ des nœuds. Ne´anmoins, si ce nœud est tre`s mobile, il
+de´truira constamment la structure.
+Ainsi, ces protocoles construisent des clusters a` 1 saut qui se recouvrent (les passerelles
+appartiennent a` plusieurs clusters). Cette structure a e´te´ propose´e pour acheminer les
+messages de controˆle et de routage ou` seuls les cluster-heads et les passerelles agissent.
+Leur maintenance s’ave`re couˆteuse car le mouvement d’un nœud peut engendrer des
+re´actions en chaıˆne et ne´cessiter une reconstruction totale de la structure. C’est pour-
+quoi les auteurs de [24] ont propose´ ”Least Cluster Change” (LCC). LCC ajoute une
+e´tape de maintenance des clusters forme´s avec le LCA ou le HCC. Les clusters ne
+sont reconstruits que si deux cluster-heads se retrouvent voisins (le nœud de plus faible
+degre´ et/ou de plus fort ID suivant le cas abandonne le roˆle de cluster-head) ou si un
+nœud ordinaire n’a plus aucun cluster-head dans son voisinage (il relance le processus
+de clustering). De cette fac¸on, LCC ame´liore la stabilite´ de la structure. Cependant, les
+re´actions en chaıˆne de re-construction ne sont que limite´es et ne sont pas comple`tement
+supprime´es du fait qu’un seul nœud peut re-lancer la proce´dure de clustering s’il n’a
+plus aucun cluster-head dans son voisinage.
+Le protocole MOBIC [13], autre protocole de clustering a` 1 saut, applique le meˆme
+algorithme que LCA et HCC mais utilise une me´trique base´e sur la mobilite´ plutoˆt que
+le degre´ ou l’identifiant des nœuds. Cette me´trique cherche a` caracte´riser la mobilite´
+relative d’un nœud. L’ide´e est qu’un nœud peu mobile est un bon candidat pour eˆtre
+cluster-head car stable. Pour calculer sa mobilite´ relative, un nœud mesure le niveau
+de signal qui l’unit a` chacun de ses voisins. La mobilite´ d’un nœud u est calcule´e a`
+partir des rapports entre ce niveau de signal et celui mesure´ a` l’e´tape pre´ce´dente pour
+chaque voisin de u, l’atte´nuation du signal e´tant de´pendante de la distance se´parant les
+nœuds. Le nœud dont la mobilite´ est la plus faible dans son voisinage devient cluster-
+head. Les auteurs de MOBIC utilisent l’algorithme LCC pour la maintenance de leur
+structure en ajoutant une re`gle supple´mentaire : si deux cluster-heads u et v arrivent
+dans le voisinage l’un de l’autre, le cluster-head v de plus fort identifiant n’abandonne
+son roˆle de cluster-head que si u fait toujours partie de ses voisins apre`s une certaine
+pe´riode de temps. Cela permet de ne pas reconstruire la structure si deux cluster-heads
+ne se retrouvent voisins que pour une courte pe´riode. La mobilite´ des nœuds n’est plus
+reconside´re´e par la suite a` moins d’avoir a` reconstruire toute la structure. Cependant, les
+16 CHAPITRE 2. E´TAT DE L’ART
+inconve´nients du LCC ne sont pas e´limine´s. Bien que la prise en compte de la mobilite´
+des nœuds semble inte´ressante pour de´terminer les cluster-heads, cette me´thode est un
+peu complexe et ne´cessite que les nœuds soient en mesure d’estimer les puissances de
+signal. De plus, elle ne conside`re pas certains phe´nome`nes physiques qui provoquent
+des atte´nuations he´te´roge`nes du signal.
+Plutoˆt que d’utiliser l’identifiant ou le degre´ des nœuds, d’autres protocoles de clus-
+tering utilisent une somme ponde´re´e de plusieurs me´triques. Cette cate´gorie d’algo-
+rithmes vise a` e´lire le cluster-head le plus adapte´ a` une topologie pour une utilisation
+donne´e. Par exemple, dans un re´seau de senseurs ou` l’e´nergie est un facteur impor-
+tant, le parame`tre d’e´nergie re´siduelle peut obtenir un poids plus e´leve´ dans la somme
+ponde´re´e de la me´trique re´sultante. WCA [20] est un protocole utilisant une somme
+pondérée de quatre critères : la différence de degré $D_v$, la somme des distances avec
+les voisins $P_v$, la vitesse relative moyenne $M_v$ et le temps de service en tant que cluster-
+head. Pour un nœud v, la différence de degré $D_v$ est la différence entre le degré de v
+et une constante M représentant le nombre de nœuds qu’un cluster-head peut servir.
+Cependant, les auteurs n’explicitent pas le moyen de déterminer M. La mobilité rela-
+tive $M_v$ est obtenue comme dans MOBIC. Les distances $P_v$ entre v et ses voisins sont
+calculées à l’aide d’un GPS. L’élection se fait en se basant là encore sur l’algorithme
+de LCA, le nœud dont la somme ponde´re´e de ces crite`res est la plus petite devenant
+cluster-head. Les clusters sont ensuite maintenus sans plus reconside´rer la me´trique
+ponde´re´e. Le processus de clustering est relance´ quand un nœud arrive dans une zone
+couverte par aucun cluster-head, ceci pouvant entraıˆner des re´actions de reconstruction
+en chaıˆne comme dans les algorithmes pre´ce´dents.
+Ainsi, plusieurs me´thodes de clustering a` 1 saut se basent sur l’algorithme du LCA
+et changent juste le crite`re de de´cision. C’est pourquoi Basagni, dans [12] reprend
+l’algorithme de LCA en donnant comme crite`re un poids ge´ne´rique que chacun de´finit
+comme il le souhaite. Il en e´tudie alors the´oriquement les diffe´rentes proprie´te´s.
+Toutes les me´thodes de clustering mentionne´es jusqu’a` maintenant produisent des clus-
+ters recouvrants, c.a`.d. une structure dans laquelle un nœud peut appartenir a` plusieurs
+clusters. Leur inconve´nient majeur est que le mouvement d’un nœud peut provoquer
+la re-construction d’un cluster, qui, par réaction en chaîne, provoque la re-construction
+de la structure entie`re. Afin d’e´viter cela, d’autres protocoles de clustering ont e´te´ pro-
+pose´s, produisant des clusters non re-couvrants : un nœud appartient a` exactement un
+cluster.
+Dans 3HBAC [82], les auteurs proposent un protocole qui impose trois sauts entre deux
+cluster-heads. Le nœud ayant le plus fort degre´ dans son voisinage se de´clare cluster-
+head. Ses voisins s’attachent a` lui et se de´clarent ”nœuds membres”. Les nœuds voisins
+de ces nœuds membres et non voisins d’un cluster-head se de´clarent ”unspecified” et ne
+peuvent plus eˆtre cluster-head. Lorsque deux cluster-heads se retrouvent dans le voisi-
+nage l’un de l’autre, celui de plus grand identifiant abandonne son roˆle de cluster-head
+et devient un nœud membre. Ses voisins deviennent soit membres (s’ils sont voisins du
+cluster-head) soit non spe´cifie´s. Les re´actions en chaıˆne de re-construction sont ainsi
+e´vite´es.
+Dans ”Adaptive Clustering” [50], les auteurs n’utilisent le statut de cluster-head que
+2.1. CLUSTERS A` 1 SAUT 17
+pour la formation des clusters. Une fois les clusters forme´s, la notion de cluster-head
+disparaıˆt, chaque nœud du cluster tenant alors le meˆme roˆle. La motivation des au-
+teurs est que les cluster-heads peuvent devenir des goulots d’e´tranglement par la suite,
+sources de perte de trafic et saturation de bande passante. De plus, les cluster-heads
+seraient appele´s a` de´penser leur e´nergie plus vite que les autres nœuds. Pour construire
+de tels clusters, chaque nœud maintient un ensemble Γ qui initialement contient les
+identifiants de tous ses 1-voisins. Un nœud n’est autorise´ a` diffuser son statut (cluster-
+head, membre, non spe´cifie´) que s’il posse`de un identifiant plus petit que les nœuds de
+Γ. Il ne se de´clare cluster-head que s’il a un identifiant plus petit que tous les nœuds
+de son ensemble Γ. Sur re´ception du statut d’un nœud u, les voisins de u suppriment
+u de leur ensemble Γ. Si u a annonce´ qu’il e´tait cluster-head, ses voisins s’attachent
+a` lui s’ils n’e´taient encore membres d’aucun cluster ou si le cluster-head auquel ils
+s’e´taient attache´s avait un identifiant plus grand que u. Le processus s’arreˆte lorsque
+l’ensemble Γ de chaque nœud est vide. Comme le roˆle de cluster-head disparaıˆt une
+fois les clusters formés, la maintenance de la structure est un peu différente de celle
+des cas précédents. Chaque nœud doit connaître son voisinage à deux sauts. De cette
+fac¸on, il sait si les membres de son cluster restent a` deux sauts de lui. Si deux nœuds
+du meˆme cluster se retrouvent e´loigne´s de plus de deux sauts, seul celui encore voisin
+du nœud de plus fort degre´ dans le cluster reste dans le cluster. L’autre doit se rattacher
+a` un autre cluster. Bien que n’utilisant pas la notion de cluster-head, la maintenance de
+cet algorithme maintient le nœud de plus fort degre´ au centre du cluster, ce qui peut
+revenir au meˆme que de l’e´lire comme cluster-head. Le protocole de maintenance de
+l’”Adaptive Clustering” a ensuite e´te´ repris par les auteurs de [44] qui se proposent de
+l’appliquer au LCA.
+Tous les algorithmes de´crits jusqu’a` pre´sent peuvent eˆtre qualifie´s de protocoles de
+”clustering actif”, c.a`.d. que des messages de controˆle sont envoye´s dans le but de
+construire et maintenir les clusters. A` l’oppose´, les auteurs de [47] proposent un proto-
+cole de ”clustering passif”, c.a`.d. qu’ils n’utilisent aucun message de´die´ a` la construc-
+tion des clusters. Les clusters ne sont cre´e´s que lorsque ne´cessaires, c.a`.d. lorsqu’un
+nœud a une information a` diffuser. Le protocole de clustering passif utilise alors ces
+messages d’information pour construire les clusters, en ajoutant des champs aux pa-
+quets d’information. Un nœud a quatre statuts possibles : cluster-head, passerelle, nœud
+ordinaire et non de´fini. Par de´faut, le statut des nœuds est non de´fini. Seul un nœud
+ayant un statut non de´fini peut devenir cluster-head. Si un tel nœud a un message a`
+envoyer, il se de´clare cluster-head et diffuse son statut en l’ajoutant a` l’information
+qu’il devait envoyer. Les nœuds voisins d’un cluster-head deviennent des nœuds or-
+dinaires, les nœuds voisins de plusieurs cluster-heads deviennent des passerelles. Les
+nœuds ordinaires ne relaient pas les messages de diffusion. Aucun message n’e´tant
+de´die´ a` la maintenance de la structure, les passerelles et les nœuds ordinaires activent
+des compteurs lorsqu’ils rec¸oivent des nouvelles de leur(s) cluster-head(s). S’ils restent
+sans nouvelle d’eux le temps que leur compteur expire, les nœuds ordinaires reprennent
+un statut non de´fini et les passerelles prennent le statut de nœud ordinaire ou non de´fini
+suivant le nombre de cluster-heads qu’elles entendent encore.
+Comme nous venons de le voir, il existe de nombreux protocoles de clustering a` 1
+saut. Les solutions les plus anciennes proposaient des clusters recouvrants. Ce type de
+18 CHAPITRE 2. E´TAT DE L’ART
+clusters permet principalement de baˆtir un ensemble dominant connecte´ sur le re´seau
+(constitue´ des cluster-heads et des passerelles) pour pouvoir diffuser une information
+(principalement pour le routage) sur le re´seau sans solliciter tous les nœuds. Puis
+d’autres e´tudes ont donne´ des clusters non-recouvrants, plus robustes face a` la mo-
+bilite´ des nœuds. Ce type de clusters permet e´galement d’autres applications comme la
+re´utilisation spatiale de fre´quences ou de codes (les nœuds de deux clusters non voisins
+peuvent utiliser la meˆme fre´quence). Puis, des propositions plus re´centes sont apparues
+permettant la construction de clusters a` k sauts, encore plus robustes et permettant de
+nouvelles applications comme l’application de zones de services ou de protocole de
+routage hie´rarchique.
+2.2 Clusters a` k sauts
+La me´thode la plus re´pandue pour la construction de clusters a` k sauts est une extension
+des algorithmes de clustering a` 1 saut. Par exemple, les auteurs de [23] ge´ne´ralisent
+l’algorithme de Lin et Gerla [50]. Leur algorithme suppose que chaque nœud connaıˆt
+ses voisins situe´s jusqu’a` k sauts de lui. Le nœud ayant le plus petit identifiant parmi
+les nœuds a` au plus k sauts de lui, diffuse son statut de cluster-head a` ses k-voisins.
+Lorsque tous les nœuds de son k-voisinage ayant un plus petit identifiant que lui ont dif-
+fuse´ leur de´cision d’eˆtre chef de cluster ou de s’attacher a` un autre chef, le nœud u
+peut prendre sa propre de´cision de s’attacher au nœud de son k-voisinage de plus pe-
+tit identifiant s’e´tant de´clare´ chef de cluster s’il existe, ou de cre´er son propre cluster
+sinon. De la même façon que pour les clusters à 1 saut, ce même algorithme est dé-
+cliné avec différentes métriques. Dans le même papier [23], les auteurs proposent
+e´galement d’utiliser le k-degre´ (δk) des nœuds (nombre de voisins a` au plus k sauts)
+pour de´terminer le cluster-head : le nœud de plus fort k-degre´ et de plus petit identifiant
+en cas d’e´galite´ est promu chef de cluster. Les clusters re´sultants sont des k-clusters
+(chaque nœud est a` au plus k sauts de son chef) recouvrants (un nœud peut appartenir a`
+plusieurs clusters). Deux chefs sont e´loigne´s d’au moins k + 1 sauts. Cependant, nous
+retrouvons les meˆmes inconve´nients que pour les algorithmes de clusters a` 1 saut, a`
+savoir qu’un petit changement de nœuds peut engendrer une reconstruction comple`te
+de la structure.
+Les auteurs de [67] introduisent une me´trique qu’ils appellent ”associativite´” qui se
+veut repre´senter la stabilite´ relative des nœuds dans leur voisinage. Pour chaque nœud,
+l’associativite´ comptabilise le temps que chacun des nœuds de son voisinage reste ef-
+fectivement dans son voisinage et en fait la somme sur chaque voisin. A` chaque pe´riode
+de temps, un nœud u conside`re quels sont ses voisins actuels de´ja` pre´sents lors de la
+pe´riode pre´ce´dente et ajoute +1 a` la valeur associe´e a` chacun d’eux. Si un voisin a
+disparu, la valeur qui lui e´tait associe´e passe a` 0, si un autre apparaıˆt, il prend la valeur
+1. A` chaque pe´riode de temps, l’associativite´ de u est la somme des valeurs associe´es a`
+chacun de ses voisins. Cette valeur prend donc en compte la stabilite´ de u (si u est rela-
+tivement stable dans son voisinage, il aura une forte associativite´) et le degre´ des nœuds,
+cette valeur n’e´tant pas normalise´e. L’algorithme de formation des clusters est le sui-
+vant. Un nœud conside`re les nœuds de son k-voisinage ayant un degre´ supe´rieur a` une
+2.2. CLUSTERS A` K SAUTS 19
+valeur seuil et e´lit parmi eux celui ayant la plus forte associativite´. Le plus fort degre´
+et le plus faible identifiant sont ensuite utilise´s pour rompre les e´galite´s. Les clusters
+re´sultants sont e´galement des k-clusters recouvrants mais qui visent a` eˆtre plus stables
+dans le temps et dans l’espace que ceux se basant sur le simple degre´ ou identifiant.
+Dans [51], Lin et Chu proposent une approche base´e sur aucune me´trique particulie`re.
+Lorsqu’un nœud u arrive dans le re´seau, il est en phase ”d’initialisation”. Il demande
+alors a` ses voisins s’ils sont comme lui en phase d’initialisation ou s’ils ont un cluster-
+head et dans ce cas, a` quelle distance ce cluster-head se situe-t-il. Si tous les voisins
+de u sont en phase d’initialisation, u s’e´lit chef de cluster et diffuse cette information.
+Tous les r-voisins de u qui n’ont aucun autre chef plus proche que u s’attachent au cluster
+de u. Sinon, u s’attache au cluster de son voisin dont le chef est le plus proche et a` au
+plus r sauts de lui. Si tous les cluster-heads des clusters de ses voisins sont a` plus de r
+sauts de u, u se de´clare chef de cluster et rallie a` son cluster tous ses voisins a` moins
+de r sauts dont le chef est plus e´loigne´ que u. Si deux cluster-heads se retrouvent a`
+moins de D sauts l’un de l’autre, D < r, le chef de cluster de plus faible identifiant doit
+céder son rôle et tous les membres de son cluster doivent se trouver un autre chef. Cette
+méthode de clustering est intéressante dans la mesure où elle produit des r-clusters non
+recouvrants où les chefs sont éloignés d’au moins D sauts. Cela assure une certaine
+stabilite´ a` la structure. Cependant, l’abandon du roˆle de cluster-head par un nœud peut
+engendrer de fortes re´actions en chaıˆne.
+Une approche plus originale est celle propose´e par Fernandess et Malkhi dans [32].
+Leur algorithme se de´compose en deux phases. La premie`re e´tape consiste a` trou-
+ver un arbre couvrant du re´seau base´ sur un ensemble dominant connecte´ de cardi-
+nalite´ minimale (MCDS). Les auteurs proposent d’utiliser l’algorithme de [2] pour
+construire le MCDS mais pre´cisent que n’importe quelle me´thode peut eˆtre utilise´e. La
+seconde phase de l’algorithme consiste en une partition de l’arbre couvrant en 2k-sous-
+arbres, un 2k-sous-arbre e´tant un arbre de diame`tre au plus 2k sauts. Chaque sous-arbre
+consiste en un k-cluster. Cependant, une telle approche a une complexite´ temporelle et
+une complexite´ en messages en O(n) (n e´tant le nombre de nœuds dans le re´seau)
+et est par conse´quent difficilement extensible. De plus, les auteurs n’abordent pas la
+maintenance d’une telle construction, qui ne semble pas triviale.
+Les auteurs de Max-Min d-cluster [4] utilisent l’identifiant des nœuds pour construire
+des k-clusters non recouvrants. Cependant, leur algorithme est un peu plus complexe
+que ceux vus jusqu’a` maintenant. Il se de´compose en trois phases. Lors de la premie`re
+phase, chaque nœud collecte l’identifiant de ses voisins jusqu’a` d sauts et en garde le
+plus grand qu’il diffuse de nouveau a` d sauts lors de la seconde phase. Chaque nœud
+garde alors le plus petit des identifiants qu’il rec¸oit lors de cette deuxie`me phase (le
+plus petit parmi les plus grands). La troisie`me e´tape consiste au choix du cluster-head
+base´ sur les identifiants collecte´s lors des deux phases pre´ce´dentes. Si un nœud u a
+vu passer son propre identifiant lors de la deuxie`me phase, il devient chef de cluster.
+Sinon, si u a vu passer un identifiant durant chacune des phases 1 et 2, il e´lit le nœud
+portant cet identifiant comme chef. Sinon, u e´lit comme chef le nœud de plus grand
+identifiant dans son d-voisinage. La structure résultante s’avère robuste, cependant la
+latence induite par l’algorithme est non ne´gligeable.
+20 CHAPITRE 2. E´TAT DE L’ART
+Dans [3], les meˆmes auteurs introduisent une notion d’identifiant virtuel. Le but est
+d’apporter une certaine e´quite´ entre les nœuds et d’e´viter qu’un meˆme nœud soit trop
+longtemps cluster-head et e´puise ainsi ses ressources, tout en assurant qu’il le reste
+suffisamment longtemps pour apporter une stabilite´ a` la structure. Les nœuds prennent
+le roˆle de cluster-head tour a` tour. Initialement, l’identifiant virtuel d’un nœud est e´gal
+a` son propre identifiant. A` chaque pe´riode de temps, chaque nœud non cluster-head
+incrémente de 1 son identifiant virtuel jusqu’à atteindre un maximum $MAX_{VID}$. Le
+nœud ayant l’identifiant virtuel le plus fort parmi ses k-voisins devient le cluster-head.
+En cas de conflits, c’est le nœud qui a le moins opéré en tant que chef qui devient
+cluster-head (et de plus fort identifiant normal si toujours égalité). Un nœud qui de-
+vient cluster-head ajoute à son ancienne valeur d’identifiant virtuel $MAX_{VID}$
+de fac¸on a` assurer qu’il conserve le plus fort identifiant virtuel et reste cluster-head.
+Un nœud reste cluster-head pendant une pe´riode de temps ∆(t) au bout de laquelle
+il passe son identifiant virtuel a` 0 et abandonne son roˆle de chef. Lorsque deux chefs
+entrent dans le voisinage l’un de l’autre, celui de plus faible identifiant virtuel aban-
+donne son roˆle. Dans le meˆme papier, les auteurs proposent e´galement une construction
+ou` l’identifiant virtuel de base serait le degre´ des nœuds. Cet algorithme permet donc
+la formation de k-clusters en assurant une certaine stabilite´ de la structure. Ne´anmoins,
+elle ne´cessite une synchronisation des nœuds afin que chacun se base sur la meˆme
+pe´riode de temps pour incre´menter son identifiant virtuel et surtout pour comptabili-
+ser la pe´riode durant laquelle il est cluster-head. Or, une synchronisation dans de tels
+re´seaux est non triviale et ne´cessite beaucoup de messages.
+Les auteurs de [45] proposent un autre type d’algorithme, formant cette fois des clusters
+sans chef de cluster. Pour cela, chaque nœud ne´cessite e´galement la connaissance de
+son k-voisinage. Un cluster est forme´ par un ensemble de nœuds tel qu’il existe entre
+deux nœuds de cet ensemble un chemin d’au plus k-sauts. Si k = 1, chaque cluster
+est une clique. Un nœud appartenant a` plusieurs clusters est dit nœud frontie`re. Les
+clusters sont donc recouvrants. Malheureusement, cet algorithme implique beaucoup
+de messages de controˆle, de maintenance et de donne´es a` ge´rer par les nœuds.
+Les auteurs de DDR [59] proposent e´galement une structure sans cluster-head. Contrai-
+rement a` la plupart des algorithmes de formation de k-clusters, les nœuds ne ne´cessitent
+que la connaissance de leur 1-voisinage. La formation des clusters se base sur la
+construction d’un arbre. Chaque nœud choisit comme pe`re son voisin de plus faible
+identifiant. Il existe alors exactement une areˆte sortante par nœud. Cela conduit a` la
+formation d’un arbre. Tous les nœuds du meˆme arbre appartiennent au meˆme cluster.
+Le diame`tre de tels clusters n’est pas fixe´ a priori et s’adapte automatiquement a` la to-
+pologie sous-jacente. Cet algorithme a e´te´ ensuite repris par Baccelli [7] en y ajoutant
+la notion de cluster-head et en controˆlant la taille des clusters. Pour cela, un nœud a
+le droit de se choisir comme pe`re s’il a le plus fort identifiant dans son 1-voisinage. Il
+existe alors des nœuds sans areˆte sortante qui deviennent des cluster-heads. Ces cluster-
+heads ont alors la possibilite´ de borner la hauteur des arbres a` d sauts en diffusant l’in-
+formation le long des branches de l’arbre. Si la branche est trop longue, le nœud se
+trouvant a` d+1 sauts de son cluster-head doit s’attacher a` un autre pe`re (et donc casser
+la branche).
+D’autres algorithmes comme ceux propose´s dans [39, 60] ne proposent qu’une solution
+2.3. CLUSTERS HIE´RARCHIQUES 21
+de maintenance. Par exemple, les auteurs de [60] proposent de maintenir un certain
+nombre de nœuds dans un cluster, qui de´pendrait du nombre d’entite´s que le cluster-
+head est en mesure de ge´rer. L’ide´e est de maintenir en permanence le nombre de nœuds
+entre deux seuils. Si un cluster est trop petit, le chef de cluster doit e´lire parmi ses
+clusters voisins celui le plus adapte´ pour une fusion, c’est-a`-dire celui dont le nombre
+de nœuds permet la fusion des deux clusters. Si aucun ne correspond, le chef de cluster
+doit de´terminer un cluster qui peut lui ce´der des entite´s pour un meilleur e´quilibrage du
+nombre de nœuds. Si les clusters sont trop gros, le chef doit e´lire parmi ses membres
+un autre cluster-head et scinder son cluster en deux. Il reste cluster-head d’un cluster
+re´sultant tandis que le nœud qu’il a e´lu devient chef du second cluster. Cette me´thode
+est cependant tre`s couˆteuse en calculs, latence et messages et supporte mal le passage
+a` l’e´chelle du re´seau.
+2.3 Clusters hie´rarchiques
+Il existe e´galement des propositions de structures hie´rarchiques a` plusieurs niveaux,
+c’est-a`-dire ou` les clusters sont ensuite regroupe´s en d’autres clusters de niveaux
+supe´rieurs et ainsi de suite. Bien que la majorite´ des algorithmes vus jusqu’a` main-
+tenant puissent être appliqués récursivement sur les clusters pour former des clusters de
+niveau supe´rieur, ils n’ont pas e´te´ e´crits dans ce but contrairement aux exemples que
+nous e´nonc¸ons ici.
+Dans [11], Banerjee et Khuller se basent sur un arbre couvrant, construit graˆce a` un
+parcours en largeur, pour la construction de k-clusters. Les clusters sont forme´s par
+branche, en fusionnant re´cursivement deux sous-arbres de l’arbre couvrant jusqu’a`
+obtenir une taille correcte. Le processus est alors re´-ite´re´ jusqu’a` obtenir un certain
+nombre de niveaux.
+Dans [5], les auteurs cherchent a` combiner les partitions physiques et logiques des
+nœuds ainsi que leur mobilite´. Pour cela, ils utilisent un GPS. Les auteurs supposent
+que les nœuds re´pondent a` un mode`le de mobilite´ de groupe. L’algorithme consiste
+ensuite a` regrouper en un meˆme cluster les nœuds proches ge´ographiquement et qui
+se déplacent à une vitesse semblable dans une même direction. Le processus est ensuite
+re´-ite´re´ jusqu’a` obtenir le nombre de niveaux voulu.
+La structure de cellules hie´rarchiques de SAFARI [69] est base´e sur une auto-se´lection
+des nœuds en tant que drums (cluster-heads). Le nombre de niveaux hie´rarchiques
+s’e´tablit automatiquement en fonction de la topologie sous-jacente des nœuds. Les
+clusters de niveau i sont groupe´s en clusters de niveau i+1 et ainsi de suite, les simples
+nœuds e´tant conside´re´s comme des cellules de niveau 0. Chaque cluster-head de niveau
+i se choisit un cluster-head de niveau i + 1. Tous les cluster-heads de niveau i ayant
+choisi le meˆme cluster-head de niveau i+ 1 appartiennent au meˆme cluster de niveau
+i + 1. Un cluster-head u de niveau i de´cide de monter ou descendre son niveau en
+fonction du nombre de cluster-heads de niveau i + 1 et i − 1 qui existent a` une cer-
+taine distance. S’il n’existe aucun cluster-head de niveau supe´rieur a` une distance plus
+petite que Di (Di constante de´pendant du niveau i du cluster-head) de u, u de´cide
+22 CHAPITRE 2. E´TAT DE L’ART
+d’augmenter son niveau. Si deux cluster-heads de meˆme niveau sont a` moins de h×Di
+(0 < h < 1, facteur d’hyste´resis) sauts, le cluster-head de plus grand identifiant des-
+cend son niveau. Un cluster-head de niveau i est e´galement cluster-head de tout niveau
+j tel que 0 < j < i. Cet algorithme construit des k-clusters hiérarchiques, où k dépend du
+niveau du nœud i : k = Di. D1 doit eˆtre fixe´. A` partir de la`, Di de´pendant de Di−1, le
+rayon des clusters de chaque niveau est fixe´. Cette structure hie´rarchique peut cepen-
+dant n’eˆtre utilise´e que dans un cadre pre´cis de routage, propose´ par les auteurs. Nous
+verrons cette utilisation plus en de´tail dans le chapitre 5.
+2.4 Conclusion
+Ainsi, il existe de nombreux protocoles de clustering dans la litte´rature. Tous cependant
+ne sont pas adapte´s a` une extension du re´seau comme nous avons pu le constater. En
+effet, des clusters a` 1 saut ne peuvent pas eˆtre utilise´s dans ce cadre du fait du nombre
+de clusters qu’ils généreraient sur de larges échelles et du fait que le moindre chan-
+gement a` l’e´chelle d’un nœud provoquerait une reconstruction de la structure. En effet,
+si le re´seau compte beaucoup d’entite´s, ces changements peuvent eˆtre fre´quents et mi-
+nimes a` l’e´chelle du re´seau. Les clusters a` k sauts sont moins de´veloppe´s. Beaucoup
+s’inspirent des protocoles de clustering a` 1 saut et en gardent les inconve´nients. Dans
+ma the`se, j’ai propose´ un nouvel algorithme de clustering a` k sauts pouvant s’adap-
+ter aux petites modifications du re´seau. Cet algorithme prend note des inconve´nients
+des protocoles existants et tente de les e´viter, comme nous le verrons de`s le chapitre
+suivant.
+Chapitre 3
+Algorithme de clustering, stable
+et robuste
+3.1 Introduction
+Notre principal objectif est de proposer un moyen d’utiliser des re´seaux sans fil tre`s
+denses. Comme nous l’avons vu, l’une des solutions possibles est d’introduire une
+hie´rarchie dans le re´seau en construisant des clusters. Afin de permettre une extensibi-
+lite´ totale et ne pas avoir a` reconstruire les clusters apre`s chaque mouvement individuel
+d’un nœud, nous avons cherche´ a` construire des clusters qui n’aient aucun parame`tre
+fixé à l’avance, qu’il s’agisse du rayon, du diamètre ou du nombre de nœuds par clus-
+ter. Ces parame`tres doivent s’adapter d’eux-meˆmes a` la topologie du re´seau, qui e´volue
+au cours du temps. De plus, l’heuristique se doit d’eˆtre distribue´e et asynchrone tout
+en minimisant le nombre d’informations a` e´changer. Notre algorithme n’utilise que
+des messages de type ”PAQUET HELLO” comme ceux utilise´s dans OLSR [25] afin
+de de´couvrir le 2-voisinage d’un nœud. Les clusters forme´s doivent eˆtre stables (les
+cluster-heads doivent conserver ce statut suffisamment longtemps pour limiter le trafic
+de controˆle ne´cessaire a` la reconstruction des clusters) tout en s’adaptant aux change-
+ments de la topologie sous-jacente. Enfin, afin d’ame´liorer la stabilite´ de la structure,
+e´tant donne´ que les nœuds trop mobiles pour initier une communication n’ont aucun
+besoin de la structure, ils ne participent pas a` la phase de construction et restent des
+nœuds inde´pendants. Dans le cas contraire, de par leur mobilite´, ils pourraient obliger
+le re´seau a` re-construire inutilement les clusters.
+Comme mentionne´ dans le chapitre 2, diffe´rentes me´triques ont e´te´ utilise´es pour le
+choix des cluster-heads dans les algorithmes de clustering. L’identifiant des nœuds
+e´tant immuable, il permet de conserver les chefs de cluster tre`s longtemps. Cependant
+de tels clusters sont inde´pendants de la topologie sous-jacente et ne sont pas toujours
+adapte´s. Le degre´ des nœuds s’ave`re l’une des me´triques les plus adapte´es, l’ide´e e´tant
+23
+24 CHAPITRE 3. ALGORITHME DE CLUSTERING
+qu’un chef de fort degre´ permet de couvrir un grand nombre de nœuds, ce qui per-
+met d’en minimiser le nombre. Cependant, un mouvement individuel d’un nœud dans
+des clusters base´s sur cette me´trique peut conduire a` une re´-organisation comple`te du
+re´seau, alors que la structure globale du re´seau reste inchange´e.
+Base´s sur cette constatation, nous avons introduit une nouvelle me´trique, que nous
+avons appele´e densite´. L’ide´e est que, si un petit changement de topologie intervient
+dans le voisinage d’un nœud, son degre´ δ peut changer alors que globalement son
+voisinage est conserve´. Notre me´trique est une densite´ de liens et cherche a` lisser les
+petits changements de topologie qui interviennent au niveau individuel d’un nœud, tout
+en permettant aux clusters de s’adapter a` la topologie sous-jacente.
+3.2 La me´trique de densite´
+La k-densite´ d’un nœud, note´e ρk(u), est le ratio du nombre de liens par le nombre de
+nœuds dans le k-voisinage d’un nœud.
+Définition 1 (densité) La k-densité d’un nœud u ∈ V est
+$$\rho_k(u) = \frac{\left|\{\, e = (v, w) \in E \mid w \in \{u\} \cup \Gamma_k(u) \text{ et } v \in \Gamma_k(u) \,\}\right|}{\delta_k(u)}$$
+La 1-densite´ (e´galement note´e ρ(u)) est donc le rapport entre le nombre de liens entre
+u et ses voisins plus le nombre de liens entre les voisins de u et le nombre de ses voisins
+(par de´finition, son degre´).
+Afin d’illustrer cette me´trique, prenons l’exemple repre´sente´ sur la Figure 3.1.
+Conside´rons le nœud p et calculons sa 1-densite´ ρ(p). ρ(p) est le ratio entre le nombre
+d’arêtes L(p) et le nombre de nœuds (|Γ(p)|) dans le 1-voisinage Γ(p) de p. Les nœuds
+de Γ(p) sont les nœuds gris fonce´ (Γ(p) = {a, b, c, d, e, f}). L(p) repre´sente alors le
+nombre de liens entre p et ces nœuds (liens en pointille´s) et le nombre de liens entre ces
+nœuds (liens tiret). Ainsi, L(p) = 4 + 6 = 10 et δ(p) = 6 d’ou` ρ(p) = 10/6 = 5/3.
+On remarquera que pour calculer ρk(p), p doit connaıˆtre Γk+1(p) afin de connaıˆtre les
+liens existant entre ses k-voisins.
+3.3 La formation des clusters
+Chaque nœud u surveille son voisinage et juge ainsi de sa mobilite´ relative. Si cette
+dernie`re n’est pas trop importante, alors u participe a` l’algorithme de clustering, si-
+non, il reste un nœud inde´pendant. L’ide´e est qu’un nœud trop mobile ne pourra pas
+instancier de communications avec les autres entite´s du re´seau. Il n’a donc pas besoin
+d’appartenir a` un cluster puisqu’il ne pourrait pas en tirer avantage. De meˆme, si un
+3.3. LA FORMATION DES CLUSTERS 25
+b a
+p f
+c
+d e
+FIG. 3.1 – Illustration de la me´trique de densite´.
+nœud trop mobile est pris en compte dans la construction des clusters, il risque de
+casser la structure inutilement de par les nombreuses cassures de liens induites par sa
+forte mobilite´ et obligera le re´seau a` reconstruire les clusters. Cette valeur de mobilite´
+relative d’un nœud u peut eˆtre calcule´e en ve´rifiant la constance du voisinage de u, en
+conside´rant par exemple le nombre de nœuds restant dans le voisinage de u pendant un
+certain temps.
+Pe´riodiquement, chaque nœud suffisamment stable calcule sa densite´ et la diffuse lo-
+calement a` son 1-voisinage. Chacun est alors en mesure de comparer sa propre densite´
+a` celle de ses voisins ”suffisamment stables”. A` partir de la`, un nœud de´cide soit de
+s’e´lire comme cluster-head (s’il posse`de la plus forte densite´), soit de choisir comme
+pe`re son voisin de plus forte densite´. En cas d’e´galite´, afin de privile´gier la stabilite´
+de la structure, le nœud choisi sera celui de´ja` e´lu au tour pre´ce´dent s’il est en course,
+sinon celui de plus petit identifiant. De cette fac¸on, deux voisins ne peuvent pas eˆtre
+tous deux cluster-heads. Cette me´thode d’e´lection construit implicitement une foreˆt
+couvrante oriente´e.
+Si un nœud u choisit le nœud w, on dit que w est le pe`re de u (note´ P(u) = w)
+dans l’arbre de clustering et que u est un fils de w (note´ u ∈ Ch(w)). Si aucun nœud
+n’a e´lu le nœud u comme pe`re (Ch(u) = ∅), u est une feuille d’un des arbres, sinon,
+u est qualifie´ de nœud interne. Le pe`re d’un nœud peut s’eˆtre choisi comme pe`re un
+autre nœud de son voisinage et ainsi de suite. Un arbre s’e´tend automatiquement, sans
+contrainte sur sa hauteur, jusqu’a` atteindre les frontie`res d’un autre arbre. Tous les
+nœuds appartenant au meˆme arbre appartiennent alors au meˆme cluster. Afin d’apporter
+une stabilite´ plus importante, un chef de cluster ne doit pas eˆtre trop excentre´ dans son
+propre cluster. En effet, si un chef de cluster se trouve a` la frontie`re de son cluster et
+qu’il bouge, il a plus de chance d’entrer en compe´tition avec un autre chef et ainsi de
+casser les deux clusters. C’est pourquoi, nous ajoutons une re`gle supple´mentaire qui
+indique que tout nœud voisin d’un cluster-head doit s’attacher a` ce cluster-head. Si un
+nœud est voisin de plusieurs cluster-heads, une fusion est instancie´e entre ces clusters
+et le cluster re´sultant a pour chef le cluster-head en compe´tition de plus forte densite´.
+De cette fac¸on, deux cluster-heads sont distants de 3 sauts minimum. Supposons un
+nœud u voisin d’un chef de cluster H ( H ∈ Γ1(u)) mais qui ne l’a pas choisi comme
+père (P(u) ≠ H), alors, deux cas sont possibles :
+– soit le pe`re de u est e´galement cluster-head ; dans ce cas les deux clusters fusionnent.
+26 CHAPITRE 3. ALGORITHME DE CLUSTERING
+Le cluster-head final est le nœud le plus fort parmi ceux en compe´tition : P(u).
+(Puisque u pouvait choisir entre H et P(u) et a choisi P(u)). H n’est plus cluster-
+head, il choisit u comme son pe`re ;
+– soit le pe`re de u s’est attache´ a` un autre de ses voisins et n’est pas cluster-head ; cela
+signifie que u se situe a` au moins deux sauts de son chef. Il change alors de pe`re et
+choisit H.
+Étant donné un nœud v ∈ V, pour tout nœud u ∈ Γ1(v), on définit Age(u)
+comme le nombre de périodes successives où un nœud u a choisi v comme père. On
+définit également ≺ comme un indicateur d’ordre binaire tel que, pour (u, v) ∈ V²,
+u ≺ v si et seulement si {ρk(u) < ρk(v)} ou {ρk(u) = ρk(v) ∧ Age(u) < Age(v)}
+ou {ρk(u) = ρk(v) ∧ Age(u) = Age(v) ∧ Id(v) < Id(u)}.
+L’algorithme s’auto-stabilise quand chaque nœud connaıˆt l’identite´ de son cluster-head.
+Algorithm 1 Formation des clusters
+Pour tout nœud u ∈ V
+⊲ Initialisation des variables.
+H(u) = P(u) = −1
+∀v ∈ Γ1(u), Age(v) = 0
+while ((H(u) = −1) ou (H(u) ≠ Hold(u)))
+⊲ Boucle jusqu’a` stabilisation
+Hold(u) = H(u)
+Scrutation du voisinage
+Calcul de la valeur de mobilite´
+if (Mobilite < SeuilMobilite)
+Re´cupe`re Γk+1(u)
+Calcule ρk(u)
+Diffuse localement ρk(u) a` ses 1-voisins.
+⊲ Cette diffusion locale peut s’effectuer par exemple en ajoutant la valeur de ρk(u) dans
+un paquet HELLO.
+⊲ A` ce moment, le nœud u connaıˆt la k-densite´ de tous ses voisins et peut choisir son pe`re.
+if (∀v ∈ Γ1(u), v ≺ u) then H(u) = u ⊲ u devient cluster-head.
+else
+⊲ ∃w ∈ Γ1(u) t.q.∀v ∈ {u} ∪ Γ1(u), v ≺ w
+P(u) = w
+H(u) = H(w)
+⊲ Soit P(w) = H(w) = w donc u est directement lie´ a` son chef de cluster, soit w
+a choisi un autre nœud x comme pe`re (∃ x ∈ Γ1(w) | P(w) = x) et re´cursivement
+H(u) = H(w) = H(x).
+end
+if ((H(u) = u) et (∃v ∈ Γ1(u) | P(v) ≠ u)) then
+⊲ u est cluster-head, mais tous ses voisins ne l’ont pas choisi comme pe`re.
+if (P(v) = H(v)) then
+⊲ Au moins deux cluster-heads (H(u) et H(v)) ont un voisin commun v. Si P(v) =
+H(v) alors u ≺ H(v). u s’e´crase et choisit v comme pe`re (les clusters C(u) et C(v)
+fusionnent).
+P(u) = v et H(u) = H(v)
+Age(v)++ et ∀w ∈ Γ1(u), Age(w) = 0.
+end
+3.3. LA FORMATION DES CLUSTERS 27
+end
+if (∃v ∈ Γ1(u) t.q. {(H(v) = v) et (H(P(u)) ≠ H(u))})
+⊲ u n’est pas chef et est a` plus de 2 sauts de son chef (son pe`re n’est pas chef) alors qu’il
+compte un chef parmi ses voisins. Il change de pe`re.
+P(u) = v et H(u) = v
+Age(v)++ et ∀w ∈ Γ1(u)Age(w) = 0.
+end
+Diffuse localement P(u) et H(u)
+end
+Exemple
+Afin d’illustrer cette heuristique, exe´cutons l’Algorithme 1 sur le graphe de la figure 3.2
+en conside´rant la 1-densite´. Dans le 1-voisinage du nœud a, on a deux voisins (Γ1(a) =
+{d, i}) et deux liens ({(a, d), (a, i)}), d’ou` ρ(a) = 1 ; le voisinage du nœud b compte
+4 voisins (Γ1(b) = {c, d, h, i}) et cinq liens ({(b, c), (b, d), (b, h), (b, i), (h, i)}), d’ou`
+ρ(b) = 5/4. La table 3.1 montre les valeurs finales des densités des nœuds.
+c b h e
+j
+l
+d
+g
+i
+a k
+f m
+FIG. 3.2 – Exemple.
+Nœuds a b c d e f g h i j k l m
+Degre´ 2 4 1 4 2 2 2 3 4 2 4 2 2
+Nb Liens 2 5 1 5 2 3 2 4 5 3 5 3 3
+Densite´ 1 1.25 1 1.25 1 1.5 1 1.33 1.25 1.5 1.25 1.5 1.5
+TAB. 3.1 – Densite´ des nœuds du graphe de la figure 3.2.
+Dans cet exemple, le nœud c e´lit son voisin b (P(c) = b) dont la densite´ est la plus
+forte dans Γ1(c) ∪ {c} (∀v ∈ Γ1(c) ∪ {c} , v ≺ b). Le nœud de plus forte densite´
+dans le voisinage de b est h, d’ou` P(b) = h. Comme h a la plus forte densite´ dans
+son voisinage, il devient son propre pe`re et donc cluster-head : H(h) = h. Le nœud
+c choisit b qui choisit h et tous trois appartiennent au meˆme cluster de cluster-head
+h et donc : H(c) = H(b) = H(h) = h. ρ(j) = ρ(f) : ni j ni f n’e´taient choisis
+auparavant, c’est donc le plus petit identifiant qui tranche. Supposons j ≺ f , alors
+P(j) = f et P(f) = f d’où H(f) = H(j) = f. Aucun nœud n’ayant choisi a, j, c, e,
+i, g et m comme pe`re, ils deviennent des feuilles. Finalement, nous obtenons une foreˆt
+couvrante du re´seau, compose´e de trois arbres de racines h, l et f (figure 3.3(a)), qui
+donnent naissance a` trois clusters (figure 3.3(b)).
+28 CHAPITRE 3. ALGORITHME DE CLUSTERING
+c b h e c b h e
+j j
+l l
+d d
+g g
+i i
+a k a k
+f m f m
+(a) Arbres de clustering. (b) Clusters.
+FIG. 3.3 – Arbres (a) et clusters (b) construits avec l’Algorithme 1 sur le graphe de la
+figure 3.2 (Les cluster-heads/racines apparaissent en blanc).
+3.4 Maintenance de la structure
+La maintenance de cette structure construite a` partir de l’heuristique de la k-densite´
+est simple, e´tant donne´ que chaque nœud n’a besoin que de son k + 1-voisinage pour
+la construire. En effet, d’apre`s la taxonomie e´tablie par [81], un algorithme peut eˆtre
+qualifie´ de local si chaque nœud n’a besoin que de la connaissance de son 1 et 2 voi-
+sinage pour l’exe´cuter, ou de quasi-local, si les nœuds ne´cessitent une information
+dans un voisinage borne´. Cela implique une maintenance rapide. Chaque nœud calcule
+pe´riodiquement ses valeurs de mobilite´ et de densite´. S’il est suffisamment stable, il
+compare sa densite´ a` celle de ses voisins et choisit pe´riodiquement son pe`re. Un nœud
+non stable a` l’origine et dont le voisinage se stabilise peut ainsi s’attacher a` la structure
+sans la de´truire.
+3.5 Analyse de la me´trique
+Dans cette section, nous nous sommes inte´resse´s aux diffe´rentes caracte´ristiques de
+notre me´trique de densite´.
+Dans un premier temps, nous avons calcule´ sa valeur the´orique moyenne a` l’aide de la
+ge´ome´trie stochastique et des calculs de Palm. Puis, nous avons compare´ les diffe´rentes
+k-densite´s. Nous verrons ainsi que la 1-densite´ est non seulement la densite´ la moins
+couˆteuse mais e´galement la plus stable face a` la mobilite´ des nœuds et que les cluster-
+heads se´lectionne´s agissent comme des bassins d’attraction. Nous terminerons cette
+partie par une analyse de la re´partition des valeurs de densite´ parmi les nœuds du
+re´seau.
+3.5.1 Recherche de la meilleure k-densite´
+Nous nous sommes interroge´s sur les diffe´rentes k-densite´s : laquelle est la plus
+ade´quate ? En effet, nous avons vu que pour calculer une k-densite´, chaque nœud doit
+connaıˆtre son k+1 voisinage. Ainsi, plus k augmente, plus la k-densite´ est couˆteuse en
+3.5. ANALYSE DE LA ME´TRIQUE 29
+messages, utilisation de bande passante et latence. C’est pourquoi, nous avons compare´
+par simulation les structures forme´es par la 1-densite´ et la 2-densite´.
+Comme le montre la table 3.2, la 2-densite´ construit moins de clusters que la 1-densite´.
+Un nœud est plus excentre´ dans son cluster avec k = 2. Ne´anmoins, ces caracte´ristiques
+tre`s similaires ne nous permettent pas de trancher entre les diffe´rentes densite´s. C’est
+pourquoi, nous avons e´galement compare´ le comportement des structures obtenues
+avec les densite´s 1 et 2 face a` la mobilite´ des nœuds. En effet, la densite´ la plus
+inte´ressante sera celle qui offre la meilleure stabilite´, c.a`.d qui reconstruit moins sou-
+vent les clusters lorsque les nœuds se de´placent, limitant ainsi les e´changes de messages
+de controˆle et de mise a` jour des tables de routage. Un nœud peut quitter son cluster et
+migrer dans un autre sans que cela ne casse la structure de clusters.
+750 nœuds 3000 nœuds 5000 nœuds
+k-densite´ 1 2 1 2 1 2
+Nb clusters 4.67 3.01 4.23 2.53 4.42 2.43
+D(C) 7.1 9.72 9.25 11.67 9.4 12.15
+e˜(u/C) 4.86 6.45 6.21 7.03 6.02 8.42
+TAB. 3.2 – Comparaison des k-densite´s.
+Pour cela, nous avons simule´ un re´seau ou` les nœuds peuvent choisir ale´atoirement
+de bouger a` diffe´rentes vitesses allant de 0 a` 1.6m/s (pie´tons) dans des directions
+ale´atoires (Mode`le de mobilite´ Random Way Point) pendant 500s . La table 3.3 donne
+le nombre moyen de reconstructions de clusters durant la simulation.
+Moy Min Max
+1-densite´ 7.5 2 13
+2-densite´ 9.4 4 14
+TAB. 3.3 – Nombre de clusters re-construits après mobilité des nœuds.
+La 2-densite´ reconstruit plus souvent la structure que la 1-densite´. La 1-densite´ s’ave`re
+donc la densite´ la plus robuste et la moins couˆteuse puisqu’elle ne ne´cessite la connais-
+sance que du 2-voisinage d’un nœud, tout comme dans OLSR. De plus, utiliser une
+k-densite´ avec k > 2 serait trop couˆteux et impliquerait une maintenance moins effi-
+cace. C’est pourquoi, par la suite, on ne conside´rera que la 1-densite´.
+3.5.2 Densite´ moyenne
+Nous analysons ici la 1-densite´ moyenne ρ˜(u) d’un nœud u. On conside`re un re´seau
+sans fil multi-sauts ou` les nœuds sont distribue´s suivant un processus de Points de Pois-
+son d’intensite´ constante λ. Nous calculons alors la 1-densite´ moyenne en conside´rant
+une distribution de Palm. Dans une telle distribution, un nœud 0 est artificiellement
+30 CHAPITRE 3. ALGORITHME DE CLUSTERING
+ajoute´ a` la distribution poissonienne. Ce nœud 0, place´ a` l’origine du plan, sert de base
+d’observation pour les calculs. Sous la probabilite´ de Palm, ce nœud existe presque
+suˆrement. Puisque le processus est stationnaire, la densite´ moyenne de 0 est valide
+pour tout autre point du processus.
+Soit ρ(0) la densite´ moyenne du nœud 0. Φ de´signe le processus ponctuel : Φ(S)
+repre´sente le nombre de points du processus se trouvant sur une surface S donne´e.
+Soit $B(u, R)$ la boule de centre u et de rayon R et $B'_u$ la boule centrée en u de rayon
+R privée du singleton {u} : $B'_u = B(u, R) \setminus \{u\}$. $E^o$ et $P^o$ désignent respectivement
+l’espérance et la probabilité sous la distribution de Palm.
+Nous cherchons donc à calculer la densité moyenne $\tilde{\rho}(u) = E^o[\rho(0)]$ d’un nœud quel-
+conque u.
+Lemme 1 La 1-densité moyenne de tout nœud u s’écrit :
+$$\tilde{\rho}(u) = E^o[\rho(0)] = 1 + \frac{1}{2}\left(\pi - \frac{3\sqrt{3}}{4}\right)\left(\lambda R^2 - \frac{1 - \exp\{-\lambda \pi R^2\}}{\pi}\right)$$
+La preuve de ce lemme est donne´e en annexes 3.11.1. L’ide´e est de compter le nombre
+de liens dans le voisinage d’un nœud. Un lien existe entre deux nœuds s’ils sont a`
+une distance infe´rieure ou e´gale a` R. Si v est un voisin de u, alors, il existe autant
+de liens entre v et un autre voisin de u que de voisins communs a` u et v (nœuds a`
+distance infe´rieure a` R a` la fois de u et de v). Le nombre de voisins communs a` u et v
+correspond au nombre de points se trouvant a` l’intersection des zones de transmission
+de u et v. Cette surface est la zone repre´sente´e en bleu sur la figure 3.4. Par la suite,
+nous de´noterons par A(r) cette surface. Le calcul de ρ˜ consiste a` sommer le nombre
+de points se trouvant en moyenne dans cette zone pour chacun des voisins v de u en
+fonction de la distance euclidienne r de u a` v. Les liens e´tant ainsi compte´s deux fois,
+la somme finale est divise´e par deux.
+R u v R
+r
+FIG. 3.4 – Intersection du voisinage de deux nœuds voisins u et v. Les nœuds se trou-
+vant dans la zone bleue sont des voisins communs a` u et v.
+3.6. ANALYSE DE LA STRUCTURE 31
+Afin de ve´rifier la validite´ de nos re´sultats analytiques, nous avons compare´ les valeurs
+de densite´ moyenne obtenues par analyses et par simulation. Le mode`le de simulation
+utilise´ est celui de´crit dans le Chapitre 1.1. La table 3.4 donne les re´sultats pour une
+valeur de R = 0.1 et diffe´rentes valeurs d’intensite´ λ du processus de Poisson. Notons
+que la the´orie et la simulation s’accordent parfaitement.
+500 nœuds 600 nœuds 700 nœuds
+The´orie Simulation The´orie Simulation The´orie Simulation
+δ˜ 15.7 15.3 18.8 18.3 22.0 21.2
+ρ˜ 4.7 5.0 5.6 5.9 6.5 6.8
+800 nœuds 900 nœuds 1000 nœuds
+The´orie Simulation The´orie Simulation The´orie Simulation
+δ˜ 25.1 25.0 28.3 27.9 31.4 31.0
+ρ˜ 7.5 7.1 8.4 8.6 9.3 9.4
+TAB. 3.4 – Degre´ et densite´ moyens des nœuds.
+3.5.3 Re´partition des valeurs de densite´
+La figure 3.5 montre comment les valeurs de densite´ sont re´parties. La figure 3.5(a)
+donne le nombre de nœuds ayant une valeur de densite´ donne´e. Les barres verticales
+indiquent les valeurs prises par les cluster-heads. La figure 3.5(b) donne un exemple
+de distribution des densite´s dans le plan. Les cluster-heads apparaissent en bleu. Plus
+la couleur des nœuds est jaune, plus leur densite´ est forte. Nous pouvons constater que
+dans chaque cluster, les densite´s les plus fortes se situent autour des chefs de cluster.
+Plus un nœud est loin d’un cluster-head, plus sa densite´ est faible. Les cluster-heads
+forment des sortes de bassin d’attraction, ce qui apporte une stabilite´ a` la structure.
+3.6 Analyse de la structure
+Afin de pouvoir au mieux utiliser la structure de clusters forme´e par notre heuristique,
+nous en avons e´tudie´ certaines caracte´ristiques par simulation et quand nous le pou-
+vions, par analyse the´orique en utilisant la ge´ome´trie stochastique.
+3.6.1 Analyse the´orique du nombre de clusters
+Dans cette section, nous avons cherche´ a` calculer analytiquement le nombre de clus-
+ters (ou de cluster-heads) produit par l’algorithme de clustering (algorithme 1). Comme
+pour le calcul de la densite´ moyenne (section 3.5.2), nous utilisons la ge´ome´trie sto-
+chastique suivant le mode`le de´fini dans la section 1.1.
+32 CHAPITRE 3. ALGORITHME DE CLUSTERING
+(a) Histogramme. Nombre de nœuds du re´seau ayant une (b) Plus la couleur est rouge, plus la
+densite´ donne´e. densite´ est grande. Cluster-heads en
+bleu.
+FIG. 3.5 – Distribution des valeurs de densite´ parmi les nœuds. Les cluster-heads ap-
+paraissent en bleu. Plus la couleur des nœuds est jaune, plus leur densite´ est forte.
+Nous utilisons les meˆmes notations et la meˆme mode´lisation que pre´ce´demment, a`
+savoir que l’on conside`re un re´seau sans fil multi-sauts ou` les nœuds sont distribue´s
+suivant un processus ponctuel de Poisson Φ d’intensite´ constante λ.
+On cherche dans un premier temps a` calculer le nombre de clusters (ou cluster-heads)
+dans un espace C.
+Lemme 2 Le nombre moyen de cluster-heads appartenant a` un domaine C est :
+$$E[\text{Nombre de cluster-heads dans } C] = \lambda\, \nu(C)\, P^o_\Phi(0 \text{ est chef})$$
+où ν(C) représente la mesure de Lebesgue¹ dans ℝ².
+Pour de´terminer le nombre moyen de cluster-heads, il nous faut donc dans un premier
+temps calculer $P^o_\Phi(0 \text{ est chef})$, probabilité qu’un nœud soit chef. Les nœuds étant dis-
+tribue´s uniforme´ment et inde´pendamment, cette probabilite´ est la meˆme pour tous les
+nœuds. Cela revient a` calculer la probabilite´ qu’un nœud ait la plus forte densite´ dans
+son voisinage.
+Lemme 3 La probabilité qu’un point 0 soit chef sous la probabilité de Palm est :
+$$P^o_\Phi(0 \text{ est chef}) = P^o_\Phi\left(\rho(0) > \max_{k=1,\dots,\Phi(B'_0)} \rho(Y_k)\right)$$
+Nous avons cherche´ a` calculer cette quantite´ mais n’avons pu obtenir qu’une borne
+supe´rieure.
+¹ La mesure de Lebesgue sur ℝ d’un intervalle coïncide avec sa longueur, la mesure de Lebesgue d’une
+région de l’espace sur ℝ² coïncide avec la surface de cet espace. Pour une définition plus formelle, se référer
+à [76], chapitre 1.
+3.6. ANALYSE DE LA STRUCTURE 33
+Conjecture 1 Une borne supérieure pour la probabilité qu’un nœud soit chef est :
+$$P^o_\Phi\left(\rho(0) > \max_{k=1,\dots,\Phi(B'_0)} \rho(Y_k)\right) \le \left(1 + \sum_{n=1}^{+\infty} \frac{1}{n}\,\frac{(\lambda \pi R^2)^n}{n!}\right) \exp\{-\lambda \pi R^2\}$$
+Les de´tails du calcul sont donne´s en annexes 3.11.2. L’ide´e est dans un premier temps
+de conditionner la probabilite´ que 0 soit chef par le fait qu’il ait ou non des voisins. Si
+0 n’a pas de voisin, 0 est chef avec la probabilite´ 1. Dans le cas contraire, on majore
+cette probabilite´ par la probabilite´ qu’un voisin v de 0 ait la plus forte densite´ parmi
+Γ(0), les voisins de 0, probabilite´ que l’on peut calculer sous Palm.
+La figure 3.6 repre´sente la borne supe´rieure du nombre de clusters pour diffe´rentes
+valeurs de R et de λ (avec R diminuant de bas en haut). On peut voir que lorsque
+l’intensité des nœuds augmente, la borne supérieure du nombre de clusters tend
+asymptotiquement vers une constante, ce qui permet a` notre structure de supporter le
+passage a` l’e´chelle du re´seau.
+Upper bound of the number of clusters in function of the process intensity
+160
+140
+120
+100
+80
+60
+40
+500 1000 1500 2000 2500 3000
+lambda
+FIG. 3.6 – Borne supe´rieure du nombre de clusters en fonction de λ (en abscisse) et de
+R (diffe´rentes courbes : de bas en haut R = 0.1, 0.09, 0.08, 0.07, 0.06, 0.05 m).
+3.6.2 Caracte´ristiques des clusters
+Les re´sultats donne´s dans cette section ont e´te´ obtenus par simulation, en utilisant le
+mode`le de´crit dans la section 1.1. La table 3.5 re´sume les caracte´ristiques principales
+des clusters pour R = 0.1 et diffe´rentes valeurs de λ.
+On remarquera que malgre´ l’augmentation de l’intensite´ des nœuds, l’excentricite´
+moyenne e˜(u/C) d’un nœud dans son cluster et la hauteur moyenne des arbres de
+clustering restent constantes, du fait du nombre constant de clusters. Ceci va s’avérer
+eˆtre un atout lors de l’utilisation de notre structure pour effectuer une diffusion (cf.
+chapitre 4) ou pour router sur cette structure (cf. chapitre 5). Nous pouvons e´galement
+noter qu’une grande partie des nœuds sont des feuilles dans l’arbre de clustering (en-
+viron 75%). Comme nous le verrons dans le chapitre 4, cette proprie´te´ va elle aussi
+s’ave´rer fort utile lors d’une diffusion d’un message sur une telle structure.
+34 CHAPITRE 3. ALGORITHME DE CLUSTERING
+500 nœuds 600 nœuds 700 nœuds
+# clusters/arbres 11.76 11.51 11.45
+e˜(u/C) 3.70 3.75 3.84
+e˜(H(u)/C(u)) 3.01 3.09 3.37
+Hauteur des arbres 3.27 3.34 3.33
+% feuilles 73,48% 74,96% 76,14%
+Degre´ dans l’arbre des nœuds non feuilles 3.82 3.99 4.19
+Voronoı¨ : distance euclidienne 84.17% 84.52% 84.00%
+Voronoı¨ : nombre de sauts 85.43% 84.55% 84.15%
+800 nœuds 900 nœuds 1000 nœuds
+# clusters/arbres 11.32 11.02 10.80
+e˜(u/C) 3.84 3.84 3.84
+e˜(H(u)/C(u)) 3.17 3.19 3.23
+Hauteur des arbres 3.34 3.43 3.51
+% feuilles 76,81% 77,71% 78,23%
+Degre´ dans l’arbre des nœuds non feuilles 4.36 4.51 4.62
+Voronoı¨ : distance euclidienne 83.97% 83.82% 83.70%
+Voronoı¨ : nombre de sauts 83.80% 83.75% 83.34%
+TAB. 3.5 – Caracte´ristiques des clusters.
+Forme des clusters.
+Comme le montre la figure 3.7, les clusters ressemblent a` un diagramme de Vo-
+ronoı¨ construit autour des chefs de clusters. Si S est un ensemble de n sites de l’espace
+euclidien, pour chaque site p de S, la cellule de Voronoı¨ V (p) de p est l’ensemble des
+points de l’espace qui sont ge´ographiquement plus proches de p que de tous les autres
+sites de S. Le diagramme de Voronoı¨ de V (S) est la de´composition de l’espace en
+cellules de Voronoı¨ des sites de l’espace.
+Ainsi, cela signifierait qu’e´tant donne´s les cluster-heads, un nœud s’est attache´ a` celui
+le plus proche de lui en distance euclidienne. Afin d’évaluer cette caractéristique, nous avons
+mene´ des simulations pour connaıˆtre le pourcentage de nœuds se situant dans la cellule
+de Voronoı¨ de leur chef et e´tant donc plus pre`s de lui que de tout autre chef en distance
+euclidienne. De plus, comme dans un re´seau sans fil, on ne conside`re pas la distance
+euclidienne mais la distance en nombre de sauts, nous avons e´galement regarde´ quelle
+proportion de nœuds e´taient plus proches en nombre de sauts de leur propre chef plutoˆt
+que de tout autre. Les re´sultats nume´riques sont donne´s dans la table 3.5. La figure 3.8
+donne pour une topologie de clusters (figure 3.8(a)) la proportion des nœuds se situant
+dans la ”bonne” cellule de Voronoı¨ en distance euclidienne (figure 3.8(b)) et en nombre
+de sauts (figure 3.8(c)). On remarquera que plus de 80% sont plus proches de leur
+cluster-head que d’un autre aussi bien en distance euclidienne qu’en nombre de sauts.
+Ceci pre´sente un avantage e´galement pour la diffusion d’un message dans un cluster,
+comme nous le verrons plus tard dans le chapitre 4.
+3.6. ANALYSE DE LA STRUCTURE 35
+1
+0.9
+0.8
+0.7
+0.6
+0.5
+0.4
+0.3
+0.2
+0.1
+0
+0 0.1 0.2 0.3 0.4 0.5 0.6 0.7 0.8 0.9 1
+1
+0.9
+0.8
+0.7
+0.6
+0.5
+0.4
+0.3
+0.2
+0.1
+0
+0 0.1 0.2 0.3 0.4 0.5 0.6 0.7 0.8 0.9 1
+FIG. 3.7 – Structure de clusters (sche´mas de gauche) et diagramme de Voronoı¨ corres-
+pondants (sche´mas de droite) pour λ = 1000 et λ = 500.
+(a) Topologie (b) Voronoı¨ euclidien (c) Voronoı¨ sauts
+FIG. 3.8 – Pour une structure de clusters (a), les nœuds dans la ”bonne” cellule de
+Voronoı¨ en distance euclidienne (b) ou en nombre de sauts (c) apparaissent en noir.
+36 CHAPITRE 3. ALGORITHME DE CLUSTERING
+3.7 Comparaison a` d’autres heuristiques
+Dans le but d’e´valuer notre heuristique et d’eˆtre en mesure de la situer parmi les
+heuristiques existantes, nous la comparons a` d’autres heuristiques de la litte´rature :
+DDR [59] et Max-Min d-cluster [4]. Ces heuristiques, de´crites dans le chapitre 2
+construisent des clusters dont le rayon est supe´rieur a` 1 saut comme notre heuristique.
+Max-Min d-cluster utilise l’identifiant des nœuds mais cherche a` ne pas toujours fa-
+voriser l’identifiant le plus fort et ainsi e´viter que les plus grands identifiants soient
+toujours cluster-heads. DDR, quant a` lui, est tre`s semblable a` notre algorithme mais
+se base sur le degre´ des nœuds.
+3.7.1 Comparaison avec DDR
+L’heuristique de DDR [59] construit des clusters de fac¸on assez similaire a` la noˆtre
+mais utilise le degre´ des nœuds comme me´trique au lieu de la densite´. Tout comme dans
+notre cas, le rayon des clusters n’est pas fixe´ a` l’avance et s’adapte automatiquement a`
+la topologie sous-jacente. Le degre´ est moins couˆteux que la densite´ puisqu’il ne´cessite
+la connaissance du 1-voisinage seulement. C’est pourquoi, nous avons voulu comparer
+les structures de clusters obtenues pour chacune des heuristiques.
+(a) Clusters DDR (b) Clusters Densite´
+FIG. 3.9 – Exemple de structure obtenue pour λ = 1000 et R = 0.1 avec DDR (a) et
+avec la 1-densite´ (b).
+Nb clusters Nb nœuds par cluster D˜(C) e˜(u/C)
+DDR 10.0 100 5.8 4.2
+densite´ 11.1 90.9 5.0 3.8
+TAB. 3.6 – Comparaison des clusters de DDR et de ceux obtenus par notre heuristique.
+3.7. COMPARAISON A` D’AUTRES HEURISTIQUES 37
+Les re´sultats sont donne´s par la figure 3.9 et la table 3.6. On remarquera que les struc-
+tures sont tre`s semblables. Nous avons alors compare´ la robustesse des structures face
+a` la mobilite´ des nœuds. Afin de permettre le passage a` l’e´chelle de la structure et de
+limiter les e´changes entre les nœuds, les chefs de cluster doivent rester chefs aussi long-
+temps que possible tout en maintenant des clusters adapte´s a` la topologie sous-jacente.
+Les auteurs de [66] donnent la de´finition suivante de la robustesse : ”one measure of ro-
+bustness of the topology is given by the maximum number of nodes that need to change
+their topology information as a result of a movement of a node 2” . C’est pourquoi,
+nous avons mene´ des simulations en appliquant une mobilite´ sur les nœuds et releve´
+la proportion de chefs e´tant re´-e´lus. Plus ce ratio est grand, moins importants sont les
+changements des informations des tables de routage des nœuds.
+Dans nos simulations, chaque nœud peut bouger ale´atoirement dans une direction
+ale´atoire a` une vitesse ale´atoire allant de 0 a` 10m/s (mode`le voiture) et de 0 a` 1.6m/s
+(mode`le pie´ton) durant 15 minutes (Mode`le Random Way Point). La table 3.7 donne le
+pourcentage de cluster-heads re´-e´lus toutes les 2 secondes par chacune des heuristiques.
+Les re´sultats montrent qu’en moyenne, notre heuristique reconstruit moins souvent les
+clusters que DDR. Elle s’ave`re donc eˆtre plus robuste.
+500 nœuds 600 nœuds 800 nœuds 1000 nœuds
+ρ DDR ρ DDR ρ DDR ρ DDR
+1.6m/s 68.7% 65% 67.2% 63.5% 64.5% 62.4% 62.2% 56.8%
+10m/s 30.1% 27.5% 27% 25.3% 26.2% 23.1% 24.8% 20.35%
+TAB. 3.7 – % de cluster-heads re´-e´lus.
+De par la mobilite´ des nœuds, un nouveau nœud peut apparaıˆtre dans le voisinage
+d’un autre. De fac¸on a` comprendre pourquoi la me´trique de densite´ est plus stable que
+le degre´ utilise´ par DDR, nous avons analyse´ comment le voisinage d’un nœud est
+perturbe´ par l’apparition de ce nouveau nœud. La structure de clusters se re-construit si
+le nœud qui avait le plus fort degre´ ou la plus forte densite´ dans son voisinage se trouve
+un voisin dont le degre´ ou la densite´ est devenu(e) plus fort(e) que le/la sien(ne), donc
+si l’ordre des degre´s ou densite´s entre les nœuds a change´.
+Nous conside´rons un processus ponctuel de Poisson d’intensite´ λ, distribue´ dans une
+boule de rayon 2R centre´e en un point 0 : B(0, 2R). Nous conside´rons alors le degre´ et
+la densite´ de ce point 0 ainsi que ceux d’un de ses voisins y choisi arbitrairement. Nous
+ajoutons alors le nœud mobile u dans le voisinage de 0. u est un nœud uniforme´ment
+distribue´ dans B(0, R). Nous pouvons alors calculer la probabilite´ que l’ordre des
+degre´s de 0 et y change a` cause de la pre´sence de u. Cela ne peut se faire que si u
+n’est pas voisin de y et si δ(0) = δ(y) ou δ(0) = δ(y)− 1. En effet, si u est voisin a` la
+fois de 0 et de y, l’ordre ne changera pas. Si u n’est voisin que de 0 et si δ(0) > δ(y),
+seul le degre´ de 0 augmente, ce qui ne change pas l’ordre. De meˆme si δ(0) < δ(y)−1,
+meˆme si le degre´ de 0 augmente de 1, il reste infe´rieur a` δ(y).
+2Une mesure de la robustesse de la topologie est donne´e par le nombre maximum de nœuds qui doivent
+changer leur information sur la topologie pour le mouvement d’un nœud.
+38 CHAPITRE 3. ALGORITHME DE CLUSTERING
+Soit C une variable de´signant la re´gion du plan B(0, R)\B(y,R). C correspond a` la
+zone de voisinage du nœud 0 dans laquelle les nœuds ne sont pas voisins de y (Voisi-
+nage de 0 non colore´ sur la figure 3.4 ou` on prend u = 0 et v = y). ν(C) est la mesure
+de Lebesgue de C = B(0, R)\B(y,R).
+La probabilité $P_1$ que u ne soit voisin que du nœud 0 revient à la probabilité que u se
+trouve dans la zone C. D’où : $P_1 = \frac{\nu(C)}{\pi R^2}$.
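+La probabilité $P_2$ que δ(0) = δ(y) est la probabilité que 0 et y aient autant de voisins
+non communs avant l’arrivée de u. D’où :
+$$P_2 = \sum_{k=0}^{\infty} \mathbb{P}\big(\Phi(B(0,R)\setminus B(y,R)) = k\big) \times \mathbb{P}\big(\Phi(B(y,R)\setminus B(0,R)) = k\big)$$
+$$\phantom{P_2} = \exp\{-2\lambda\nu(C)\} \sum_{k=0}^{\infty} \frac{\lambda^{2k}\,\nu(C)^{2k}}{k!\,k!}$$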
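+La probabilité $P_3$ que δ(0) = δ(y) − 1 est la probabilité que y ait exactement un voisin
+non commun de plus que 0. D’où :
+$$P_3 = \sum_{k=0}^{\infty} \mathbb{P}\big(\Phi(B(0,R)\setminus B(y,R)) = k\big) \times \mathbb{P}\big(\Phi(B(y,R)\setminus B(0,R)) = k+1\big)$$
+$$\phantom{P_3} = \exp\{-2\lambda\nu(C)\} \sum_{k=0}^{\infty} \frac{\lambda^{2k+1}\,\nu(C)^{2k+1}}{k!\,(k+1)!}$$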
+A` partir de la`, pour obtenir la probabilite´ Pp que l’ordre change, il nous faut faire la
+moyenne sur tous les points y, en multipliant par la probabilite´ que y existe, c.a`.d. par
+la probabilite´ P(Φ(B(0, R)) > 0) que le nœud 0 ait au moins un voisin. Sachant que
+y est uniforme´ment distribue´ dans B(0, 2R), la probabilite´ Pp que l’ordre change peut
+alors s’e´crire :
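+$$P_p = \mathbb{E}\left[P_1 (P_2 + P_3)\right]\, \mathbb{P}\big(\Phi(B(0,R)) > 0\big)$$
+$$\phantom{P_p} = \mathbb{E}\left[P_1 (P_2 + P_3)\right] \left(1 - \exp\{-\lambda \pi R^2\}\right)$$
+$$\phantom{P_p} = \mathbb{E}\left[\frac{\nu(C)}{\pi R^2}\, \exp\{-2\lambda\nu(C)\} \sum_{n=0}^{+\infty} \frac{(\lambda\nu(C))^{2n}}{n!\,n!} \left(1 + \frac{\lambda\nu(C)}{n+1}\right)\right] \left(1 - \exp\{-\lambda \pi R^2\}\right)$$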
+Malheureusement, nous n’avons pas e´te´ en mesure de donner un re´sultat analytique
+donnant la probabilite´ que l’ordre des densite´s des nœuds 0 et y soit perturbe´ par l’ar-
+rive´e du nœud u. Ne´anmoins, nous avons obtenu une approximation par simulation. La
+figure 3.10 donne les probabilite´s que l’ordre change pour les deux me´triques (obtenues
+par simulation) et la probabilite´ Pp obtenue analytiquement pour le degre´.
+Ces re´sultats correspondent a` ceux obtenus pre´ce´demment dans la table 3.7. La pro-
+babilite´ que l’ordre des me´triques change avec l’apparition d’un nœud mobile dans un
+voisinage est plus importante pour le degre´ que pour la densite´. Cela tend a` prouver
+que la structure base´e sur la densite´ est plus stable que celle base´e sur le degre´.
+3.7. COMPARAISON A` D’AUTRES HEURISTIQUES 39
+ 0.1
+degree
+density
+theoretical probability for the degree as metric
+ 0.09
+ 0.08
+ 0.07
+ 0.06
+ 0.05
+ 0.04
+ 0.03
+ 15  20  25  30  35  40  45  50  55
+mean number of neighbors
+FIG. 3.10 – Probabilite´ que l’ordre des me´triques change entre deux voisins.
+3.7.2 Comparaison avec l’heuristique Max-Min d-cluster
+L’heuristique Max-Min d-cluster [4] produit e´galement des clusters dont le rayon est
+supe´rieur a` 1. La structure de Max-Min a obtenu de tre`s bons re´sultats de stabilite´. Elle
+utilise l’identifiant des nœuds mais tente de contrebalancer le fait qu’un cluster-head
+e´lu sur cette me´trique garde son roˆle quasi-inde´finiment, en e´lisant non pas le plus
+grand ou plus petit identifiant mais le nœud posse´dant le plus petit identifiant parmi les
+plus grands identifiants des nœuds se trouvant a` au plus d sauts de lui. Le parame`tre d
+est le rayon des clusters et doit eˆtre fixe´ a priori.
+Structure.
+Nb clusters Nb de nœuds par cluster D˜(C) e˜(u/C)
+densite´ 11.1 90.9 5.0 3.8
+Max-Min 2-cluster 28.6 34.9 3.6 3.1
+Max-Min 3-cluster 13.3 75.2 4.9 3.4
+Max-Min 4-cluster 8.2 122.0 6.5 4.9
+TAB. 3.8 – Caracte´ristiques des clusters de la densite´ et de Max-Min d-cluster.
+Dans un premier temps, nous avons simule´ Max-Min d-cluster pour plusieurs valeurs
+du rayon d. Les re´sultats donne´s dans la table 3.8 nous montrent que l’heuristique Max-
+Min pour d = 3 est la plus proche de notre heuristique. Par la suite, c’est celle que nous
+conside´rerons.
+La figure 3.11 donne le nombre de clusters produits par notre heuristique et par Max-
+Min 3-cluster pour λ = 1000 et diffe´rentes valeurs de R.
+On remarquera que le nombre de clusters obtenu est similaire pour les deux me´triques
+mais Max-Min 3-cluster construit des clusters plus petits lorsque le re´seau est peu
+probabilities
+40 CHAPITRE 3. ALGORITHME DE CLUSTERING
+55
+MaxMin
+Density
+50
+45
+40
+35
+30
+25
+20
+15
+10
+5
+60 70 80 90 100 110 120 130 140 150
+Radius (meters)
+FIG. 3.11 – Nombre de clusters forme´s pour diffe´rentes valeurs de R avec la densite´
+(−×−) et Max-Min 3-cluster (−+−).
+dense. Notre heuristique s’adapte mieux aux réseaux peu denses puisqu’elle produit des
+clusters plus adapte´s et en plus petit nombre. De plus, contrairement a` l’heuristique de
+Max-Min, notre algorithme n’autorise pas la formation de clusters a` un seul nœud qui
+sont inutiles.
+Les figures 3.12 (a) et (b) donnent un exemple de structure de clusters obtenue par
+simulation par chacune des heuristiques sur une meˆme distribution des nœuds. Dans
+les deux cas, les clusters semblent homoge`nes. Les chefs de clusters sont bien re´partis
+dans l’espace.
+(a) Clusters obtenus par Max-Min 3- (b) Clusters obtenus par notre heuris-
+cluster tique
+FIG. 3.12 – Exemple d’une structure de clusters pour une topologie a` 1000 nœuds de
+rayon de transmission R = 0.1 obtenue avec Max-Min 3-cluster (a) et avec l’heuris-
+tique utilisant la densite´ (b).
+# of clusters
+3.7. COMPARAISON A` D’AUTRES HEURISTIQUES 41
+Comparaison face a` la mobilite´ des nœuds.
+De la meˆme fac¸on que pour DDR, nous avons compare´ l’heuristique de Max-Min
+et la noˆtre face a` la mobilite´ des nœuds, en effectuant des simulations ou` les nœuds
+bougeaient a` diffe´rentes vitesses ale´atoires. Nous avons pu constater que Max-Min d-
+cluster re´-e´lit les meˆmes cluster-heads dans plus de 90% des cas. Cela e´tait pre´visible
+e´tant donne´ que l’e´lection conside`re l’identite´ des nœuds qui ne change pas lorsque les
+nœuds bougent. En se basant seulement sur ces re´sultats, on pourrait donc pre´tendre
+que Max-Min est plus stable que notre heuristique. Seulement, l’identifiant des nœuds
+e´tant inde´pendant de la topologie sous-jacente, les clusters nouvellement reforme´s ne
+sont pas toujours adapte´s a` la topologie. Afin d’e´valuer cela, nous avons conside´re´ plus
+en de´tail l’apparition des nœuds.
+Dans les re´sultats suivants, pre´sente´s dans la table 3.9, nous conside´rons une topologie
+initiale de 500 nœuds dans laquelle apparaissent progressivement de fac¸on ale´atoire,
+dix vagues de 100 nouveaux nœuds, avec des identifiants ale´atoires. Ces re´sultats
+donnent le pourcentage de cluster-heads re´-e´lus et le pourcentage d’augmentation du
+nombre de clusters dans le re´seau.
+% cluster-heads re´-e´lus Evolution du nombre de clusters
+densite´ 94.3% +0%
+Max-Min 3-cluster 100% +46%
+TAB. 3.9 – Comparaison de Max-Min 3-cluster et de l’heuristique de densite´ face a`
+l’arrive´e des nœuds.
+On remarque que meˆme si Max-Min re´-e´lit toujours les meˆmes chefs de cluster, l’heu-
+ristique en e´lit e´galement d’autres. L’heuristique de densite´ quant a` elle incorpore les
+nouveaux nœuds dans les clusters existants. Le comportement de Max-Min est duˆ au
+fait que si un nouveau nœud a un identifiant supérieur au chef déjà en place, il crée son
+propre cluster en ne modifiant les clusters existants que s’il est dans le voisinage d’un
+ancien chef. Dans le cas contraire, les anciens clusters restent inchangés, le nouveau
+nœud étant souvent le seul nœud de son cluster nouvellement formé.
+Comparaison des structures sur des topologies non uniformes.
+Enfin, nous avons compare´ les structures obtenues par notre heuristique et Max-Min sur
+des topologies de nœuds non uniformes. Les nœuds sont distribue´s autour de quelques
+points choisis ale´atoirement qui pourraient repre´senter des villes. Les figures 3.13 (a)
+et (b) illustrent une telle topologie. On peut remarquer que notre heuristique ge´ne`re
+moins de clusters avec des cluster-heads mieux centre´s. Max-Min ge´ne`re la` aussi des
+clusters à 1 nœud ou des cluster-heads voisins. Par exemple, sur une même topologie
+de 1000 nœuds, notre heuristique ge´ne`re 8.7 clusters en moyenne contre 15.25 clusters
+pour Max-Min.
+42 CHAPITRE 3. ALGORITHME DE CLUSTERING
+(a) Clusters obtenus par Max-Min 3- (b) Clusters obtenus par notre heuris-
+cluster tique
+FIG. 3.13 – Distribution non uniforme de nœuds : clusters obtenus avec Max-Min 3-
+cluster (a) et avec la me´trique de densite´ (b).
+Complexite´.
+L’heuristique de Max-Min d-cluster se compose de 3 phases de diffusion de messages
+a` d sauts : une phase re´cupe´rant le plus grand identifiant a` d sauts, une phase re´cupe´rant
+le plus petit identifiant parmi les plus grands a` d sauts et enfin une phase pour diffuser
+l’identite´ du chef de cluster. Notre heuristique, quant a` elle, est purement locale et
+ne ne´cessite qu’une information sur le 2-voisinage obtenue par des messages diffuse´s
+uniquement dans le 1-voisinage. Max-Min d-cluster s’avère donc plus coûteux en termes
+de messages et de latence que notre algorithme.
+3.8 Analyse de l’auto-stabilisation
+Comme nous avons pu le constater dans le chapitre 2, il existe de nombreux proto-
+coles de clustering pour les re´seaux sans fil. Cependant, seulement tre`s peu ve´rifient
+la robustesse de leur algorithme et, meˆme quand c’est le cas, l’e´valuation est mene´e
+par simulation et jamais via une analyse the´orique. Dans cette section, nous appliquons
+les principes d’auto-stabilisation a` notre algorithme de clustering. L’auto-stabilisation
+est la proprie´te´ d’un syste`me a` atteindre seul une configuration dans laquelle il a un
+comportement correct, en partant de n’importe quelle configuration arbitraire. A` l’aide
+d’une approche the´orique, nous montrons que, sous certaines hypothe`ses, l’algorithme
+est auto-stabilisant localement et que le temps de convergence est faible et borne´. Nous
+validons ensuite cette proprie´te´ par simulation.
+3.8. ANALYSE DE L’AUTO-STABILISATION 43
+3.8.1 Pre´-requis
+Nous pre´sentons dans un premier temps les diffe´rentes hypothe`ses. Nous conside´rons
+que l’algorithme se stabilise lorsque chaque nœud connaıˆt l’identite´ de son cluster-
+head. Le temps de stabilisation est donc lie´ a` la hauteur des arbres de clustering, l’iden-
+tite´ du chef devant eˆtre transmise jusqu’aux feuilles de l’arbre. Nous suivons les meˆmes
+principes et hypothe`ses que dans [38] :
+Hypothe`ses. Nous supposons qu’il existe une constante τ > 0 telle que la probabilite´
+qu’un paquet soit transmis sans collision entre deux nœuds voisins est au moins τ . Cela
+implique que nous supposons que tous les nœuds parviennent a` e´mettre avec succe`s
+un message en une e´tape de temps de´pendant de τ . Cela correspond aux hypothe`ses
+classiques concernant les canaux multi-acce`s [14]. Cette hypothe`se est justifie´e en an-
+nexe 3.11.3. Nous supposons également qu’il existe une constante ∆ connue, telle que
+pour tout nœud u, δ(u) ≤ ∆. Ceci peut eˆtre ve´rifie´ par un controˆle de topologie qui est
+en mesure d’ajuster la porte´e de communication ou la puissance de transmission des
+nœuds lorsque le re´seau est trop dense.
+Notation. Nous de´crivons les algorithmes sous la forme de re`gles garde´es. G → S
+repre´sente une telle re`gle, ou` G est un pre´dicat sur les variables locales d’un nœud,
+S une affectation de ces meˆmes variables locales. Si le pre´dicat G (la garde) est
+vrai, l’affectation S est exe´cute´e, sinon elle est ignore´e. Certaines gardes peuvent eˆtre
+de´clenche´es sur e´ve´nement, par exemple lors de la re´ception d’un message. Nous sup-
+posons que ces e´ve´nements s’exe´cutent de manie`re atomique lors de la re´ception d’un
+message. Pour toute configuration du syste`me, quand une garde G est vraie, G est
+dite activable dans cette configuration. L’ope´rateur [] correspond a` la composition non-
+déterministe des règles gardées ; $([]\, q : q \in M_p : G_q \to S_q)$ est une formula-
+tion réduite de l’expression $G_{q_1} \to S_{q_1} \;[]\; G_{q_2} \to S_{q_2} \;[]\; \cdots \;[]\; G_{q_k} \to S_{q_k}$, où
+$M_p = \{q_1, q_2, \ldots, q_k\}$.
+Se´mantique de l’exe´cution. L’exe´cution du syste`me consiste pour chaque nœud a`
+e´valuer pe´riodiquement ses re`gles garde´es. Nous supposons que chaque re`gle acti-
+vable est exe´cute´e en un temps constant (ou ignore´e si la re`gle n’est pas activable).
+De manie`re ge´ne´rale, nous conside´rons que lorsqu’un nœud exe´cute son programme,
+toutes ses re`gles activables sont effectivement exe´cute´es en un temps constant (par
+exemple en suivant le mode`le du tourniquet).
+Propagation des variables partage´es. Certaines variables des nœuds sont dites par-
+tage´es. Suivant le sche´ma pre´sente´ en [38], les nœuds diffusent pe´riodiquement les
+valeurs de leurs variables partage´es. Cela signifie que lorsqu’un nœud affecte une va-
+leur a` une variable partage´e, nous supposons que cette instruction est transforme´e de
+telle sorte que, d’une part la variable partage´e est re´gulie`rement transmise au voisinage
+du nœud, et que d’autre part cette retransmission s’effectue de manie`re probabiliste
+pour e´viter les collisions. Une implantation possible peut eˆtre trouve´e dans [38]. Dans
+la suite, nous supposons e´galement que le sche´ma de [38] est utilise´ pour obtenir Γ(u)
+et Γ2(u) pour chaque nœud u.
+44 CHAPITRE 3. ALGORITHME DE CLUSTERING
+3.8.2 Construction d’un DAG de hauteur constante
+Un DAG ou Directed Acyclic Graph est un graphe simple orienté et sans circuit (cycle orienté). Dans
+notre algorithme, comme dans tout algorithme utilisant l’identifiant des nœuds comme
+crite`re de de´cision finale sans contrainte sur le rayon du cluster (comme dans DDR),
+le pire cas en terme de stabilisation et de formation de clusters se rencontre quand
+tous les nœuds ont la meˆme valeur de de´cision (comme le degre´ ou la densite´) et que
+les identifiants des nœuds sont uniques et mal distribue´s. L’algorithme peut alors ne
+construire qu’un seul cluster dont le diame`tre est aussi grand que celui du re´seau, le
+temps de stabilisation de´pendant de ce diame`tre. De plus, il est e´vident que construire
+un tel cluster est inutile puisque nous pourrions tout aussi bien utiliser directement
+le re´seau. Pour pallier cet inconve´nient, il peut s’ave´rer utile d’allouer une couleur aux
+nœuds, couleur choisie dans un espaceΩ constant et plus petit que celui des identifiants,
+de fac¸on a` ce que les couleurs soient localement uniques (dans notre cas, les couleurs
+doivent eˆtre uniques a` distance 2 pour qu’un nœud puisse choisir entre deux voisins en
+compe´tition) et d’utiliser ces couleurs comme crite`re de de´cision finale. Un DAG peut
+alors eˆtre construit a` partir de ces couleurs en orientant les areˆtes entre les voisins de la
+couleur la plus grande vers la plus petite.
+Notre construction de DAG a` hauteur constante est base´e sur la technique ale´atoire
+décrite dans [38], mais utilise un espace de couleur Ω beaucoup plus petit ($|\Omega| = \Delta^6$
+dans [38] tandis que $\Delta^2$, ou même $\Delta$, est suffisant dans notre cas avec
+$\Delta = \max_{u \in V} \delta(u)$).
+Soit $Color_u \in \Omega$ une variable partagée désignant la couleur du nœud u. Soit
+$Color_{\Gamma(u)} = \{\widehat{Color}_v \mid v \in \Gamma(u)\}$, où $\widehat{Color}_v$ réfère à la copie en cache de
+la variable partagée $Color_v$ au nœud u. En d’autres termes, $\widehat{Color}_v$ correspond à la
+couleur que u pense que v a.
+Supposons que random(S) choisit avec une probabilité uniforme un élément dans un
+ensemble S. Le nœud u utilise la fonction suivante pour calculer $Color_u$ :
+$$newColor(Color_u) = \begin{cases} Color_u & \text{si } Color_u \notin Color_{\Gamma(u)} \\ random(\Omega \setminus Color_{\Gamma(u)}) & \text{sinon} \end{cases}$$
+L’algorithme de construction d’un DAG a` hauteur constante est le suivant :
+N1 : VRAI → Coloru := newColor(Coloru)
+The´ore`me 1 L’algorithme N1 stabilise avec probabilite´ 1 en un temps constant vers
+un DAG de hauteur infe´rieure ou e´gale a` |Ω|+ 1.
+Preuve 1 La preuve de ce the´ore`me est similaire a` celle de [38]. Supposons que la
+hauteur du DAG soit supe´rieure a` |Ω| + 1. Cela signifie qu’il existe au moins deux
+nœuds de meˆme couleur sur une branche du DAG (sur un chemin reliant la racine a`
+une feuille). Or, les areˆtes du DAG sont oriente´es en fonction des couleurs des nœuds
+qui sont ordonne´es. Si sur la meˆme branche, il existe deux nœuds u et v de meˆme
+couleur, cela implique que Coloru < Colorv , ce qui contredit l’hypothe`se d’ordre total
+des couleurs. 
+3.8. ANALYSE DE L’AUTO-STABILISATION 45
+3.8.3 Analyse de la construction du DAG de couleurs
+Nous avons cherche´ a` caracte´riser le DAG que nous construisons et son couˆt. Pour
+cela, nous avons analyse´ analytiquement et par simulation le temps de construction
+du DAG qui correspond au temps de stabilisation de l’algorithme de coloriage. Nous
+avons e´galement mesure´ par simulation l’influence de la taille du domaine des couleurs
+Ω sur ce temps de stabilisation et sur la taille du DAG re´sultant. Comme nous allons
+le voir, il en ressort qu’un compromis est a` faire pour de´terminer le parame`tre Ω : plus
+la valeur de |Ω| est grande, plus le temps de convergence de N1 est faible mais plus la
+hauteur du DAG est importante. Une hauteur de DAG importante augmente le temps
+de stabilisation des algorithmes qui se basent sur ces DAG.
+Analyse the´orique du temps de convergence.
+Le temps de convergence de l’algorithme de coloriage N1 correspond au nombre
+d’e´tapes ne´cessaires avant que chaque nœud ait une couleur unique dans son voisinage.
+Pour mener cette e´tude the´orique, nous nous sommes inspire´s du protocole NAP [21].
+Nous modélisons l’algorithme de coloriage par des lancers successifs de boules dans des
+urnes. L’ensemble des couleurs est repre´sente´ par M urnes dans lesquelles L boules
+repre´sentant les nœuds sont distribue´es.
+L’algorithme de coloriage peut eˆtre mode´lise´ de la fac¸on suivante en termes d’urnes et
+de boules :
+Algorithm 2 COLORIAGE(L, M )
+⊲ Entre´es : M urnes et L boules
+⊲ Pre´-condition : M ≥ L
+if (L ≠ 0) then
+Lance ale´atoirement L boules dans les M urnes ;
+Met de coˆte´ toutes les urnes contenant exactement une boule avec leur boule ;
+Soit c ≤M le nombre d’urnes isole´es ;
+Appelle COLORIAGE(L− c, M − c) ;
+end
+On remarque qu’une telle analyse ne conside`re que des graphes complets. Dans un
+re´seau sans fil qui n’est pas ne´cessairement un graphe complet, deux nœuds voisins (A
+et B) n’e´tant pas en conflit mutuel peuvent tout de meˆme tirer une nouvelle couleur
+simultane´ment s’ils sont chacun en conflit avec un autre de leur voisin non visible par
+A ou B, ce qui n’est pas conside´re´ dans cette analyse. Ainsi, l’e´tude suivante nous
+fournit une borne infe´rieure sur le temps de stabilisation de l’algorithme. Cet aspect est
+plus de´taille´ dans [55].
+Dans chaque voisinage, le but est alors de n’avoir qu’une seule boule (un nœud) as-
+socie´e a` une seule urne donne´e (une couleur). Soit la variable ale´atoire N repre´sentant
+le nombre d’ite´rations ne´cessaires pour obtenir une telle configuration. Le temps de
+convergence moyen de l’algorithme est l’espe´rance de N : E[N ]. Pour de´terminer
+46 CHAPITRE 3. ALGORITHME DE CLUSTERING
+E[N ], nous conside´rons une chaıˆne de Markov a` temps discret X = {Xn, n ∈ N}
+sur l’espace $I = \{0, 1, \ldots, L\}$. $X_n = i$ représente le fait qu’après n transitions, exacte-
+ment i boules et urnes ont e´te´ mises de coˆte´.
+Nous notons $P(L,M) = (p_{i,j}(L,M))_{(i,j) \in I^2}$ la matrice de probabilité de transition de
+la chaıˆne de Markov X . L’espe´rance E[N ] peut eˆtre de´duite du calcul des pi,j(L,M).
+pi,j(L,M) repre´sente la probabilite´ d’avoir exactement j urnes de coˆte´ au temps n+1
+sachant que i urnes e´taient de coˆte´ au temps n. pi,j(L,M) peut aussi eˆtre vu comme
+la probabilite´ d’obtenir exactement j − i urnes avec exactement une boule en lanc¸ant
+L− i boules dans M − i urnes. Nous obtenons donc, pour tout i ≤ j :
+pi,j(L,M) = pi,j = p0,j−i(L− i,M − i). (3.1)
+X est acyclique et l’état L est un état absorbant. Cela signifie que pour tout $i \in I \setminus \{L\}$
+et tout $j \in I$, $p_{i,j}(L,M) = 0$ si $i > j$ et $p_{L,L}(L,M) = 1$.
+Graˆce a` la relation 3.1, nous pouvons ne calculer que les valeurs des p0,j−i(L−i,M−i)
+pour i ≤ j pour obtenir toutes les valeurs de la matrice P(L,M).
+p0,j(L,M) est la probabilite´ d’obtenir exactement j urnes avec exactement une boule
+lors du lancer de L boules dans M urnes. Le cas j = L conduit au proble`me des
+anniversaires, d’ou` :
+$$p_{0,L}(L,M) = \frac{M!}{(M-L)!\; M^{L}}$$
+Pour j < L, nous proce´dons de la sorte. L boules sont lance´es dans M urnes. On note
+K0(L,M) le nombre d’urnes vides et K1(L,M) le nombre d’urnes contenant exacte-
+ment une boule. Soit aL,M (k, j) la distribution jointe des deux variables ale´atoires K0
+et K1 :
+aL,M (k, j) = P[K0(L,M) = k, K1(L,M) = j]
+Les p0,j(L,M) peuvent alors s’e´crire :
+$$p_{0,j}(L,M) = \mathbb{P}[K_1(L,M) = j] = \sum_{k=0}^{M} a_{L,M}(k,j)$$
+Ainsi, afin de calculer la matrice de transition P(L,M), il ne nous reste qu’a`
+de´terminer les aL,M (k, j). Pour cela, nous raisonnons par re´currence en conditionnant
+le re´sultat du dernier lancer : pour obtenir k urnes vides et j urnes avec exactement une
+boule en lançant L boules dans M urnes, il faut, à la fin du lancer de la $(L-1)^{\text{ième}}$
+boule :
+1. soit avoir k + 1 urnes vides et j − 1 urnes avec exactement une boule et lancer
+la dernie`re boule dans une urne vide ;
+2. soit avoir k urnes vides et j + 1 urnes avec exactement une boule et lancer la
+dernie`re boule dans une urne qui contenait exactement une boule ;
+3. soit avoir k urnes vides et j urnes avec exactement une boule et lancer la dernie`re
+boule dans une urne qui contenait au moins deux boules.
+3.8. ANALYSE DE L’AUTO-STABILISATION 47
+Pour L ≥ 2, on obtient :
+$$a_{L,M}(k,j) = \frac{k+1}{M}\, a_{L-1,M}(k+1, j-1)\, 1_{\{j \ge 1\}} + \frac{j+1}{M}\, a_{L-1,M}(k, j+1) + \frac{M-(j+k)}{M}\, a_{L-1,M}(k,j)$$
+ou` 1{c} = 1 si la condition c est remplie et 0 sinon.
+Les aL,M (k, j) peuvent eˆtre calcule´s par re´cursion en conside´rant que si L = 1 :
+a1,M (k, j) = 1{k=M−1, j=1}
+On remarque aussi que $a_{L,M}(k,j) = 0$ si $j > L$, si $k = M$ ou si $j + k > M$. De même,
+si $j = L$, on a $a_{L,M}(k,L) = 0$ pour $k \neq M - L$ et $a_{L,M}(M-L,L) = p_{0,L}(L,M)$.
+Une fois la matrice de probabilite´s de transition obtenue, on peut de´terminer la dis-
+tribution de N (P [N = n] pour n = 0, . . . ,∞) et sa valeur moyenne E [N ]. Les cal-
+culs sont les meˆmes que ceux mene´s dans l’e´tude du protocole NAP. Ils de´rivent des
+re´sultats classiques des chaıˆnes de Markov. Nous les utilisons directement ici.
+Nous de´finissonsQ la sous-matrice obtenue a` partir deP(L,M), en retirant la dernie`re
+ligne et la dernie`re colonne qui correspondent a` l’e´tat absorbant L.
+Soit α le vecteur ligne contenant la distribution initiale des probabilite´s des e´tats tran-
+sitoires de X . α est tel que α = (P [X0 = i])i=0,...,L−1. La chaıˆne de Markov X
+commence en l’e´tat 0 avec la probabilite´ 1, d’ou` α = (1, 0, . . . , 0).
+De par les re´sultats classiques des chaıˆnes de Markov, on obtient :
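+$$\mathbb{P}[N = n] = \alpha Q^{n-1} (I - Q)\, \mathbb{1}, \quad \text{pour } n \ge 1,$$
+$$\mathbb{P}[N > n] = \sum_{k=n+1}^{\infty} \alpha Q^{k-1} (I - Q)\, \mathbb{1} = \alpha Q^{n}\, \mathbb{1}, \quad \text{pour } n \ge 0,$$
+$$\mathbb{E}[N] = \sum_{n=0}^{\infty} \mathbb{P}[N > n] = \alpha (I - Q)^{-1}\, \mathbb{1}$$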
+ou` I est la matrice identite´ et 1 le vecteur colonne unite´, tous deux de dimension L.
+On note $V = (V_i)_{0 \le i \le L-1}$ le vecteur d’espérance conditionnelle défini par
+$V_i = \mathbb{E}[N \mid X_0 = i]$. On a $V = (I - Q)^{-1}\, \mathbb{1}$. D’où $\mathbb{E}[N] = \alpha V = V_0$. Le vecteur V est
+solution du système linéaire $(I - Q)V = \mathbb{1}$. Cela peut s’écrire également $V = \mathbb{1} + QV$.
+Ainsi, comme la matrice P(L,M) est acyclique, on obtient, pour $i = L-2, \ldots, 0$ :
+$$V_i = \frac{1}{1 - p_{i,i}} \left( 1 + \sum_{j=i+1}^{L-1} p_{i,j}\, V_j \right)$$
+Comme $V_{L-1} = 1/(1 - p_{L-1,L-1})$, on peut obtenir $V_0$ récursivement, et ainsi,
+obtenir le temps de convergence moyen E [N ].
+48 CHAPITRE 3. ALGORITHME DE CLUSTERING
+Simulations.
+Afin de valider nos re´sultats the´oriques et de mesurer l’impact de la taille du domaine
+des couleurs Ω sur le temps de convergence et sur la hauteur du DAG, nous avons mene´
+des simulations utilisant plusieurs valeurs de |Ω|. Nous avons simule´ l’Algorithme N1
+en utilisant $|\Omega| = (\max_{p \in V} |\Gamma(p)|)^2$, cette valeur étant celle considérée par certains
+algorithmes auto-stabilisants base´s sur le coloriage [38]. Nous avons e´galement e´tudie´
+l’Algorithme N1 en utilisant |Ω| = 2 × (maxp∈V |Γ(p)|). De plus, comme dans les
+re´seaux sans fil, les nœuds n’ont aucune connaissance globale du re´seau et donc, aucun
+moyen a priori de connaıˆtre le plus fort degre´ du graphe, nous avons e´galement mene´
+des simulations en utilisant une taille de domaine de couleur propre à chaque nœud,
+telle que : $\forall p \in V,\ |\Omega_p| = (|\Gamma(p)|)^2$.
+Nous avons alors conside´re´ le temps de convergence et la taille du DAG induit.
+Dans un premier temps, nous avons compare´ les re´sultats the´oriques et de simulation
+afin de valider chaque approche. La table 3.10 montre les temps de convergence de
+l’algorithme de coloriage a` distance 1 sur une topologie grille ou` chaque nœud interne
+a respectivement 4 ou 8 voisins. On remarque que les re´sultats s’accordent.
+4 voisins 8 voisins
+2 ∗Max Max2 2 ∗Max Max2
+The´orie Simulation The´orie Simulation The´orie Simulation The´orie Simulation
+2.14 2.14 1.56 1.61 1.56 1.67 1.15 1.21
+TAB. 3.10 – Temps de stabilisation théorique et obtenu par simulation avec
+$|\Omega| = (\max_{p \in V} |N_p|)^2$ et $|\Omega| = 2 \times (\max_{p \in V} |N_p|)$ dans une grille à 4 et 8 voisins.
+La figure 3.14 montre l’influence de la taille du domaine sur le temps de convergence
+et la hauteur du DAG dans le cas d’un coloriage a` distance 1. Les re´sultats montrent
+clairement que plus la valeur de |Ω| est grande, plus le temps de convergence de N1 est
+faible mais plus la hauteur du DAG est importante. Il y a donc un compromis a` faire
+pour de´terminer le parame`tre Ω.
+3.8.4 Utilisation des couleurs pour le clustering
+Dans cette section, nous re´-e´crivons l’algorithme de clustering avec les re`gles d’auto-
+stabilisation. Chaque nœud u maintient deux variables partage´es : ρ(u) et H(u) ou`
+ρ(u) est la densite´ du nœud u et H(u) son cluster-head.
+Afin d’utiliser le DAG des couleurs dans l’algorithme de clustering,
+nous redéfinissons l'opérateur d'ordre binaire ≺ défini dans la
+section 3.2 de la façon suivante : pour $(u, v) \in V^2$, $u \prec v$ si et
+seulement si {ρ(u) < ρ(v)} ou {ρ(u) = ρ(v) ∧Age(u) < Age(v)} ou
+{ρ(u) = ρ(v) ∧Age(u) = Age(v) ∧ Colorv < Coloru}. Soit max≺ la fonction
+de maximum associe´e a` l’ope´rateur d’ordre binaire ≺. Quand un nœud u calcule le
+3.8. ANALYSE DE L’AUTO-STABILISATION 49
+3 2
+2.8
+1.95
+2.6
+2.4
+1.9
+2.2
+2 1.85
+1.8
+1.8 |Omega| = 2 * Degre Max
+1.6 |Omega| = Degre Noeud au carre
+|Omega| = 2 * Degre Max |Omega|= Degre Max au carre
+1.4 |O|mOemgeag| a=|  D= eDgereg rneo Meuadx  aauu  ccaarrrree 1.75
+1.2
+1 1.7
+500 600 700 800 900 1000 1100 500 600 700 800 900 1000 1100
+Intensite du processus lambda Intensite du processus lambda
+(a) Temps de stabilisation (b) Hauteur du DAG
+FIG. 3.14 – Influence de Ω.
+résultat de ≺ ou de max≺, il utilise les valeurs cache de son voisinage en supposant
+$\widehat{Color}_u = Color_u$ et $\widehat{\rho}(u) = \rho(u)$.
+Nous définissons maintenant la fonction clusterHead d'élection de cluster-head :
+\[ \mathrm{clusterHead} = \begin{cases} u & \text{si } \forall v \in \Gamma(u),\ v \prec u, \\ H(\max_{\prec}\{v \in \Gamma(u)\}) & \text{sinon.} \end{cases} \]
+L’algorithme s’exe´cute comme suit :
+R1 : VRAI → ρ(u) := densite
+R2 : VRAI → H(u) := clusterHead
+Lemme 4 Partant de n’importe quelle configuration initiale, chaque nœud u a une
+valeur de densite´ correcte ρ(u) en un temps borne´ constant.
+Preuve 2 Apre`s un temps constant, chaque nœud u a une vue correcte de son 2-
+voisinage. Puis, apre`s l’exe´cution de la re`gle R1, la densite´ ρ(u) du nœud u est cor-
+recte. 
+Lemme 5 Partant de n’importe quelle configuration initiale, chaque nœud u a une
+valeur correcte pour H(u) en un temps borne´ constant.
+Preuve 3 Supposons que tout nœud a une valeur correcte de sa densite´ (vrai apre`s
+un temps constant d’apre`s le Lemme 4). Apre`s que la variable partage´e ρ(u) ait e´te´
+communique´e sans collision a` tout nœud de Γ(u) (cela arrive apre`s un temps constant),
+chaque nœud a une valeur cache correcte pour la densite´ de chacun de ses voisins.
+Nous conside´rons maintenant le DAG induit par la relation ≺ (note´ DAG≺ par la
+suite). En un temps constant, les racines de DAG≺ ont une valeur correcte de l’identite´
+de leur cluster-head (puisqu’il s’agit de leur propre identifiant). Supposons que tout
+nœud a` distance infe´rieure ou e´gale a` n des racines de DAG≺ a une valeur correcte de
+l’identite´ de leur cluster-head. Sur exe´cution de la re`gle R2 sur les nœuds a` distance
+Temps de stabilisation
+Hauteur du DAG induit
+50 CHAPITRE 3. ALGORITHME DE CLUSTERING
+n+1 des racines de DAG≺, ces nœuds obtiennent alors une valeur correcte de l’identite´
+de leur cluster-head (puisque le cluster-head est de´termine´ de fac¸on de´terministe (i)
+par la densite´ et la topologie locale – qui est fixe – et (ii) par l’identite´ des cluster-heads
+des nœuds a` distance infe´rieure ou e´gale a` n des racines de DAG≺). Par induction, le
+temps ne´cessaire a` la stabilisation de l’algorithme est proportionnel a` la hauteur du
+DAG≺.
+Nous prouvons maintenant que la hauteur du DAG≺ est borne´e par une constante. Les
+couleurs des nœuds sont borne´es par une constante |Ω|. Le nombre d’areˆtes dans le
+1-voisinage d'un nœud est borné par $\Delta^2$, le nombre de 1-voisins est borné par $\Delta$,
+d'où le nombre de valeurs possibles pour la densité est au plus de $\Delta^3$. Le nombre de
+couples (densité, couleur) possibles pour un nœud est $|\Omega|\Delta^3$, lui-même borné par une
+constante. Ainsi, la hauteur du DAG≺ est elle aussi bornée par une constante.
+L’algorithme stabilise en un temps proportionnel a` la hauteur du DAG≺, celle-ci e´tant
+constante. Donc le temps de stabilisation est lui aussi borne´ par une constante. 
+3.8.5 Validation des proprie´te´s auto-stabilisantes
+Comme mentionne´ dans la section 3.8.1, nous supposons l’existence d’une constante
+τ > 0 telle que chaque nœud est en mesure de diffuser localement une trame et d’en
+recevoir une de chacun de ses voisins en un temps borne´, appele´ une e´tape de temps.
+Apre`s une e´tape, chaque nœud connaıˆt ses 1-voisins. Apre`s deux e´tapes, il connaıˆt ses
+2-voisins et peut calculer sa valeur de densite´ et apre`s trois e´tapes, il connaıˆt son pe`re.
+Le nombre d’e´tapes ne´cessaires a` un nœud pour connaıˆtre l’identite´ de son cluster-head
+de´pend directement de la distance qui l’en se´pare et est borne´ par la hauteur de l’arbre
+auquel il appartient.
+Les simulations mene´es ici nous ont permis d’e´valuer l’importance de l’introduction
+des couleurs. Le mode`le de simulation est toujours celui de´crit dans le chapitre 1.1.
+Les nœuds sont de´ploye´s suivant un Processus de Points de Poisson avec diffe´rentes
+valeurs de λ et de R.
+L’allocation des couleurs se fait suivant l’Algorithme N1. Chaque nœud se choisit
+aléatoirement une couleur entre 0 et $|\Omega| = \Delta^2$ (avec $\Delta = \max_{v \in V} \delta(v)$). Il com-
+pare alors sa couleur a` celle de ses voisins. Si deux voisins ont la meˆme couleur, le
+nœud dont la couleur est la plus petite se choisit une autre couleur et ainsi de suite jus-
+qu’a` ce qu’il n’existe aucune paire de nœuds voisins portant la meˆme couleur. A` partir
+de la`, les clusters sont construits suivant l’algorithme 1 en utilisant les couleurs comme
+crite`re de de´cision finale.
+Les caracte´ristiques des clusters obtenus sont donne´es dans la table 3.11 pour λ = 1000
+et diffe´rentes valeurs deR. Bien que donne´s pourλ = 1000, les re´sultats sont similaires
+quelle que soit la valeur de λ.
+On remarque que quel que soit R (et donc le degre´ δ des nœuds), l’excentricite´
+moyenne des cluster-heads et la hauteur des arbres varient peu. Cela confirme notre
+hypothe`se stipulant que la transmission de l’identite´ du chef de cluster se fait en un
+3.8. ANALYSE DE L’AUTO-STABILISATION 51
+temps constant. On notera e´galement que dans un tel cas ou` les densite´s et identifiants
+des nœuds sont uniforme´ment distribue´s, l’utilisation des couleurs n’apporte pas grand
+chose. Cela est duˆ au fait que dans une telle distribution, les nœuds utilisent uniquement
+les densite´s pour de´terminer leur pe`re puisqu’elles sont rarement e´gales.
+R = 0.05 (δ = 7.85) R = 0.08 (δ = 20.11) R = 0.1 (δ = 31.42)
+Couleurs avec sans avec sans avec sans
+Nb clusters 61.0 61.4 19.2 19.5 11.7 11.7
+e˜(H(u)/C(u)) 2.6 2.6 3.1 3.1 3.2 3.2
+Hauteur arbre-cluster 2.7 2.7 3.3 3.3 3.5 3.5
+TAB. 3.11 – Caracte´ristiques des clusters pour une topologie ge´ome´trique ale´atoire
+avec λ = 1000.
+Conside´rons maintenant un sce´nario ou` les nœuds sont distribue´s dans une grille avec
+des identifiants allant croissant de la gauche vers la droite et du bas vers le haut. Dans
+ce cas, tous les nœuds inte´rieurs de la grille ont la meˆme valeur de densite´ et le meˆme
+degre´. Le seul moyen de choisir leur pe`re est d’utiliser les identifiants. Comme ceux-
+ci sont mal re´partis, tous les nœuds vont finalement s’attacher au meˆme cluster-head,
+comme le montre le tableau 3.12. Dans un pareil cas, on remarquera que l’introduction
+des couleurs est utile car elle permet de re´duire de fac¸on drastique le nombre d’e´tapes
+ne´cessaires avant la stabilisation (puisqu’elle re´duit fortement la hauteur des arbres de
+clustering) et de construire des clusters plus adapte´s. La figure 3.15 montre un exemple
+de clusters obtenus pourR = 0.05. Les cluster-heads apparaissent en bleu, une couleur
+par cluster. Sur la figure 3.15(a), les couleurs ne sont pas utilise´es et seulement un
+cluster est cre´e´. Sur la figure 3.15(b), les couleurs sont conside´re´es et plusieurs clusters
+homoge`nes sont cre´e´s.
+Grille 32× 32 Grille 18× 18 Grille 15× 15
+Couleurs avec sans avec sans avec sans
+Nb clusters 52.8 1.0 29.3 1.0 18.5 1.0
+e˜(H(u)/C(u)) 3.4 29.1 4.1 19.1 3.6 6.5
+Hauteur arbres-cluster 3.7 83.4 4.7 100.5 4.5 32.1
+TAB. 3.12 – Caracte´ristiques des clusters forme´s sur une grille a` 8 voisins.
+Dans cette partie, nous avons introduit un me´canisme supple´mentaire dans la construc-
+tion des clusters qui permet a` notre algorithme de se stabiliser en un temps rapide
+et borne´ et ce, quelle que soit la topologie sous-jacente. Ce caracte`re local d’auto-
+stabilisation apporte une stabilite´ a` notre algorithme et une robustesse face aux pannes
+et attaques. En effet, lorsqu’un tel phe´nome`ne survient, l’auto-stabilisation permet au
+re´seau de ne pas eˆtre impacte´ dans son ensemble par la cassure de liens. Les nœuds
+sont capables d’isoler la faute et de la re´parer.
+52 CHAPITRE 3. ALGORITHME DE CLUSTERING
+(a) sans utiliser les couleurs (b) en conside´rant les couleurs
+FIG. 3.15 – Exemple de constructions obtenues pour des grilles a` 8 voisins.
+3.9 Conclusion
+Dans ce chapitre, nous avons introduit une nouvelle me´trique qui permet d’organiser
+un re´seau sans fil multi-sauts en clusters. Nous avons ensuite analyse´ cette me´trique
+analytiquement et par simulation, ainsi que la structure de clusters qu’elle permet de
+construire. L’algorithme de clustering et le calcul de cette me´trique sont locaux, dis-
+tribue´s et ne ne´cessitent la connaissance que du voisinage a` deux sauts pour chaque
+nœud. Ils sont donc peu couˆteux et permettent une maintenance locale donc rapide.
+L’algorithme de clustering ne repose sur aucun parame`tre fixe´ a priori et a e´te´ prouve´
+auto-stabilisant en un temps borne´ et constant. La structure de clusters forme´e pre´sente
+d’inte´ressantes caracte´ristiques. Compare´e a` d’autres algorithmes de la litte´rature, elle
+s’ave`re plus robuste face a` la mobilite´ des nœuds et s’adapte mieux a` la topologie sous-
+jacente.
+Tout re´seau doit permettre aux entite´s de communiquer et ne´cessite pour cela un pro-
+tocole de routage/localisation et un processus de diffusion de messages. Graˆce aux
+caracte´ristiques de notre structure de clusters que nous avons de´gage´es au travers de
+nos e´tudes et analyses, nous avons pu proposer deux utilisations de la structure qui
+tirent avantage de ces proprie´te´s : un processus de diffusion (chapitre 4) et un proces-
+sus de localisation et de routage (chapitre 5) pour permettre aux entite´s du re´seau de
+communiquer.
+3.10. PUBLICATIONS 53
+3.10 Publications
+1. Colloques et confe´rences internationaux avec comite´ de lecture :
+(a) Self-stabilization in self-organized Multihop Wireless Networks. Nathalie
+Mitton, E´ ric Fleury, Isabelle Gue´rin-Lassous and Se´bastien Tixeuil. Work-
+shop on Wireless Ad Hoc Networking (WWAN’05), Juin 2005, Columbus,
+Ohio, USA.
+(b) Self-organization in large scale ad hoc networks. Nathalie Mitton, Anthony
+Busson and E´ ric Fleury. Mediterranean Ad Hoc Networking Workshop
+(MED-HOC-NET’04), Juin 2004, Bodrum, Turquie.
+2. Colloques et confe´rences nationaux :
+(a) Auto-stabilisation dans les re´seaux ad hoc. Nathalie Mitton, E´ ric Fleury,
+Isabelle Gue´rin-Lassous et Se´bastien Tixeuil. ALGOTEL’05, Mai 2005,
+Presqu’ıˆle de Giens, France.
+(b) Auto-organisation dans les re´seaux ad-hoc a` grandes e´chelles. Nathalie
+Mitton, Anthony Busson et E´ ric Fleury. ALGOTEL’04, Mai 2004, Batz-
+sur-mer, France.
+(c) Auto-organisation dans les re´seaux ad-hoc a` grandes e´chelles. Natha-
+lie Mitton et E´ ric Fleury. Journe´es Graphes Re´seaux et Mode´lisation,
+GRM’03, De´cembre 2003, Paris, France.
+3. Rapports de recherche :
+(a) On Fast Randomized Colorings in Sensor Networks. Nathalie Mitton, E´ ric
+Fleury, Isabelle Gue´rin-Lassous and Bruno Se´ricola and Se´bastien Tixeuil.
+LRI-1416. Juin 2005.
+(b) Self-stabilization in self-organized Multihop Wireless Networks. Nathalie
+Mitton, E´ ric Fleury, Isabelle Gue´rin-Lassous and Se´bastien Tixeuil. RR-
+5426. De´cembre 2004.
+(c) Analysis of the Self - organization in Multi-hops wireless networks. Natha-
+lie Mitton, Anthony Busson and E´ ric Fleury. RR-5328. Octobre 2004.
+(d) Self-organization in large scale ad hoc networks. Nathalie Mitton and E´ ric
+Fleury. RR-5042. De´cembre 2003.
+4. Se´minaires, pre´sentations, expose´s :
+(a) Auto-organisation dans les re´seaux ad hoc grandes e´chelles. Nathalie Mit-
+ton, E´ ric Fleury. Se´minaire ACI Pair a` Pair - Arcachon - France - 6-7 Mai
+2004.
+54 CHAPITRE 3. ALGORITHME DE CLUSTERING
+3.11 Annexes
+3.11.1 Analyse de la densite´ moyenne
+Nous donnons ici la preuve du lemme 1 qui donne la valeur moyenne de la 1-densite´
+d’un nœud :
+Lemme 1 La 1-densité moyenne de tout nœud $u$ est :
+\[ \tilde{\rho}(u) = E^o[\rho(0)] = 1 + \frac{1}{2} \left( \pi - \frac{3\sqrt{3}}{4} \right) \left( \lambda R^2 - \frac{1 - \exp\{-\lambda \pi R^2\}}{\pi} \right) \]
+Preuve 4 Soit $(Y_i)_{i=1,..,\Phi(B'_0)}$ chacun des points de $\Phi$ se trouvant dans $B'_0$. Par
+définition de la densité, on a :
+\[ E^o[\rho(0)] = 1 + E^o\left[ \frac{1}{2} \sum_{i=1}^{\Phi(B'_0)} \frac{\Phi(B'_0 \cap B'_{Y_i})}{\Phi(B'_0)} \right] \]
+$B'_u$ est la boule centrée en $u$ de rayon $R$, privée du singleton $\{u\}$ : $B'_u = B(u,R) \setminus \{u\}$.
+$\Phi(B'_0 \cap B'_{Y_i})$ correspond au nombre de voisins communs aux nœuds 0
+et Yi. En faisant ainsi la somme des voisins communs a` 0 et Yi pour tous les Yi, on ob-
+tient le nombre de liens entre les voisins de 0. Cependant, chaque lien est ainsi compte´
+deux fois (un lien entre Yi et Yj est compte´ quand on conside`re Yi voisin commun de
+Yj et 0 et quand on conside`re Yj voisin commun de 0 et Yi). C’est pourquoi on se doit
+de diviser cette somme par 2.
+Nous supposons que $\rho(0) = 1$ si le nœud 0 n'a aucun voisin ($\Phi(B'_0) = 0$). Nous
+conditionnons par la valeur du degré du nœud 0 : $\delta(0) = \Phi(B'_0)$. Nous obtenons
+alors :
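+\begin{align*}
+E^o[\rho(0)] &= E^o[\rho_0 \mid \delta_0 = 0]\, P^o(\delta_0 = 0) + \sum_{k=1}^{+\infty} E^o[\rho_0 \mid \delta_0 = k]\, P^o(\delta_0 = k) \\
+&= 1 + \sum_{k=1}^{+\infty} E^o\left[ \frac{1}{2} \sum_{i=1}^{\Phi(B'_0)} \frac{\Phi(B'_0 \cap B'_{Y_i})}{\Phi(B'_0)} \,\middle|\, \Phi(B'_0) = k \right] P^o(\Phi(B'_0) = k) \\
+&= 1 + \sum_{k=1}^{+\infty} \sum_{i=1}^{k} \frac{1}{2} \frac{1}{k}\, E^o\left[ \Phi(B'_0 \cap B'_{Y_i}) \,\middle|\, \Phi(B'_0) = k \right] \times P^o(\Phi(B'_0) = k) \qquad (3.2)
+\end{align*}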
+Les nœuds $(Y_i)_{i=1,..,k}$ étant indépendants et uniformément distribués dans $B'_0$,
+l'espérance $E^o\left[ \Phi(B'_0 \cap B'_{Y_i}) \mid \Phi(B'_0) = k \right]$ est la même pour tout $i$, $i = 1, .., k$
+3.11. ANNEXES 55
+(et donc pour tout voisin $Y_i$ de 0). On note $\nu(S)$ la mesure de Lebesgue de la
+région du plan $S$ dans $\mathbb{R}^2$. Connaissant $\nu(B'_0 \cap B'_{Y_i})$ et sachant que $\Phi(B'_0) = k$,
+alors le nombre de nœuds dans $B'_0 \cap B'_{Y_i}$ suit une loi binomiale de paramètre
+$\left( k - 1,\ \frac{\nu(B'_0 \cap B'_{Y_i})}{\nu(B'_0)} \right)$.
+Le nombre moyen de points devient : $(k - 1)\, \frac{\nu(B'_0 \cap B'_{Y_i})}{\nu(B'_0)}$.
+D’ou`, pour tout i = 1, .., k :
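+\begin{align*}
+E^o\left[ \Phi(B'_0 \cap B'_{Y_i}) \,\middle|\, \Phi(B'_0) = k \right] &= \frac{k - 1}{\pi R^2}\, E^o\left[ \nu(B'_0 \cap B'_{Y_i}) \,\middle|\, \Phi(B'_0) = k \right] \\
+&= \frac{k - 1}{\pi R^2}\, E^o\left[ \nu(B'_0 \cap B'_{Y_i}) \right] \qquad (3.3)
+\end{align*}
+Cette égalité 3.3 vient du fait que la surface $\nu(B'_0 \cap B'_{Y_i})$ ne dépend pas du nombre
+de $Y_i$, puisque les nœuds $Y_i$ sont indépendants.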
+Si on pose que le nœud $Y_i$ est à une distance $r$ du nœud 0, l'aire de l'intersection
+$B'_0 \cap B'_{Y_i}$ devient
+\[ \nu(B'_0 \cap B'_{Y_i}) = A(r) = 2R^2 \arccos\left( \frac{r}{2R} \right) - r \sqrt{R^2 - \frac{r^2}{4}}, \]
+comme illustré sur la figure 3.4.
+Puisque les $Y_i$ sont uniformément distribués dans $B'_0$, la valeur moyenne de l'aire
+d'intersection est :
+\[ E^o\left[ \nu(B'_0 \cap B'_{Y_i}) \right] = E^o[A(r)] = \int_0^{2\pi} \int_0^R \frac{A(r)}{\pi R^2}\, r\, dr\, d\theta = R^2 \left( \pi - \frac{3\sqrt{3}}{4} \right) \]
+Soit p la probabilite´ que deux voisins de 0 soient eux-meˆmes voisins. p est la valeur
+moyenne de l’aire d’intersection divise´e par la surface totale ou` peuvent se trouver les
+voisins de 0 ($\pi R^2$). On a :
+\[ p = P(Y_2 \in B_0 \cap B_{Y_1}) = \frac{2}{\pi} \int_{u=0}^{1} \left( 2 \arccos\frac{u}{2} - u \sqrt{1 - \frac{u^2}{4}} \right) u\, du = 1 - \frac{3\sqrt{3}}{4\pi} \approx 0.5865 \]
+56 CHAPITRE 3. ALGORITHME DE CLUSTERING
+Ce re´sultat combine´ a` celui de l’e´quation 3.2 nous donne :
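+\begin{align*}
+E^o[\rho(0)] &= 1 + \sum_{k=1}^{+\infty} \sum_{i=1}^{k} \frac{1}{2} \frac{1}{k} \frac{k - 1}{\pi} \left( \pi - \frac{3\sqrt{3}}{4} \right) P^o(\Phi(B'_0) = k) \\
+&= 1 + \sum_{k=1}^{+\infty} \frac{1}{2} \frac{k - 1}{\pi} \left( \pi - \frac{3\sqrt{3}}{4} \right) P^o(\Phi(B'_0) = k) \\
+&= 1 + \frac{1}{2\pi} \left( \pi - \frac{3\sqrt{3}}{4} \right) \times \left( \sum_{k=1}^{+\infty} k\, P^o(\Phi(B'_0) = k) - \sum_{k=1}^{+\infty} P^o(\Phi(B'_0) = k) \right) \\
+&= 1 + \frac{1}{2\pi} \left( \pi - \frac{3\sqrt{3}}{4} \right) \left( \lambda \pi R^2 - \left( 1 - \exp\{-\lambda \pi R^2\} \right) \right) \qquad (3.4)
+\end{align*}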
+L'égalité 3.4 découle du théorème de Slivnyak dont l'une des conséquences est que
+le nombre de voisins $\Phi(B'_0)$ de 0, sous la probabilité de Palm, suit une loi de Poisson
+discrète de paramètre $\lambda \pi R^2$. 
+3.11.2 Calcul analytique du nombre de clusters
+Nous donnons ici les calculs de´taille´s de la borne du nombre de clusters donne´ dans le
+the´ore`me 1. Nous bornons la probabilite´ qu’un nœud soit chef.
+Conjecture 1 Une borne supe´rieure pour la probabilite´ qu’un nœud soit chef est :
+\[ P^o_\Phi\left( \rho(0) > \max_{k=1,..,\Phi(B_0)} \rho(Y_k) \right) \leq \left( 1 + \sum_{n=1}^{+\infty} \frac{1}{n} \frac{(\lambda \pi R^2)^n}{n!} \right) \exp\{-\lambda \pi R^2\} \]
+Preuve 5 Calculer la probabilite´ pour un nœud d’eˆtre chef revient a` calculer la pro-
+babilite´ pour un nœud d’avoir la plus forte densite´ dans son voisinage.
+Nous considérons le point 0. Soient $B_0 = B(0, R)$ la boule de rayon $R$ centrée en 0
+et $B'_0$ la boule de rayon $R$ centrée en 0 privée du singleton $\{0\}$. Soit $(Y_i)_{i=1,..,\Phi(B'_0)}$
+chacun des points de $\Phi$ se trouvant dans $B'_0$.
+La densité des points de $B_0$ est équi-distribuée puisque les positions de ces points sont
+uniformément et indépendamment distribuées dans $B_0$. D'où :
+\[ P^o\left( \rho(Y_i) > \max_{k=1,..,n;\, k \neq i} \rho(Y_k) \,\middle|\, \Phi(B'_0) = n \right) \leq \frac{1}{n} \]
+Si le point 0 n'a aucun voisin ($\Phi(B'_0) = 0$), 0 est un cluster-head.
+3.11. ANNEXES 57
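+Nous avons :
+\begin{align*}
+& P^o\left( \rho(0) > \max_{k=1,..,\Phi(B'_0)} \rho(Y_k) \right) \\
+&\quad = P^o\left( \rho(0) > \max_{k=1,..,\Phi(B'_0)} \rho(Y_k) \,\middle|\, \Phi(B'_0) > 0 \right) P^o\left( \Phi(B'_0) > 0 \right) + P^o\left( \Phi(B'_0) = 0 \right)
+\end{align*}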
+On note :
+\[ p_0 = P^o\left( \rho(0) > \max_{k=1,..,\Phi(B'_0)} \rho(Y_k) \,\middle|\, \Phi(B'_0) > 0 \right) \times P^o\left( \Phi(B'_0) > 0 \right) \]
+Si nous supposons que les densités sont équi-distribuées, nous avons :
+\[ p_0 < P^o\left( \rho(Y_1) > \max\left( \rho(0), \max_{k=2,..,\Phi(B'_0)} \rho(Y_k) \right) \,\middle|\, \Phi(B'_0) > 0 \right) \times P^o\left( \Phi(B'_0) > 0 \right) \]
+Il s’agit d’une conjecture, en effet nous n’avons pas re´ussi a` de´montrer ce re´sultat.
+Cependant d’apre`s nos simulations, quelle que soit la densite´ des nœuds, la quantite´
+p0 est deux a` trois fois plus petite que le terme de droite de cette ine´galite´.
+De plus, comme l’e´ve`nement
+\[ E_1 = \left\{ \rho(Y_1) > \max\left( \rho(0), \max_{k=2,..,\Phi(B'_0)} \rho(Y_k) \right) \right\} \]
+est inclus dans l'évènement
+\[ E_2 = \left\{ \rho(Y_1) > \max_{k=2,..,\Phi(B'_0)} \rho(Y_k) \right\} \]
+nous pouvons majorer la probabilite´ que E1 se produise par la probabilite´ que E2 se
+re´alise. Nous obtenons :
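+\begin{align*}
+p_0 &\leq P^o[E_1] \times P^o\left( \Phi(B'_0) > 0 \right) \leq P^o[E_2] \times P^o\left( \Phi(B'_0) > 0 \right) \\
+p_0 &\leq P^o\left( \rho(Y_1) > \max_{k=2,..,\Phi(B'_0)} \rho(Y_k) \,\middle|\, \Phi(B'_0) > 0 \right) \times P^o\left( \Phi(B'_0) > 0 \right) \\
+&= \sum_{n=1}^{+\infty} P^o\left( \rho(Y_1) > \max_{k=2,..,\Phi(B'_0)} \rho(Y_k) \,\middle|\, \Phi(B'_0) = n \right) \times P^o\left( \Phi(B'_0) = n \right) \\
+&\leq \sum_{n=1}^{+\infty} \frac{1}{n} \frac{(\lambda \pi R^2)^n}{n!} \exp\{-\lambda \pi R^2\}
+\end{align*}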
+58 CHAPITRE 3. ALGORITHME DE CLUSTERING
+De plus, d'après le théorème de Slivnyak [76], le nombre de points sous la distribution
+de Palm dans un espace Borélien de $\mathbb{R}^2$ qui ne contient pas le point 0, suit une loi de
+Poisson discrète. Nous en déduisons :
+\[ P^o\left( \rho(0) > \max_{k=1,..,\Phi(B_0)} \rho(Y_k) \right) \leq \exp\{-\lambda \pi R^2\} + \sum_{n=1}^{+\infty} \frac{1}{n} \frac{(\lambda \pi R^2)^n}{n!} \exp\{-\lambda \pi R^2\} \]
+
+Comme, d'après le lemme 3, le nombre de clusters est tel que
+$E[\text{Nb de clusters dans } C] = \lambda \nu(C)\, P^o_\Phi(0 \text{ est chef})$, on obtient une borne supérieure
+pour le nombre de clusters formés par notre algorithme dans une surface $C$ :
+\[ E[\text{Nb de clusters dans } C] \leq \lambda \nu(C) \left( \exp\{-\lambda \pi R^2\} + \sum_{n=1}^{+\infty} \frac{1}{n} \frac{(\lambda \pi R^2)^n}{n!} \exp\{-\lambda \pi R^2\} \right) \]
+3.11.3 Temps de transmission borne´
+Dans cette partie, nous justifions l’hypothe`se suivante : ”il existe une constante τ > 0
+telle que chaque nœud est en mesure de diffuser localement une trame et d’en recevoir
+une de chacun de ses voisins en un temps borne´ ∆(τ)” faite dans la section 3.8.5 pour
+prouver le caracte`re d’auto-stabilisation de notre algorithme.
+Dans [83], les auteurs fournissent une analyse des performances du protocole IEEE
+802.11 pour la couche MAC des re´seaux sans fil. En conside´rant un graphe a` n stations,
+toutes a` porte´e de transmission les unes des autres (c.a`.d. que le graphe de communica-
+tion est complet), les auteurs mode´lisent l’activation de la pe´riode de contention par les
+nœuds avant l’e´mission d’une trame. La dure´e de cette pe´riode de´pend des collisions
+qui ont pu se produire pour cette trame auparavant. On trouve en particulier dans ce
+papier la probabilite´ Psuc qu’il y ait une transmission re´ussie parmi les n stations en un
+slot de temps donne´. Une transmission est conside´re´e comme re´ussie si exactement une
+station e´met pendant cette pe´riode de temps. Si pc est la probabilite´ qu’il y ait au moins
+un paquet transmis sur le me´dium parmi les n stations (pc est aussi donne´ dans [83]),
+nous avons :
+\[ P_{suc} = (n - 1)\left( (1 - p_c)^{(n-2)/(n-1)} + p_c - 1 \right) \]
+Nous montrons maintenant que le temps moyen au bout duquel tous les voisins d’un
+nœud ont e´mis avec succe`s, est borne´ par une constante. Soit X la variable ale´atoire
+de´signant le nombre de slots de temps ne´cessaire pour que n stations arrivent a` e´mettre
+avec succe`s. Dans le meilleur cas, chaque station parle a` tour de roˆle. Ceci donne :
+$P[X < n] = 0$ et $P[X = n] = P_{suc}^{n}$.
+P [X = k, k > n] est la probabilite´ qu’a` la fin des (k−1) premiers slots, (n−1) stations
+ont émis avec succès et que la $n^{\text{ième}}$ station réussit à transmettre sa trame durant le slot
+k. Nous avons :
+3.11. ANNEXES 59
+\[ P[X = k, k > n] = \binom{k-1}{k-n+1} \binom{n}{n-1} (1 - P_{suc})^{(k-n+1)} P_{suc}^{n} \]
+Les n − 1 premie`res stations ont e´mis pendant les k − 1 premiers slots. On conside`re
+donc la probabilite´ de choisir k − (n− 1) slots parmi les k − 1 premiers slots pendant
+lesquels aucune transmission n’a eu lieu ou une collision est apparue, multiplie´ par le
+nombre de possibilités de choisir la $n^{\text{ième}}$ station qui émet durant le $k^{\text{ième}}$ slot.
+On en de´duit le nombre moyen de slots ne´cessaire E [X ] pour que chacune des n sta-
+tions parvienne a` e´mettre avec succe`s.
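+\begin{align*}
+E[X] &= \sum_{k=0}^{\infty} k\, P[X = k] \\
+&= n\, P[X = n] + \sum_{k=n+1}^{\infty} k\, P[X = k] \\
+&= P_{suc}^{n} \times \left( n + \sum_{k=n+1}^{\infty} k \binom{k-1}{k-n+1} \binom{n}{n-1} (1 - P_{suc})^{(k-n+1)} \right)
+\end{align*}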
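+Ceci peut être dérivé en :
+\begin{align*}
+E[X] &= P_{suc}^{n} \left( n + n(n+1) \left( \frac{1}{P_{suc}^{n}} - (n+1) + n P_{suc} \right) \right) \\
+&= n P_{suc}^{n} \left( 1 + (n+1) \left( \frac{1}{P_{suc}^{n}} - (n+1) + n P_{suc} \right) \right)
+\end{align*}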
+Ainsi, comme Psuc de´pend uniquement de n et que nous supposons n borne´ par une
+constante, E [X ] est aussi constant. D’ou` notre hypothe`se stipulant ”une constante τ >
+0 telle que chaque nœud est en mesure de diffuser localement une trame et d’en recevoir
+une de chacun de ses voisins en un temps borne´ ∆(τ)”.
+60 CHAPITRE 3. ALGORITHME DE CLUSTERING
+Chapitre 4
+Diffusion
+4.1 Introduction
+Comme nous avons pu le constater, auto-organiser un re´seau sans fil tel un re´seau
+ad hoc ou de capteurs, pre´sente de nombreux avantages. Cependant, de tels re´seaux
+ne´cessitent e´galement un me´canisme efficace de diffusion d’information. La diffusion
+(ou broadcast) consiste a` transmettre un message depuis un nœud source vers l’en-
+semble des entite´s du re´seau. Une telle ope´ration est employe´e par la grande majorite´
+des protocoles de routage (pour la de´couverte des routes entre les entite´s du re´seau).
+Cette ope´ration s’ave`re aussi utile a` une station de base dans un re´seau de capteurs lors
+de la diffusion d’une requeˆte ou de mise a` jour logicielle sur tous les capteurs. Cette
+ope´ration, indispensable donc a` tout re´seau sans fil, a fait l’objet de nombreux travaux
+avec, comme but premier, la re´duction du nombre de nœuds retransmettant le message
+lors de sa diffusion a` l’ensemble du re´seau.
+Les bonnes proprie´te´s d’un protocole de diffusion efficace sont les suivantes :
+– extensibilite´ : il supporte le passage a` l’e´chelle ;
+– accessibilite´ : une grande majorite´ des nœuds du re´seau joignables par la source
+(appartenant a` la meˆme composante connexe) rec¸oit le message (plus de 90%) ;
+– e´conome : l’e´nergie et la bande passante consomme´es sont minimise´es (le nombre
+de messages retransmis et de re´ceptions redondantes est re´duit).
+E´ tant donne´ qu’un re´seau sans fil ne´cessite a` la fois une auto-organisation et un pro-
+tocole de diffusion, nous proposons d’utiliser la structure d’arbres forme´e par l’algo-
+rithme 1, non seulement pour organiser le re´seau en clusters, mais e´galement pour
+e´tablir une base propice a` une diffusion efficace, tirant avantage de certaines de ses
+caracte´ristiques. Ainsi, une seule structure est cre´e´e pour deux ope´rations : l’organi-
+sation et la diffusion. Notre algorithme de diffusion n’autorise que les nœuds internes
+des arbres a` retransmettre le message. Comme nous l’avons constate´ dans le chapitre 3,
+une grande proportion des nœuds sont des feuilles (environ 75%). Par conse´quent, une
+diffusion base´e sur un tel ensemble n’autorise que peu de nœuds a` e´mettre. L’ensemble
+61
+62 CHAPITRE 4. DIFFUSION
+des arbres de clustering forme une foreˆt couvrante, donc un ensemble ou` tout nœud
+est soit un nœud interne, soit directement voisin d’un nœud interne. Ne´anmoins, cet
+ensemble n’est pas connecte´ puisque les arbres sont inde´pendants. Pour que la diffu-
+sion touche toutes les entite´s du re´seau, il faut tout d’abord connecter ces arbres en
+e´tablissant des passerelles entre eux. Lors de la diffusion, seuls les nœuds internes et
+ceux constituant les passerelles seront autorise´s a` retransmettre le message. Notre algo-
+rithme permet deux types de diffusion : une diffusion ge´ne´rale d’un message a` tous les
+nœuds du re´seau mais e´galement une diffusion d’un message limite´e a` l’inte´rieur d’un
+cluster. Pour ce dernier cas de figure, comme la hauteur des arbres est petite et proche
+de l’optimal (excentricite´ du chef de cluster) et que les clusters sont proches de cellules
+de Voronoı¨ (chapitre 3), un nœud recevra rapidement une information provenant de son
+chef.
+Dans ce chapitre, nous de´crivons dans un premier temps notre algorithme de diffu-
+sion reposant sur la structure d’arbres ainsi que les algorithmes de se´lection des passe-
+relles. Nous donnons ensuite une analyse the´orique d’une diffusion dans tout le re´seau,
+montrant que le nombre de re´ceptions par nœud peut s’exprimer comme le produit
+des degre´s des relais par la probabilite´ pour un nœud d’eˆtre un relais. Les simulations
+viennent illustrer notre analyse the´orique, comparer sur divers aspects plusieurs proto-
+coles existant et en e´valuer la robustesse. E´ tonnamment, il apparaıˆt que les protocoles
+les plus fiables ne sont pas ceux produisant le plus de relais mais ceux dont les relais
+ont le plus fort degre´. Les comparaisons entre ces diffe´rents algorithmes montrent aussi
+que notre heuristique de diffusion pre´sente le meilleur compromis entre la consomma-
+tion d’e´nergie (nombre d’e´missions et re´ceptions) et la robustesse. Au cours de ces
+simulations, nous avons pu remarquer que l’heuristique de diffusion base´e sur les MPR
+(multi-points relais) de OLSR (voir section 4.2) pre´sentait tre`s peu de robustesse face
+a` la mobilite´ des nœuds. Afin de mieux comprendre le comportement des MPR, nous
+avons analyse´ cette heuristique plus en de´tail.
+La section 4.2 pre´sente quelques-unes des solutions de diffusion existant pour les
+re´seaux sans fil. La section 4.3 donne l’analyse the´orique de la diffusion, utilisant la
+ge´ome´trie stochastique et la distribution de Palm. La section 4.4 pre´sente la fac¸on dont
+nous utilisons la structure d’arbres sous-jacente afin de re´aliser une diffusion efficace.
+Nos comparaisons et e´valuations des diffe´rents algorithmes sont mene´es au travers des
+simulations de la section 4.5. La section 4.6 pre´sente l’analyse de la se´lection des MPR
+dans OLSR. Enfin, quelques remarques concluront ce chapitre (section 4.7).
+4.2 Les algorithmes de diffusion pour les re´seaux ad
+hoc dans la litte´rature
+Afin de pouvoir supporter une extension du re´seau, un protocole de diffusion dans
+les re´seaux sans fil se doit de limiter l’utilisation de la bande passante et la de´pense
+en e´nergie ; il doit donc minimiser le nombre de messages ge´ne´re´s tout en assurant
+qu’un maximum de nœuds connecte´s a` la source rec¸oivent le message (plus de 90%).
+Beaucoup de solutions ont e´te´ propose´es avec des hypothe`ses plus ou moins similaires
+4.2. E´TAT DE L’ART 63
+a` notre mode`le. Dans cette section, nous ne mentionnerons que ceux supposant les
+meˆmes hypothe`ses que nous, c’est a` dire qui supposent un mode`le a` antennes omni-
+directionnelles, sans controˆle de puissance. De plus, en supposant une couche MAC
+ide´ale (qui ne ge´ne`re aucune collision), on conside`re la diffusion efficace si tous les
+nœuds connecte´s a` la source rec¸oivent le message. Un e´tat de l’art plus complet concer-
+nant des solutions probabilistes, utilisant des antennes directionnelles ou conside´rant
+une couche MAC non ide´ale est donne´ dans [18].
+La me´thode de diffusion la plus triviale pour diffuser un message est l’inondation
+aveugle ou blind flooding : lorsqu’un nœud rec¸oit le message diffuse´ pour la premie`re
+fois, il le re´-e´met pour ses voisins. Ce me´canisme impose une charge e´norme au
+re´seau, engendrant un grand nombre de messages et de collisions, de´pensant beaucoup
+d’e´nergie et de bande passante. C’est pourquoi un tel me´canisme ne peut eˆtre envisage´
+pour un réseau dense ou étendu. Ceci a motivé la mise au point de protocoles de
+diffusion plus intelligents qui minimisent le nombre de re-transmissions ne´cessaires
+en n’autorisant qu’un sous-ensemble de nœuds a` transmettre. Pour cela, on cherche a`
+trouver un ensemble ”dominant”. En effet, afin que tous les nœuds du re´seau rec¸oivent
+le message, chacun des nœuds doit eˆtre soit un dominant, soit voisin d’un dominant. La
+difficulte´ est alors de trouver un tel ensemble dominant connexe de taille minimum qui
+minimise e´galement le nombre de re´ceptions redondantes d’un message retransmis par
+cet ensemble. Ce proble`me est montre´ NP-difficile [34]. I. Stojmenovic et J. Wu [75]
+ont propose´ une classification des protocoles de diffusion en fonction du type d’en-
+semble dominant qu’ils utilisent : cluster-based ou base´ sur la formation de clusters,
+ensemble dominant de´pendant de la source et ensemble dominant inde´pendant de la
+source.
+Les solutions cluster-based [28, 36] sont les plus anciennes. Ces protocoles sont plus
+de´taille´s dans le Chapitre 2. L’ide´e est que chaque nœud ayant le plus petit identifiant
+(protocole Linked Cluster Architecture - LCA) ou le plus fort degre´ (High Connec-
+tivity Clustering - HCC) dans son 1-voisinage se de´clare teˆte de cluster. Ses voisins
+s’attachent a` lui. Si un nœud s’attache a` plus d’un cluster-head, il devient une passe-
+relle. L’ensemble dominant connexe re´sultant comprend les cluster-heads et les passe-
+relles. Par la suite, des optimisations ont e´te´ propose´es afin de minimiser la mainte-
+nance pour e´viter des re´actions en chaıˆne e´tendues a` tout le re´seau lors de mouvements
+de nœuds [24] ou afin de limiter le nombre de passerelles et donc la taille de l’ensemble
+dominant [81].
+Dans les propositions base´es sur des ensembles dominants de´pendant de la source [49,
+65], les e´metteurs se´lectionnent parmi leurs voisins les nœuds qui relaieront le message.
+L’ensemble des relais ainsi choisis par un nœud u est aussi petit que possible et tel
+que, chaque nœud a` 2 sauts de u est voisin d’au moins un de ces relais. Pour e´tablir
+cette se´lection, u ne´cessite une connaissance de son 2-voisinage uniquement. Lors de la
+diffusion, u fera suivre le message diffuse´ qu’il rec¸oit de v, seulement s’il le rec¸oit pour
+la premie`re fois et a e´te´ choisi comme relais de v. Les diffe´rents algorithmes diffe`rent
+ensuite sur la se´lection des relais, le plus connu e´tant celui base´ sur les Multi-Points
+Relais (MPR) de OLSR [65]. Dans OLSR, les MPR sont e´galement utilise´s pour e´tablir
+les tables de routage. La structure de diffusion a donc un usage double. Nous de´taillons
+plus la se´lection des MPR dans la section 4.6.
+64 CHAPITRE 4. DIFFUSION
+Les protocoles de diffusion utilisant des ensembles dominants inde´pendants de la
+source se´lectionnent cet ensemble inde´pendamment du nœud initiateur de la diffusion.
+C’est le cas de notre algorithme. Les nœuds de´cident d’eux-meˆmes s’ils sont ou non
+dans cet ensemble, contrairement aux solutions base´es sur des ensembles dominants
+dépendant de la source, où la décision est prise par un autre nœud. Beaucoup de solu-
+tions de ce type ont e´te´ propose´es. Dans chacune d’elles, les nœuds ne ne´cessitent que
+la connaissance de leur 2-voisinage pour prendre leur de´cision. Un protocole simple
+et efficace est le NES (Neighbor Elimination-Based Scheme) de Wu et Li [80], qui se
+base sur l’e´limination de voisins. Dans ce sche´ma, un nœud u est dit interme´diaire
+si au moins deux de ses voisins v et w ne sont pas eux-meˆmes voisins (u est l’in-
+terme´diaire entre v et w). A` partir de la`, deux re`gles de se´lection sont applique´es sur les
+interme´diaires afin de re´duire leur nombre. Les nœuds restants deviennent les membres
+de l’ensemble dominant et donc les relais lors d’une diffusion. Les re`gles de se´lection
+se basent sur une valeur de priorite´. Dans la version originale du NES, cette valeur est
+l’identifiant des nœuds. Puis, plusieurs variantes ont e´te´ propose´es utilisant pour cette
+valeur le degre´ du nœud ou l’e´nergie restante [26, 74]. Les auteurs de [74] proposent
+un autre type d’algorithme base´ sur l’e´limination des voisins que l’on peut re´sumer
+par ”Wait and See”. Sur re´ception d’un message de diffusion, un nœud attend pendant
+un temps aléatoire. Durant cette période, il observe si un de ses voisins retransmet le
+message et dans ce cas, quels sont ses voisins recevant ainsi l’information. Si a` la fin de
+la pe´riode d’attente, il reste parmi ses voisins des nœuds n’ayant pas rec¸u le message,
+il l’e´met. Les auteurs de [19] ont ensuite propose´ une ame´lioration a` cet algorithme
+en conside´rant le RNG - Relative Neighborhood Graph (graphe de voisinage relatif)
+plutoˆt que le graphe re´el. Ces derniers sche´mas base´s sur l’e´limination de voisins (Wait
+& See et Wait & See base´ sur RNG) obtiennent d’excellentes performances en terme
+de nombre d’e´missions et de re´ceptions mais induisent une latence importante dans le
+processus de diffusion du fait de la pe´riode d’attente ale´atoire de chaque nœud.
+4.3 Analyse the´orique d’une diffusion dans un re´seau
+sans fil
+Comme nous avons pu le constater dans la section 4.2, la plupart des protocoles de
+diffusion visent a` re´duire le nombre de nœuds qui relaient le message, l’objectif princi-
+pal e´tant de minimiser l’e´nergie globale consomme´e pour diffuser le message. Comme
+les nœuds consomment de l’e´nergie non seulement pour transmettre mais aussi pour
+recevoir un message, un protocole de diffusion efficace en termes d’économie d’énergie
+doit chercher à minimiser $E$, avec $E = C_{tx} \times nb_{tx} + C_{ry} \times nb_{ry}$, où $C_{tx}$ (resp. $C_{ry}$)
+est le coût énergétique d’une transmission (resp. réception) d’un paquet et $nb_{tx}$ (resp.
+$nb_{ry}$) est le nombre de fois où le message est émis (resp. le nombre de réceptions).
+Or, les nœuds des re´seaux ad hoc utilisant la technologie 802.11 [31], tout comme les
+capteurs [63], ne´cessitent approximativement autant d’e´nergie pour recevoir que pour
+e´mettre (Cry ≈ Ctx) et donc, ni les re´ceptions ni les transmissions ne peuvent eˆtre
+ne´glige´es lors du bilan e´nerge´tique.
+4.3. ANALYSE THE´ORIQUE 65
+Dans cette analyse, nous nous sommes inte´resse´s au nombre moyen de fois ou` un
+nœud donne´ rec¸oit un meˆme message lors d’une diffusion. Comme dans les ana-
+lyses the´oriques pre´ce´dentes, nous utilisons les proprie´te´s des processus ponctuels
+et les meˆmes notations, a` savoir : Φ(S) repre´sente le nombre de points du proces-
+sus Φ distribués sur la surface S, $B(x,R)$ est la boule de rayon R centrée en x et
+$B'_x = B(x,R) \setminus \{x\}$.
+Nous notons r le nombre moyen de re´ceptions d’un meˆme message par un nœud (qu’il
+soit un relais ou non). Nous donnons deux re´sultats pour r dans les Propositions 1 et 2,
+que nous utiliserons par la suite afin de comparer les diffe´rents algorithmes de diffusion
+e´tudie´s. Les re´sultats de r donne´s par ces deux propositions sont semblables mais la
+Proposition 1 conside`re le mode`le particulier que nous utilisons dans les simulations,
+de´crit dans le Chapitre 1.1 alors que les re´sultats de la proposition 2 sont e´galement
+applicables a` une classe plus large de graphes ale´atoires. Dans les deux cas, nous ne
+donnons ici que l’ide´e ge´ne´rale de la preuve, les preuves et calculs de´taille´s se trouvant
+en Annexes 4.9.
+Pour la Proposition 1, nous conside´rons un processus ponctuel stationnaire Φ d’inten-
+site´ λ > 0. Deux points (x, y) de Φ sont connecte´s (et donc voisins) si et seulement si
+la distance Euclidienne les se´parant est infe´rieure ou e´gale a` R (d(x, y) ≤ R), R e´tant
+le rayon de transmission radio des nœuds (mode`le de graphe ge´ome´trique ale´atoire).
+Proposition 1 Étant donné un processus ponctuel stationnaire $\Phi$ d’intensité $\lambda$ ($\lambda > 0$),
+soit $\Phi_{Relay}$ d’intensité $\lambda_{Relay}$ un amincissement de $\Phi$. Les points de $\Phi_{Relay}$
+représentent les relais. Nous supposons que $\Phi_{Relay}$ est toujours un processus ponc-
+tuel stationnaire. Le nombre moyen de réceptions d’un même message par nœud $r$ est :
+$$r = \frac{\lambda_{Relay}}{\lambda}\, E^{o}_{\Phi_{Relay}}\left[\Phi(B'_0)\right]$$
+où $E^{o}_{\Phi}\left[\Phi_{Relay}(B'_0)\right]$ est l’espérance sous Palm par rapport au processus $\Phi$ (et donc
+la valeur moyenne du nombre de relais dans $B'_0$).
+La preuve de cette proposition est donne´e en annexes 4.9. Le nombre de re´ceptions
+d’un meˆme message rec¸u par un nœud de´pend du nombre de relais dans son voisinage.
+Le re´sultat s’interpre`te de la fac¸on suivante. Le nombre moyen de re´ceptions par nœud
+est le produit du degre´ moyen d’un relais par la probabilite´ pour un nœud donne´ d’eˆtre
+un relais (ou de fac¸on e´quivalente par le ratio du nombre de relais sur le nombre total
+de nœuds).
+Nous conside´rons maintenant des mode`les de graphes ale´atoires plus ge´ne´raux. Nous
+supposons que les degre´s des nœuds et le nombre de re´ceptions par nœud sont e´qui-
+distribués. À noter que nous ne supposons pas ces quantités indépendamment dis-
+tribue´es, ce qui fait que cette hypothe`se n’est pas restrictive. De plus, cette condition
+est ve´rifie´e par la plupart des graphes ale´atoires. Par exemple, un graphe ale´atoire de
+type Erdős et Rényi [29] qui consiste en n sommets entre lesquels des arêtes sont
+66 CHAPITRE 4. DIFFUSION
+place´es avec une probabilite´ uniforme p, inde´pendamment des autres areˆtes, ve´rifie nos
+hypothe`ses.
+Proposition 2 Étant donné un graphe aléatoire $G(V,E)$ et un ensemble de relais
+$Relay \subset V$ où les degrés des nœuds et des relais ainsi que le nombre de réceptions
+par nœud sont équi-distribués. Le nombre moyen de réceptions par nœud $r$ s’écrit :
+$$r = E\left[\delta(v_1) \mid v_1 \in Relay\right]\, P(v_1 \in Relay) \qquad (4.1)$$
+La preuve de cette proposition est donne´e en annexes 4.9. L’ide´e est de voir que le
+nombre de re´ceptions d’un meˆme message rec¸ues par un nœud correspond au nombre
+moyen de relais qu’il a dans son voisinage. On peut de´duire le re´sultat ci-dessus, pour
+un graphe ge´ne´ral (proposition 2). Il est le meˆme que pour un graphe ge´ome´trique
+ale´atoire (proposition 1) : le nombre moyen de re´ceptions par nœud est le produit du
+degre´ des relais par la probabilite´ d’eˆtre un relais. Dans l’e´galite´ 4.1, v1 est un nœud
+choisi ale´atoirement parmi l’ensemble des sommets V . Le choix de v1 n’a aucun im-
+pact sur les re´sultats puisque la probabilite´ pour un nœud d’eˆtre un relais lors de la
+diffusion est e´qui-distribue´e et est la meˆme pour v1 que pour tout autre nœud du graphe.
+Dans cette analyse, nous avons montre´ que le nombre moyen de re´ceptions par nœud
+est le produit du degre´ moyen des relais par la proportion des relais. Si n est le nombre
+de nœuds dans le re´seau et proptx la proportion des relais (nbtx = n×proptx), l’e´nergie
+globale consomme´e s’e´crit :
+$$E = n \times C_{ry} \times prop_{tx} \left(p + \delta_{Relay}\right)$$
+ou` p de´pend du type de technologie utilise´e par les nœuds radio (p ≈ 1 pour les cap-
+teurs [63], p ≈ 4 pour les nœuds utilisant la technologie 802.11 [31]). Il en ressort
+clairement que pour diminuer E, il faut jouer sur les parame`tres δRelay et proptx.
+4.4 Notre contribution a` la diffusion
+Dans cette section, nous introduisons dans un premier temps un algorithme permet-
+tant l’e´lection de nœuds passerelles entre nos clusters. Puis, dans un second temps,
+nous donnons l’algorithme permettant d’appliquer deux types de diffusion sur notre
+organisation en arbres : un algorithme de diffusion globale (dans tout le re´seau) et un
+algorithme de diffusion dans un cluster.
+4.4.1 Se´lection des passerelles
+On appelle nœud frontie`re un nœud comptant parmi ses voisins au moins un
+repre´sentant d’un ou plusieurs clusters autres que le sien.
+Une passerelle Gateway(C(u), C(v)) = 〈x, y〉 entre deux clusters voisins C(u) et C(v)
+est une paire de nœuds frontie`res 〈x, y〉 telle que x ∈ C(u), y ∈ C(v) et x ∈ Γ1(y).
+4.4. NOTRE CONTRIBUTION A` LA DIFFUSION 67
+c b h e
+j
+l
+d
+g
+i
+a k
+f m
+FIG. 4.1 – Exemple d’arbres de clustering forme´s par la me´trique de densite´.
+Dans une telle paire, on appelle le nœud x le nœud passerelle x = GW (C(u), C(v))
+et le nœud y le nœud miroir de la passerelle y = GWm(C(u), C(v)). Ces passe-
+relles sont oriente´es dans le sens ou` il existe une passerelle permettant a` C(u) de
+joindre C(v) ( Gateway(C(u), C(v))) et une autre qui permet a` C(v) de joindre C(u)
+(Gateway(C(v), C(u))), ces deux passerelles pouvant eˆtre diffe´rentes.
+Notre algorithme de se´lection des passerelles se de´roule en deux e´tapes. Dans un pre-
+mier temps, chaque nœud frontière choisit localement son miroir dans les clusters
+voisins. Un nœud frontie`re et son miroir forment alors une paire de nœuds candidate
+au titre de passerelle. Dans un second temps, l’algorithme se´lectionne parmi ces paires
+candidates, la paire la plus ade´quate au roˆle de passerelle. Comme les nœuds de la
+passerelle seront invite´s a` re-transmettre un message diffuse´ dans tout le re´seau, l’algo-
+rithme de se´lection favorise l’e´lection des nœuds internes afin de minimiser le nombre
+d’e´metteurs. En effet, les nœuds internes appartiennent de´ja` a` l’ensemble des nœuds
+relais. Les se´lectionner en tant que passerelle n’ajoute aucun e´metteur et donc aucun
+message superflu.
+Cependant, il est clair que si une passerelle est le seul moyen de raccorder un ensemble
+du re´seau a` la source du message diffuse´, cette passerelle devient un point sensible.
+Afin d’ajouter de la robustesse au protocole envers une cassure de liens au niveau des
+passerelles, chaque nœud passerelle e´lit parmi ses voisins une passerelle de secours
+(ou de back-up). Cette dernie`re re´-e´mettra le message diffuse´ si et seulement si elle
+n’entend pas la passerelle principale. Nous reprenons ici la philosophie Wait & See vue
+dans la section 4.2. Dans la suite, nous de´taillons la se´lection des trois types de nœuds :
+miroir, passerelle et passerelle de secours.
+Se´lection des miroirs.
+Comme mentionne´ dans le chapitre 3.8, tout nœud u sait en un temps borne´ s’il existe
+parmi ses voisins un nœud v qui n’appartient pas au même cluster que lui (C(u) ≠
+C(v)) et donc s’il est un nœud frontière. Chaque nœud frontière u doit sélectionner
+son miroir parmi les nœuds de son voisinage appartenant a` un cluster diffe´rent du sien.
+Pour cela, dans un premier temps, u conside`re parmi ces nœuds ceux qui ne sont pas
+des feuilles et qui sont donc des transmetteurs dans tous les cas. u se´lectionne parmi eux
+le nœud de plus forte densite´. Si tous les nœuds conside´re´s sont des feuilles, u choisit
+68 CHAPITRE 4. DIFFUSION
+le nœud de plus faible degre´, de fac¸on a` limiter le nombre de re´ceptions occasionne´es
+lors de l’e´mission du message diffuse´ par le miroir.
+Si u est un nœud frontière du cluster C(v) (C(v) ≠ C(u)), on note m(u, C(v)) le nœud
+miroir choisi par u dans C(v). Si u est voisin de plusieurs clusters diffe´rents du sien,
+il doit e´lire plusieurs miroirs, un dans chacun des clusters voisins. Par exemple, sur la
+figure 4.1, le nœud i doit se choisir deux miroirs, m(i, C(f)) dans C(f) et m(i, C(l))
+dans C(l).
+Algorithm 1 Sélection du nœud miroir - EXÉCUTÉ SUR CHAQUE NŒUD FRONTIÈRE u,
+c.-à-d., ∃v ∈ Γ1(u) s.t. C(v) ≠ C(u)
+Pour chaque cluster voisin C pour lequel u est un nœud frontière : C ≠ C(u) et
+∃v ∈ Γ1(u) ∩ C
+  Sélectionne l’ensemble S des nœuds tels que S = C ∩ {v ∈ Γ1(u) | Ch(v) ≠ ∅}.
+  ⊲ u considère dans un 1er temps l’ensemble des nœuds non feuilles, émetteurs dans tous les cas.
+  if (S ≠ ∅) then
+    Sélectionne l’ensemble S′ des nœuds tels que S′ = {v ∈ S | ρ(v) = max_{w∈S} ρ(w)}.
+    ⊲ u considère les candidats ayant la plus forte valeur de densité dans le but de favoriser la
+    stabilité.
+  else ⊲ Tous les candidats miroirs de u sont des feuilles.
+    S = C ∩ Γ1(u).
+    Sélectionne l’ensemble S′ des nœuds tels que S′ = {v ∈ S | δ(v) = min_{w∈S} δ(w)}.
+    ⊲ u considère les feuilles de plus faible degré afin de minimiser le nombre de réceptions
+    générées lors de l’ajout de cette feuille dans l’ensemble des relais.
+  end
+  if (S′ = {v}) then m(u, C) = v.
+    ⊲ S′ ne contient qu’un nœud : le miroir de u.
+  else m(u, C) = v tel que Id(v) = min_{w∈S′} Id(w).
+    ⊲ Il existe des ex-aequo. u choisit le nœud de plus faible Id.
+  end
+Se´lection des passerelles.
+La seconde e´tape de l’algorithme de se´lection de passerelle e´lit les passerelles reliant
+chaque cluster C a` chacun de ses clusters voisins C′, parmi les paires forme´es par un
+nœud frontie`re et son miroir dans C′. Cette e´tape ne´cessite que des informations concer-
+nant les nœuds frontie`res soient remonte´es a` la racine. Suivant la taxonomie de [81],
+cette e´tape est qualifie´e de quasi-locale car chaque entite´ ne´cessite des informations
+situe´es a` une distance borne´e (ici distance borne´e par la hauteur de l’arbre, elle-meˆme
+borne´e par une constante). La premie`re e´tape de l’algorithme qui permet aux nœuds
+frontie`res de se´lectionner leur miroir ne ne´cessite que des informations locales (de voi-
+sinage) et est qualifie´e de locale. Le fait que ces e´tapes soient locales ou quasi-locales
+sous-entend une maintenance rapide et une robustesse de l’algorithme envers la mobi-
+lite´ des nœuds [81].
+4.4. NOTRE CONTRIBUTION A` LA DIFFUSION 69
+La se´lection des passerelles de notre algorithme est distribue´e puisqu’une se´lection est
+ope´re´e a` chaque niveau de l’arbre. Tout comme la se´lection des miroirs, elle cherche
+a` favoriser l’e´lection des nœuds internes en tant que passerelles de fac¸on a` limiter les
+re´ceptions redondantes lors d’une diffusion d’un message. Les nœuds frontie`res en-
+voient leur Id à leur père en lui indiquant si eux-mêmes et leurs miroirs sont ou non
+des feuilles. Chaque pe`re choisit parmi tous ses fils frontie`res le meilleur candidat dont
+il envoie les informations a` son propre pe`re et ainsi de suite, jusqu’a` atteindre le cluster-
+head. La se´lection est donc semi-distribue´e puisque chaque nœud interne e´limine des
+candidats et n’en renvoie qu’un seul a` son pe`re. De cette fac¸on, seuls des paquets de pe-
+tites tailles sont envoye´s depuis les nœuds frontie`res jusqu’a` la teˆte de cluster. Comme
+mentionne´ en section 3.6.2-table 3.5, le degre´ moyen des nœuds internes est faible et
+constant quel que soit le nombre de nœuds, ce qui induit un nombre borne´ de messages
+a` chaque niveau. De plus, comme la hauteur des arbres est e´galement borne´e par une
+constante, le nombre de niveaux est lui aussi faible.
+De´finition 2 (Sous-arbre) v appartient au sous-arbre de racine u (note´ sT (u)) si
+l’une des trois conditions suivantes est remplie :
+– u = v,
+– u est le pe`re de v : u = P(v),
+– le pe`re de v appartient au sous-arbre de racine u : P(v) ∈ sT (u).
+C(x) est un cluster voisin du sous-arbre sT (u) si et seulement si C(x) ≠ C(u) et il
+existe dans sT (u) un nœud y frontière du cluster C(x) : ∃z ∈ C(x) et y ∈ sT (u) tels
+que y ∈ Γ1(z).
+La passerelle entre deux clusters voisins est alors se´lectionne´e de la fac¸on suivante.
+L’algorithme est exe´cute´ par chaque nœud interne, apre`s re´ception des informations
+concernant tous les nœuds frontie`res de son sous-arbre. Pour chaque cluster voisin de
+son sous-arbre, un nœud interne u considère l’ensemble G des nœuds candidats (nœuds
+frontières) (G = {v ∈ sT (u) | ∃w ∈ Γ1(v) | C(w) ≠ C(u)}). Il sélectionne parmi eux
+le sous-ensemble G′ ⊂ G des nœuds internes. Si G est seulement composé de nœuds
+feuilles (et donc G′ = ∅), la sélection se poursuit parmi les nœuds de G directement.
+Le nœud u prend en priorite´ les nœuds dont le miroir est un nœud interne et il choisit
+parmi eux le nœud de plus forte densite´ si les candidats sont des nœuds internes ou
+de plus faible degre´ sinon. En cas d’e´galite´, le nœud de plus petit identifiant est e´lu.
+On remarque qu’entre deux clusters voisins C(u) et C(v), il existe deux passerelles
+Gateway(C(u), C(v)) et Gateway(C(v), C(u)) qui sont diffe´rentes dans la plupart des
+cas. Du fait de leur orientation et comme un relais ne re-transmet que sur la premie`re
+re´ception du message, dans la plupart des cas, seulement une de ces deux passerelles
+sera utilise´e lors d’une diffusion. Ce phe´nome`ne sera mis en e´vidence par les simula-
+tions de la section 4.5.
+Algorithm 2 Se´lection des passerelles - EXE´CUTE´ PAR CHAQUE NŒUD INTERNE u
+70 CHAPITRE 4. DIFFUSION
+Pour chaque cluster C ≠ C(u) pour lequel ∃v ∈ sT (u) nœud frontière
+  Considère l’ensemble G des candidats : G = {v ∈ sT (u) | ∃w ∈ Γ1(v) | C(w) = C}.
+  Sélectionne l’ensemble G′ ⊂ G des nœuds v tels que G′ = G ∩ {v | Ch(v) ≠ ∅}.
+  ⊲ u considère en priorité les nœuds non feuilles.
+  if (G′ ≠ ∅) then
+    ⊲ u favorise les nœuds internes de plus forte densité ayant un nœud non feuille comme miroir.
+    Sélectionne l’ensemble G″ ⊂ G′ tel que G″ = G′ ∩ {v | Ch(m(v, C)) ≠ ∅}.
+    if (G″ ≠ ∅) then
+      Sélectionne l’ensemble Finalist ⊂ G″ tel que
+      Finalist = {v ∈ G″ | ρ(v) = max_{w∈G″} ρ(w)}.
+      ⊲ Passerelle Nœud Interne↔Nœud Interne.
+    else
+      Sélectionne l’ensemble Finalist ⊂ G′ tel que
+      Finalist = {v ∈ G′ | ρ(v) = max_{w∈G′} ρ(w)}.
+      ⊲ Passerelle Nœud Interne↔Feuille.
+    end
+  else
+    ⊲ Tous les candidats sont des feuilles. u favorise ceux de plus faible degré ayant un nœud interne
+    comme miroir.
+    Sélectionne l’ensemble G″ ⊂ G tel que G″ = G ∩ {v | Ch(m(v, C)) ≠ ∅}.
+    if (G″ ≠ ∅) then
+      Sélectionne Finalist ⊂ G″ tel que Finalist = {v ∈ G″ | δ(v) = min_{w∈G″} δ(w)}.
+      ⊲ Passerelle Feuille↔Nœud Interne.
+    else
+      Sélectionne Finalist ⊂ G tel que Finalist = {v ∈ G | δ(v) = min_{w∈G} δ(w)}.
+      ⊲ Passerelle Feuille↔Feuille.
+    end
+  end
+  if (Finalist = {v}) then
+    Winner = v.
+  else
+    Winner = v tel que Id(v) = min_{w∈Finalist} Id(w).
+    ⊲ Conflits. u choisit le nœud de plus petit Id.
+  end
+  if (u = H(u)) then
+    Winner est le nœud passerelle :
+    Gateway(C(u), C) = 〈Winner, m(Winner, C)〉.
+  else
+    Envoie l’identité de Winner à son père P(u).
+  end
+Se´lection de la passerelle de secours.
+Cette se´lection est purement locale et n’engendre aucun couˆt supple´mentaire. Elle tire
+avantage du caracte`re de diffusion du me´dium radio qui fait que lorsqu’un nœud e´met,
+tous les nœuds a` porte´e radio entendent le message, meˆme s’il ne leur est pas destine´.
+Quand un nœud frontie`re u envoie une information a` son pe`re durant le processus de
+4.4. NOTRE CONTRIBUTION A` LA DIFFUSION 71
+se´lection des passerelles (algorithme 2), chacun de ses voisins apprend la condition de u
+(feuille, nœud interne, nœud frontie`re, etc.). De cette fac¸on, le nœud passerelle apprend
+qui dans son voisinage e´tait e´galement candidat et ainsi peut servir potentiellement de
+passerelle de secours. Il se´lectionne ce nœud en choisissant parmi ses voisins un nœud
+frontie`re dont le miroir est diffe´rent du sien. Cette passerelle de secours agit de la fac¸on
+suivante. Sur re´ception d’un message de diffusion, la passerelle de secours enclenche
+un compte a` rebours. Si a` la fin de celui-ci, elle n’a pas entendu la passerelle principale
+e´mettre, elle e´met le message. Ce me´canisme n’ajoute aucune re´ception redondante et
+ajoute de la robustesse au processus de diffusion.
+4.4.2 L’algorithme de diffusion
+Dans un re´seau sans fil, un nœud peut avoir usage de trois sortes de broadcast :
+– une diffusion de voisinage : envoi d’un message a` tous ses 1-voisins (comme les
+paquets HELLO) ;
+– une diffusion localise´e : diffusion dans un cluster uniquement ;
+– une diffusion globale : diffusion d’un message dans tout le re´seau.
+Les passerelles ne seront utilise´es que dans le cas d’une diffusion globale, afin de re-
+layer le message diffuse´ d’un cluster a` l’autre. Afin de distinguer ces trois types de
+diffusions a` la re´ception d’un message, un nœud ne´cessite une indication dans le pa-
+quet rec¸u1. Quand une diffusion est effectue´e dans un cluster C(u), le message est
+relaye´ par tous les nœuds internes appartenant a` ce cluster. Quand le message doit eˆtre
+propage´ dans tout le re´seau, tous les nœuds internes du re´seau ainsi que les passerelles
+re´-e´mettent le message pour leurs voisins. Les passerelles (principales et de secours)
+e´tant oriente´es, elles ne re´-e´mettent que sous certaines conditions. Le nœud passe-
+relle GW (C(u), C(w)) re-transmet un message seulement s’il arrive de son propre
+cluster C(u). Un nœud passerelle miroir GWm(C(u), C(w)) ne re-transmet le mes-
+sage que s’il arrive du cluster C(u) pour lequel il est miroir. Ainsi, un nœud passe-
+relle miroir GWm(C(u), C(w)) re-transmet un message provenant de C(u) quel que
+soit le nœud qui le lui envoie et qui n’est donc pas ne´cessairement le nœud passe-
+relle GW (C(u), C(w)). Les passerelles de secours agissent comme de´crit dans la sec-
+tion 4.4.1.
+Algorithm 3 Algorithme de diffusion
+Pour tout nœud u, sur réception d’un message M provenant d’un nœud v ∈ Γ1(u)
+⊲ À noter que v est le nœud qui a transmis M à u mais pas forcément la source de la diffusion.
+if (u reçoit M pour la première fois) then
+  if Diffusion générale then
+    if (Ch(u) ≠ ∅) then
+      Ré-émet
+      ⊲ u est un nœud interne.
+    else
+      if ((C(u) = C(v)) et (∃w ∈ V t.q. u = GW (C(u), C(w)))) then
+        ⊲ u est un nœud passerelle et M provient de son propre cluster.
+1Les adresses IPv6 utilisent de´ja` ce ”scope” d’indication d’adresse multicast : local, global.
+72 CHAPITRE 4. DIFFUSION
+        Ré-émet
+      end
+      if ((C(u) ≠ C(v)) et (u = GWm(C(v), C(u)))) then
+        ⊲ M provient d’un cluster pour lequel u est une passerelle miroir.
+        Ré-émet
+      end
+    end
+  else
+    ⊲ Il s’agit d’une diffusion dans un cluster.
+    ⊲ M n’est ré-émis que par les nœuds internes dudit cluster.
+    if ((C(v) = C(u)) et (Ch(u) ≠ ∅)) then Ré-émet end
+  end
+end
+4.5 Analyses et re´sultats de simulations
+Dans un premier temps, nous avons simule´ le processus de se´lection des passerelles
+afin de l’e´valuer. Puis, nous avons simule´ des diffusions globales dans tout le re´seau et
+restreintes a` des clusters uniquement, en utilisant notre algorithme ainsi que d’autres
+protocoles existants afin de comparer les performances de chacun des protocoles de
+diffusion et de valider les re´sultats analytiques obtenus dans la section 4.3.
+4.5.1 E´ lection et utilisation des passerelles
+E´ tant donne´s deux clusters voisins C(u) et C(v), quatre types de passerelles sont pos-
+sibles :
+– Passerelle Feuille↔Feuille : GW (C(u), C(v)) et GWm(C(u), C(v)) sont deux
+nœuds feuilles. Ce type de passerelle est le plus couˆteux puisque son utilisation
+ajoute deux relais dans le processus de diffusion et cause donc plus de re´ceptions
+redondantes.
+– Passerelle Feuille↔Nœud interne : GW (C(u), C(v)) est une feuille et
+GWm(C(u), C(v)) est un nœud interne. Ce type de passerelle n’ajoute qu’un
+seul relais. Comme nous le verrons, c’est le type de passerelle le plus e´lu.
+– Passerelle Nœud Interne↔Feuille : GW (C(u), C(v)) est un nœud interne et
+GWm(C(u), C(v)) est un nœud feuille.
+– Passerelle Nœud Interne↔Nœud Interne : GW (C(u), C(v)) et GWm(C(u), C(v))
+sont deux nœuds internes. Ce type de passerelle est le moins couˆteux puisqu’il
+n’ajoute aucun e´metteur et donc n’engendre aucune re´ception superflue. Bien que
+cela soit le type de passerelle que l’algorithme cherche a` favoriser, il est le moins
+courant.
+La table 4.1 donne le nombre moyen de passerelles qu’un cluster doit e´lire et maintenir
+en moyenne vers ses clusters voisins, ainsi que le nombre de passerelles qui sont effec-
+tivement utilise´es lors de la diffusion d’un message dans tout le re´seau. On remarque
+4.5. ANALYSES ET RE´SULTATS DE SIMULATIONS 73
+500 nœuds 600 nœuds 700 nœuds
+#clusters 11.93 11.64 11.36
+#passerelles e´lues par cluster 5.86 6.02 6.16
+#passerelles utilise´es par cluster 1.76 1.74 1.73
+800 nœuds 900 nœuds 1000 nœuds
+#clusters 11.30 11.14 10.72
+#passerelles e´lues par cluster 6.20 6.22 6.26
+#passerelles utilise´es par cluster 1.76 1.68 1.66
+TAB. 4.1 – Nombre de passerelles e´lues et utilise´es par cluster lors d’une diffusion
+ge´ne´rale initie´e par une source choisie ale´atoirement.
+que le nombre de passerelles a` e´lire est raisonnable et quasiment constant malgre´ l’aug-
+mentation de l’intensite´ des nœuds. Ceci de´montre une bonne caracte´ristique pour l’ex-
+tensibilite´ de notre heuristique. Ne´anmoins, cette proprie´te´ e´tait pre´visible puisque,
+comme constate´ dans le chapitre 3.6.1, le nombre de clusters est constant a` partir d’une
+certaine intensite´ du processus sous-jacent et que les clusters forme´s correspondent
+grossie`rement a` des cellules de Voronoı¨ centre´es sur les cluster-heads. Comme, dans
+un diagramme de Voronoı¨, une cellule a 6 cellules voisines en moyenne, il en est de
+meˆme pour nos clusters et donc pour le nombre de passerelles qu’ils doivent e´lire.
+La figure 4.2(a) donne la proportion de chaque type de passerelles e´lues. On remar-
+quera que les deux types de passerelles qu’on retrouve le moins sont celles de type
+Feuille↔Nœud Interne et Nœud Interne↔Nœud Interne. Cela s’explique par le fait
+que, par construction, la majeure partie des nœuds frontie`res sont des feuilles et donc,
+la majeure partie des miroirs e´galement. Comme l’algorithme de se´lection conside`re
+en priorite´ les nœuds internes pour le nœud passerelle, aussitoˆt qu’un nœud non feuille
+est candidat, il est se´lectionne´. Comme il y a une majorite´ de feuilles sur les frontie`res,
+ce nœud interne a une forte probabilite´ d’avoir une feuille comme miroir. Ceci explique
+la forte proportion des passerelles Nœud Interne↔Feuille et Feuille↔Feuille. Plus le
+re´seau est dense, plus on a de chances de trouver des nœuds internes aux frontie`res.
+C’est pourquoi la proportion de passerelles de type Nœud Interne↔Feuille augmente
+avec le nombre de nœuds alors que la proportion de passerelles Feuille↔Feuille
+de´croıˆt.
+Quand une diffusion ge´ne´rale est effectue´e, toutes les passerelles ne sont pas
+ne´cessairement utilise´es. Si deux clusters voisins C(u) et C(v) sont relie´s par deux pas-
+serelles Gateway(C(u), C(v)) et Gateway(C(v), C(u)), dans la plupart des cas, seule-
+ment une des deux sera utilise´e. Comme le montre la table 4.1, le nombre de passerelles
+utilise´es est quasiment constant et reste faible, toujours compris entre 1 et 2. Cela si-
+gnifie que de fac¸on ge´ne´rale, ou le message diffuse´ pe´ne`tre un cluster et y meurt (dans
+ce cas, il n’utilise qu’une seule passerelle), ou il le traverse et dans ce cas utilise deux
+passerelles (une pour entrer et une pour en sortir). Ce phe´nome`ne s’explique par le fait
+que nous conside´rons une couche MAC ide´ale et que le message se propage a` la meˆme
+vitesse dans toutes les directions. Un message ne va donc pas ”contourner” un cluster
+74 CHAPITRE 4. DIFFUSION
+avant de l’inonder.
+La figure 4.2(b) illustre la proportion de chaque type de passerelle utilise´e lors d’une
+diffusion globale. La majorite´ des passerelles utilise´es sont celles n’ajoutant qu’un seul
+relais dans le processus de diffusions. Cela est vrai meˆme pour des petits nombres de
+nœuds alors que les passerelles Feuille↔Feuille e´taient majoritairement e´lues. Cela
+montre une nouvelle caracte´ristique d’extensibilite´ de notre algorithme de diffusion : il
+favorise l’utilisation des nœuds internes. Ainsi, comme le nombre moyen de passerelles
+utilise´es est faible et que chacune d’elles n’ajoute qu’un relais dans le processus de
+diffusion, le couˆt introduit par ces passerelles est faible.
+0.45 0.6
+0.55
+0.4 Feuille<->Feuille
+Noeud Interne<->Feuille
+Feuille<->Noeud Interne 0.5 Feuille<->Feuille
+Noeud Interne<->Noeud Interne Noeud Interne<->Feuille
+0.35 Feuille<->Noeud Interne0.45 Noeud Interne<->Noeud Interne
+0.3 0.4
+0.35
+0.25
+0.3
+0.2 0.25
+0.15 0.2
+0.15
+0.1
+0.1
+0.05 0.05
+500 550 600 650 700 750 800 850 900 950 1000 500 550 600 650 700 750 800 850 900 950 1000
+Intensite du processus lambda Intensite du processus lambda
+(a) Passerelles se´lectionne´es (b) Passerelles utilise´es
+FIG. 4.2 – Proportion de chaque type de passerelles se´lectionne´es et utilise´es par
+cluster. (+ : Feuille↔Feuille ; × : Nœud Interne↔Feuille ; ∗ : Feuille↔Nœud Interne ;
+□ : Nœud Interne↔Nœud Interne)
+4.5.2 Performances de la diffusion
+De fac¸on a` e´valuer notre algorithme, nous avons choisi de le comparer a` des proto-
+coles de diffusion existants les plus repre´sentatifs (cf. section 4.2) : blind flooding,
+HCC [36] (sche´mas cluster-based), Multi-Point Relais (MPR) [65] (ensemble domi-
+nant de´pendant de la source), le NES de Wu et Li [80] (ensemble dominant inde´pendant
+de la source) et le sche´ma ”Wait & See” de I. Stojmenovic, M. Seddigh et J. Zunic [74]
+(ensemble dominant base´ sur des valeurs ale´atoires). Comme mentionne´ lors des ana-
+lyses théoriques de la section 4.3, nous cherchons à comparer ces algorithmes en termes
+d’e´conomie d’e´nergie (nombre de messages envoye´s et rec¸us par nœud) et de bande
+passante (nombre de messages envoye´s au total), en cherchant a` calculer l’impact du
+degre´ des nœuds relais sur ces performances. C’est pourquoi nous avons releve´ la pro-
+portion des nœuds qui re´-e´mettent le message diffuse´, le degre´ de ces nœuds relais ainsi
+que l’impact de ces valeurs sur le nombre de copies redondantes d’un meˆme message
+rec¸ues par nœud.
+Dans la meˆme optique, nous avons simule´ deux variantes du protocole NES de Wu et
+Li : la version originale [80] ou` la valeur de priorite´ utilise´e par les nœuds est l’identi-
+Proportion de chaque type de passerelles elues
+Proportion de chaque type de passerelles utilisees
+4.5. ANALYSES ET RE´SULTATS DE SIMULATIONS 75
+fiant des nœuds, et une version ou` la valeur de priorite´ est le degre´ des nœuds (plus l’Id
+pour re´soudre les conflits) [26].
+Nous avons e´galement mesure´ la latence2, excepte´ pour le protocole NES-”Wait &
+See” ou` la latence de´pend de la taille de la feneˆtre dans laquelle les nœuds tirent un
+temps d’attente ale´atoire.
+A priori, un grand nombre de nœuds e´metteurs et de re´ceptions multiples ajoute de
+la redondance au protocole et le rend the´oriquement plus re´sistant face a` la mobilite´
+des nœuds et aux cassures de lien. C’est pourquoi, nous nous sommes inte´resse´s a`
+l’impact du nombre de re´ceptions redondantes et du degre´ des relais sur la robustesse
+des diffe´rents protocoles de diffusion.
+Diffusion d’un message dans tout le re´seau (diffusion ge´ne´rale)
+Nous analysons ici une diffusion d’un message dans tout le re´seau, initie´e par une
+source choisie ale´atoirement parmi les nœuds du re´seau.
+36 1
+34 Blind Flooding
+HCC 0.9
+MPR
+32 NES-’Wu et Li’
+NES-’Wu et Li, degre’ 0.8
+NES-’Wait&See’
+30 Arbres de densite Blind Flooding
+HCC
+0.7 MPR
+28 NES-’Wu et Li’
+NES-’Wu et Li, degre’
+26 0.6 NES-’Wait&See’Arbres de densite
+24 0.5
+22
+0.4
+20
+0.3
+18
+16 0.2
+14 0.1
+500 550 600 650 700 750 800 850 900 950 1000 500 550 600 650 700 750 800 850 900 950 1000
+Intensite du processus lambda Intensite du processus lambda
+(a) Degre´ des e´metteurs (b) Proportion d’e´metteurs
+FIG. 4.3 – Degre´ (a) et proportion (b) des e´metteurs en fonction des diffe´rents algo-
+rithmes de diffusion et du nombre de nœuds.(+ : Blind Flooding ; × : HCC ; ∗ : MPR ;
+2 : NES - Wu Li ; NES - Degre´ - Wu Li ; ⊖ NES - Wait & See ; • Arbres de densite´)
+La figure 4.3 montre le degre´ dans le graphe des nœuds relais ainsi que leur proportion
+dans le re´seau pour les diffe´rents algorithmes de diffusion conside´re´s.
+La figure 4.3(a) montre le degre´ des relais. Comme dans le Blind Flooding, tous les
+nœuds relaient le message, le degre´ moyen des relais correspond exactement au degre´
+moyen des nœuds dans le graphe. Nous pouvons voir que notre algorithme maximise
+le degre´ moyen des relais. En effet, notre algorithme e´lit les relais sur leur valeur de
+densite´ qui est quasiment proportionnelle a` leur degre´. La version originale du NES
+de Wu et Li et le NES-”Wait & See” e´lisent des relais de meˆme degre´, infe´rieur au
+degre´ moyen. Ceci est duˆ au fait que plus un nœud a de voisins, plus il a de chances
+2Temps au bout duquel tous les nœuds du re´seau ont rec¸u le message de diffusion.
+Degre des relais
+Proportion d’emetteurs
+76 CHAPITRE 4. DIFFUSION
+soit d’entendre l’un d’eux e´mettre avant la fin de son temps d’attente (dans le cas du
+protocole ”Wait & See”) soit d’avoir e´te´ ”e´limine´” par les re`gles de se´lection de l’algo-
+rithme de Wu et Li. On remarque e´galement que les courbes repre´sentant les degre´s des
+MPR et des relais dans le Blind Flooding sont confondues. Ceci montre que les relais
+utilise´s lors d’une diffusion avec les MPR sont choisis inde´pendamment de leur degre´.
+Les protocoles HCC et le NES-degré de Wu et Li choisissent des relais de fort degré par
+construction, ce qui se retrouve dans les re´sultats.
+La figure 4.3(b) montre la proportion de relais dans le re´seau. Comme dans le blind
+flooding, tous les nœuds re-transmettent le message, cette proportion est e´gale a` 1. On
+observe que le protocole ”Wait & See” est l’heuristique ne´cessitant le moins de relais,
+ce qui implique que cette heuristique de´pense moins d’e´nergie en e´mission. Notre heu-
+ristique obtient des re´sultats proches. On remarquera e´galement que les deux variantes
+du protocole NES de Wu et Li ge´ne`rent approximativement le meˆme nombre de relais.
+Cependant, comme vu lors des analyses the´oriques, le nombre de re´ceptions par nœud
+ne peut eˆtre directement de´duit des re´sultats du degre´ des relais ou directement de la
+proportion d’e´metteurs puisqu’il est en fait le produit des deux. Comme certaines des
+heuristiques produisant le moins de relais sont e´galement celles dont les relais ont les
+plus forts degre´s, nous ne pouvons en de´duire laquelle minimise le plus le nombre de
+re´ceptions. Nous pouvons juste supposer que la variante du protocole NES utilisant
+l’identifiant des nœuds induira moins de re´ceptions que la variante utilisant le degre´
+des nœuds puisque pour un nombre e´quivalent de re´-e´metteurs, le degre´ de ses relais
+est plus faible. La figure 4.4 montre le nombre de re´ceptions par nœud d’un message
+diffuse´ dans tout le re´seau.
+35
+Blind Flooding
+HCC
+MPR
+NES-’Wu et Li’
+30 NES-’Wu et Li, degre’
+NES-’Wait&See’
+Arbres de densite
+25
+20
+15
+10
+5
+500 550 600 650 700 750 800 850 900 950 1000
+Intensite du processus lambda
+FIG. 4.4 – Nombre de re´ceptions par nœud en fonction du nombre de nœuds et des
+diffe´rents algorithmes de diffusion.(+ : Blind Flooding ; × : HCC ; ∗ : MPR ; 2 : NES
+- Wu Li ; NES - Degre´ Wu Li ; ⊖ NES - Wait & See ; • Densite´)
+Ainsi, lorsqu’un message est diffusé à tous les nœuds du réseau, l’algorithme NES-
+”Wait & See” est celui induisant le moins de re´ceptions redondantes sur les nœuds,
+de´pensant ainsi moins d’e´nergie et de ressources. On remarque que notre algorithme
+obtient des re´sultats tre`s proches puisqu’il ne ge´ne`re qu’une re´ception de plus en
+moyenne par nœud que ”Wait & See”. De plus, le ”Wait & See” e´tant base´ sur des
+valeurs ale´atoires, la latence qu’il introduit est ine´vitablement supe´rieure a` celle intro-
+Nombre de receptions par noeud
+4.5. ANALYSES ET RE´SULTATS DE SIMULATIONS 77
+duite par notre protocole. On remarque e´galement que la version originale du NES de
+Wu et Li cause moins de re´ceptions que sa variante base´e sur le degre´ des nœuds.
+Latence : Puisque dans l’algorithme de se´lection des MPR, les relais sont choisis de
+fac¸on a` ce que le 2-voisinage d’un nœud soit atteint en 2 sauts, le k-voisinage de la
+source est atteint en k sauts. Sous l’hypothe`se d’une couche MAC ide´ale, les MPR
+donnent des re´sultats optimaux en terme de latence (ici e´quivalente aux nombres de
+sauts). C’est pourquoi nous avons compare´ la latence produite par notre heuristique
+a` celle produite par les MPR afin de mesurer l’e´cart entre notre solution et l’optimal.
+Nous conside´rons une unite´ de temps comme une e´tape de transmission (c.a`.d. 1 saut).
+Les re´sultats sont pre´sente´s dans la table 4.2. Meˆme si notre algorithme n’est pas op-
+timal en terme de latence, il ne s’en e´loigne gue`re (2 sauts au plus). La figure 4.5
+repre´sente la propagation temporelle d’une diffusion ge´ne´rale d’un message, initie´e
+au temps 0 par une source centrale (en vert sur les sche´mas). Les cluster-heads ap-
+paraissent en bleu. La couleur des autres nœuds de´pend du temps au bout duquel ils
+rec¸oivent le message. Plus la couleur est claire, plus le temps est long.
+(a) Propagation avec MPR (b) Propagation avec les arbres de
+densite´
+FIG. 4.5 – Temps de propagation d’un message diffuse´ dans tout le re´seau par une
+source centrale en utilisant les MPR (a) et notre me´trique (b).
+500 nœuds 700 nœuds 800 nœuds 900 nœuds 1000 nœuds
+MOY MAX MOY MAX MOY MAX MOY MAX MOY MAX
+MPR 5.13 8.97 4.88 8.40 4.88 8.40 4.81 8.23 4.78 8.07
+Densite´ 6.31 11.05 6.22 10.78 6.24 10.95 6.15 10.66 6.19 10.74
+TAB. 4.2 – Temps max et moyen pour recevoir le message. Les valeurs ”MAX” donnent
+le temps au bout duquel tous les nœuds du re´seau ont rec¸u le message. Les valeurs
+”MOY” donnent le temps moyen au bout duquel un nœud rec¸oit le message.
+78 CHAPITRE 4. DIFFUSION
+Diffusion dans un cluster.
+On suppose maintenant qu’une diffusion est initie´e dans chaque cluster, par chaque
+cluster-head. Nous avons donc autant de diffusions simultane´es que de clusters. Un
+nœud applique le protocole de diffusion (quel qu’il soit) en ne conside´rant que les
+nœuds appartenant au meˆme cluster que lui.
+1 35
+Blind Flooding
+Blind Flooding MPR
+MPR NES-’Wu&Li’
+0.9 NES-’Wu&Li’ NES-’Wu&Li-degre’
+NES-’Wu&Li-degre’ 30 NES-’Wait&See’NES-’Wait&See’ Arbres de densite
+Arbres de densite
+0.8
+25
+0.7
+0.6 20
+0.5
+15
+0.4
+10
+0.3
+0.2 5
+500 550 600 650 700 750 800 850 900 950 1000 500 550 600 650 700 750 800 850 900 950 1000
+Intensite du processus lambda Intensite du processus lambda
+(a) Proportion d’e´metteurs (b) Nombre de re´ceptions
+FIG. 4.6 – Proportion d’émetteurs (a) et nombre moyen de réceptions par nœud (b)
+pour une diffusion dans un cluster en fonction de l’intensite´ du processus et du proto-
+cole utilise´.(+ : Blind Flooding ; × : MPR ; ∗ : NES - Wu Li ; 2 : NES - Degre´ Wu Li ;
+NES - Wait & See ; ⊖ Densite´ ).
+On remarque sur la figure 4.6, que pour ce type de diffusion, notre algorithme est
+celui qui minimise le plus le nombre de relais et de re´ceptions, obtenant meˆme des
+performances e´gales ou supe´rieures a` celles du protocole NES ”Wait & See”.
+Ces re´sultats confirment e´galement les re´sultats analytiques montrant que le nombre de
+re´ceptions ne peut eˆtre de´duit directement de la proportion d’e´metteurs. Par exemple,
+notre algorithme utilise moins de relais avec de plus forts degre´s que le ”Wait & See”
+pour finalement induire autant de re´ceptions par nœud.
+La table 4.3 et la figure 4.7 représentent les résultats concernant la latence induite dans
+une telle diffusion par notre heuristique. Comme pour une diffusion générale, la latence
+obtenue est très proche de l’optimale, s’en éloignant seulement d’une demi-unité de
+temps pour le temps moyen. Cela montre également que, même si les routes dans les
+arbres, du cluster-head vers les autres nœuds du cluster ne sont pas toujours les plus
+courtes, elles en sont tre`s proches.
+Remarque 3 A` l’exception de notre algorithme, base´ sur la densite´, une diffusion dans
+un cluster est e´quivalente a` une diffusion dans un environnement fini pour les autres
+algorithmes de diffusion, contrairement a` une diffusion ge´ne´rale qui correspond a` une
+diffusion dans un environnement non borne´. On remarquera que tous les protocoles
+sont plus robustes dans des environnements infinis.
+Proportion de noeuds emetteurs
+Nombre de receptions par noeud
+4.5. ANALYSES ET RE´SULTATS DE SIMULATIONS 79
+500 nœuds 700 nœuds 800 nœuds 900 nœuds 1000 nœuds
+MOY MAX MOY MAX MOY MAX MOY MAX MOY MAX
+MPR 1.76 4.71 1.78 4.85 1.81 4.83 1.81 4.80 1.82 5.00
+Densite´ 1.80 5.08 1.83 5.38 1.87 5.29 1.87 5.50 1.88 5.30
+TAB. 4.3 – Temps max et moyen pour recevoir le message dans un cluster. Les valeurs
+”MAX” donnent le temps au bout duquel tous les nœuds du re´seau ont rec¸u le message.
+Les valeurs ”MOY” donnent le temps moyen au bout duquel un nœud rec¸oit le message.
+(a) Clusters (b) Propagation avec MPR (c) Propagation avec les arbres
+de densite´
+FIG. 4.7 – Temps de propagation d’un message diffuse´ dans chacun des clusters
+repre´sente´s sur (a), en utilisant les MPR (b) et notre me´trique (c).
+4.5.3 Robustesse de la diffusion
+Apre`s avoir conside´re´ tous ces re´sultats, nous nous sommes interroge´s sur la robus-
+tesse de ces protocoles (toujours en conside´rant la couche re´seau uniquement) envers
+la cassure de liens. En effet, jusqu’a` maintenant, nous n’avons compare´ les diffe´rents
+protocoles qu’en terme d’e´nergie e´pargne´e en limitant les re´ceptions redondantes et le
+nombre de re´-e´metteurs. Cependant, la redondance apporte de la robustesse au proces-
+sus de diffusion. Il est donc le´gitime de se demander si une limitation de la redondance
+dans un environnement aux liens radios sensibles est bien une bonne approche ou si
+la redondance en terme de nombre de re´ceptions a re´ellement un impact sur la robus-
+tesse ? Nous nous sommes aussi interroge´s sur l’impact du degre´ des relais sur cette
+robustesse : pour une redondance de messages e´quivalente, est-il pre´fe´rable d’avoir
+peu de relais avec un fort degre´ ou un plus grand nombre de relais avec un plus petit
+degre´ ?
+Afin d’e´valuer cet aspect de la diffusion et de re´pondre a` ces diverses interrogations,
+nous avons applique´ une probabilite´ de cassure sur les liens et mesure´ la proportion
+de nœuds qui rec¸oivent encore le message diffuse´. Les simulations que nous avons
+faites supposent que le message se propage avant qu’aucune information de routage ne
+soit recalcule´e par les nœuds comme par exemple l’ensemble des MPR (pour l’heuris-
+tique des MPR), l’ensemble des voisins a` e´liminer (pour les sche´mas NES) ou le pe`re
+dans l’arbre de clustering (pour l’algorithme base´ sur la densite´). Comme dans le blind
+80 CHAPITRE 4. DIFFUSION
+flooding, tous les nœuds retransmettent le message, si des nœuds ne rec¸oivent pas le
+message, cela implique que le re´seau n’est plus connexe.
+La figure 4.8 donne la proportion des nœuds touche´s par la diffusion quand on applique
+une probabilite´ de cassure sur les liens pour les deux types de diffusion (ge´ne´rale et
+dans un cluster) et λ = 1000. Globalement, le comportement des diffe´rentes heuris-
+tiques est le meˆme pour les deux types de diffusion, excepte´ pour notre algorithme. Par
+exemple, le NES-”Wait & See” qui e´tait le meilleur protocole en terme de re´ceptions
+et d’e´metteurs est le protocole le moins robuste, quel que soit le type de diffusion.
+La figure 4.8(a) présente les résultats pour une diffusion dans un cluster. Étonnamment,
+il ne semble pas que le nombre de re´ceptions redondantes et la robustesse du protocole
+soient lie´s. Par exemple, l’algorithme base´ sur les arbres de densite´ est l’un de ceux
+induisant le moins de re´ceptions redondantes et pourtant l’un des plus robustes.
+Il semble que les protocoles dont les relais ont un fort degre´ tendent a` eˆtre plus ro-
+bustes. En effet, des protocoles avec des relais a` fort degre´ (NES-degre´ et Densite´) sont
+tre`s robustes alors que ceux avec des relais a` plus faible degre´ comme les MPR ou
+le NES-”Wait & See” pre´sentent les pires comportements. Le NES-Wu&Li est moins
+robuste que sa variante NES-degre´ (qui augmente le degre´ des relais). La redondance
+en terme de nombre de re´ceptions multiples est donc tre`s couˆteuse en terme d’e´nergie
+consomme´e et de bande passante utilise´e, sans pour autant apporter plus de robustesse
+au processus de diffusion.
+Notre heuristique pre´sente une bonne robustesse envers les cassures de liens lors d’une
+diffusion dans un cluster. Comme elle minimise e´galement a` la fois le nombre de re-
+lais et le nombre de re´ceptions par nœud, elle constitue le meilleur compromis couˆt-
+robustesse-latence.
+1 1
+0.9 0.9
+0.8 0.8
+0.7 0.7
+0.6 0.6
+0.5 0.5
+0.4 0.4
+0.3 Blind Flooding 0.3 Blind Flooding
+MPR MPR
+NES-’Wu&Li’ NES-’Wu&Li’
+0.2 NES-’Wu&Li-degre’ 0.2 NES-’Wu&Li-degre’
+NES-’Wait&See’ NES-’Wait&See’
+Arbre de densite Arbres de densite
+0.1 0.1
+0 0
+0 0.2 0.4 0.6 0.8 1 0 0.2 0.4 0.6 0.8 1
+Probabilite de cassure de liens Probabilite de cassure de liens
+(a) Cassure de liens - diffusion dans un cluster (b) Cassure de liens - diffusion globale
+FIG. 4.8 – Proportion de nœuds recevant toujours le message de diffusion apre`s appli-
+cation d’une probabilite´ de cassure sur les liens lors d’une diffusion dans un cluster (a)
+ou dans tout le re´seau (b).
+Cependant, comme le montre la figure 4.8(b), notre algorithme est bien moins robuste
+lorsqu’il s’agit d’une diffusion globale. Il reste plus robuste que le NES-”Wait & See”
+Proportion de noeuds recevant le message
+Proportion de noeuds recevant le message
+4.5. ANALYSES ET RE´SULTATS DE SIMULATIONS 81
+mais bien moins que le protocole NES de Wu et Li. Ce re´sultat, couple´ au fait que
+notre heuristique est tre`s robuste lorsque le message est propage´ dans un cluster seule-
+ment, montre que les liens sensibles dans une diffusion ge´ne´rale sont les passerelles.
+En effet, si un cluster A ne peut eˆtre atteint que par le cluster B et que les nœuds de la
+passerelle de B vers A tombent, l’ensemble du cluster A est alors isole´ de la diffusion.
+Afin d’ajouter de la robustesse a` ce niveau, il est donc souhaitable d’e´lire plusieurs
+passerelles entre deux clusters voisins. Élire plus d’une passerelle n’ajoute aucun coût
+lors de la phase d’e´lection (aucun message supple´mentaire n’est utile) mais l’utilisation
+de passerelles supple´mentaires engendre plus d’e´metteurs et de re´ceptions redondantes
+lors de la propagation d’un message. Il y a donc un compromis a` faire entre le nombre
+de passerelles a` e´lire et le couˆt de leur utilisation. De fac¸on a` estimer ce compromis,
+nous avons simule´ une diffusion d’un message dans le re´seau en augmentant le nombre
+de passerelles utilise´es. Les re´sultats sont donne´s par la figure 4.9. L’ajout de passe-
+relles apporte vite de la robustesse au protocole, ce qui confirme le fait qu’il s’agissait
+bien des liens sensibles. Comme le montre la figure 4.9(a), e´lire trois passerelles entre
+chaque paire de clusters voisins permet d’obtenir la meˆme robustesse que pour le pro-
+tocole NES de Wu et Li, sans pour autant produire plus de re´ceptions et d’e´metteurs
+que ces heuristiques (figures 4.9(b) et 4.9(c)).
+1 1
+Blind Flooding
+0.9 MPR0.9 NES-’Wu et Li’
+NES-’Wait&See’
+0.8 Arbres de densite-1 passerelle0.8 Arbres de densite-2 passerellesArbres de densite-3 passerelles
+Arbres de densite-4 passerelles
+0.7
+0.7
+0.6
+0.6
+0.5
+0.5
+0.4 Blind Flooding
+MPR
+NES-’Wu&Li’ 0.4
+0.3 NES-’Wait&See’
+Arbres de densite-1 passerelle
+arbres de densite-2 passerelles 0.3
+0.2 Arbres de densite-3 passerellesArbres de densite-4 passerelles
+0.2
+0.1
+0 0.1
+0 0.2 0.4 0.6 0.8 1 500 550 600 650 700 750 800 850 900 950 1000
+Probabilite de cassure de liens Intensite du processus lambda
+(a) Robustesse (b) Proportion d’e´metteurs
+14
+Blind Flooding
+MPR
+NES-’Wu et Li’
+NES-’Wait&See’
+12 Arbres de densite-1 passerelleArbres de densite-2 passerelles
+Arbres de densite-3 passerelles
+Arbres de densite-4 passerelles
+10
++ Blind Flooding
+8 × MPR
+∗ NES - Wu Li
+6 2 NES - Wait & See
+Densite´ - 1 passerelle
+4 ⊖ Densite´ 2 passerelles
+500 550 600 650 700 750 800 850 900 950 1000 • Densite´ 3 passerelles
+Intensite du processus lambda △ Densite´ 4 passerelles
+(c) Re´ceptions par nœud (d) Le´gende
+FIG. 4.9 – Robustesse envers les cassures de liens (a), Proportion d’e´metteurs (b) et
+nombre de re´ceptions par nœud (c).
+Proportion de noeuds recevant le message
+Nombre de receptions par noeud
+Proportion d’emetteurs
+82 CHAPITRE 4. DIFFUSION
+4.6 Analyse de la se´lection des MPR dans OLSR
+Comme nous l’avons de´ja` vu, OLSR est un protocole de routage pro-actif pour les
+re´seaux ad hoc, re´cemment standardise´ a` l’IETF. Il utilise le concept des Multi-Points
+Relais (MPR) pour minimiser le trafic de controˆle et calculer les plus courts chemins
+entre toute paire de nœuds. Chaque nœud du re´seau choisit ses MPR dans son voisinage
+a` un saut. Lorsqu’un nœud u rec¸oit un message M d’un voisin v, il ne le re-transmet
+que si c’est la premie`re fois qu’il rec¸oit M et si v a de´signe´ u comme e´tant un de ses
+MPR. La se´lection des MPR consiste pour un nœud u a` choisir un ensemble minimal
+de nœuds parmi ses voisins de telle fac¸on que l’ensemble des 2-voisins de u soit ainsi
+couvert (c.a`.d. que chaque 2-voisin de u rec¸oit une transmission d’au moins un MPR
+de u). De cette fac¸on, meˆme si u ne conside`re que les MPR dans son voisinage, il peut
+joindre tous ses 2-voisins en 2 sauts, et par extension son k-voisinage en k sauts.
+Ce protocole est tre`s ce´le`bre et pourtant, il est loin d’obtenir les meilleurs re´sultats.
+Nous nous sommes alors penche´s sur la se´lection des MPR afin de l’analyser plus en
+de´tail et de comprendre pourquoi.
+4.6.1 La se´lection des MPR
+Comme la se´lection optimale d’un ensemble minimum de MPR est un proble`me NP-
+complet [40], nous donnons ici l’heuristique gloutonne de se´lection des MPR qui est
+celle actuellement utilise´e dans l’imple´mentation d’OLSR.
+Pour un nœud $v \in \Gamma(u)$, nous notons $d^+_u(v)$ le nombre de nœuds que u peut atteindre
+en deux sauts via v :
+$$d^+_u(v) = |\Gamma_2(u) \cap \Gamma(v)|$$
+Pour un nœud $v \in \Gamma_2(u)$, soit $d^-_u(v)$ le nombre de nœuds dans le voisinage de u qui
+permettent de connecter u et v en deux sauts :
+$$d^-_u(v) = |\Gamma(u) \cap \Gamma(v)|$$
+Le nœud u sélectionne dans Γ(u) un ensemble de nœuds couvrant intégralement Γ2(u).
+Cet ensemble est l’ensemble des MPR de u. Nous le notons MPR(u). Chaque nœud a
+donc son propre ensemble de MPR qui est diffe´rent d’un nœud a` l’autre. Par de´finition,
+MPR(u) est tel que :
+$$u \cup \Gamma_2(u) \subset
+\bigcup_{v \in MPR(u)} \Gamma(v)$$
+Conside´rant un nœud u, nous appelons ”nœud isole´” pour u, tout nœud v ∈ Γ2(u) pour
+lequel il n’existe qu’un chemin a` deux sauts de u a` v. En d’autres termes, un nœud v
+est dit isole´ pour u si d−u (v) = 1.
+L’algorithme de se´lection des MPR est exe´cute´ sur chaque nœud et suppose que chaque
+nœud connaıˆt ses voisins a` 1 et 2 sauts. Il se de´compose en deux e´tapes. Nous notons
+4.6. ANALYSE DE LA SE´LECTION DES MPR DANS OLSR 83
+MPR1 l’ensemble des nœuds MPR se´lectionne´s lors de la premie`re e´tape de l’algo-
+rithme. Les MPR1 permettent de couvrir les nœuds isole´s. L’algorithme de se´lection
+des MPR est le suivant.
+Algorithm 4 Algorithme glouton de sélection des MPR - Exécuté sur chaque nœud.
+$\Gamma'(u) = \Gamma(u)$ et $\Gamma'_2(u) = \Gamma_2(u)$.
+⊲ Première étape
+Pour tout nœud $v \in \Gamma(u)$
+if ($\exists w \in \Gamma(v) \cap \Gamma_2(u) \mid d^-_u(w) = 1$) then
+Sélectionne v comme MPR(u).
+⊲ Sélectionne comme MPR(u), les nœuds de Γ(u) couvrant les nœuds ”isolés”.
+Retire v de $\Gamma'(u)$ et retire $\Gamma(v) \cap \Gamma_2(u)$ de $\Gamma'_2(u)$.
+end
+⊲ Seconde étape
+while ($\Gamma'_2(u) \neq \emptyset$)
+Pour tout nœud $v \in \Gamma'(u)$
+if ($d^+_u(v) = \max_{w \in \Gamma'(u)} d^+_u(w)$) then
+Sélectionne v comme MPR(u).
+⊲ Sélectionne comme MPR(u) le nœud v permettant de rattacher le plus de nœuds de
+$\Gamma_2(u)$ à u en deux sauts.
+Retire v de $\Gamma'(u)$ et retire $\Gamma(v) \cap \Gamma_2(u)$ de $\Gamma'_2(u)$.
+end
+Afin de mieux comprendre cet algorithme, exe´cutons-le sur le nœud u en vert sur
+l’exemple de la figure 4.10. Les nœuds isole´s apparaissent en rouge, hachure´s hori-
+zontalement. Par exemple, le nœud t est un nœud isole´ pour u car le nœud h est le
+seul de ses voisins dans Γ(u). Le nœud h sera donc e´lu lors de la premie`re e´tape de
+l’algorithme : h ∈MPR1. De la meˆme fac¸on, u e´lira les nœuds bleus, hachure´s verti-
+calement h, i, c, g comme MPR1. Les nœuds k, j, t, s, r, q, o,m, l de Γ2(u) sont ainsi
+couverts. Le nœud u passe alors a` la seconde e´tape de l’algorithme et ne conside`re dans
+Γ2(u) que les nœuds non encore couverts (p et n) et dans Γ1 les nœuds non MPR1
+(b, f , e et d). Il ne garde donc qu’une vue re´duite de la topologie comme illustre´ sur
+la figure 4.10(b). Il se´lectionne alors son voisin de plus fort degre´ dans ce graphe.
+Comme le nœud e couvre n et p alors que f et d ne couvrent chacun qu’un nœud
+de Γ2(u) (resp. p et n), c’est e qui est e´lu. A partir de la`, tous les nœuds de Γ2(u)
+sont couverts par les nœuds se´lectionne´s comme MPR, l’algorithme s’arreˆte. On a :
+MPR(u) = {c, e, i, h, g}.
+Plusieurs algorithmes [8, 41, 53] ont e´te´ propose´s afin d’ame´liorer cet algorithme
+et re´duire le nombre de MPR se´lectionne´s. Cependant, aucun d’eux ne re´duit
+conside´rablement le nombre de MPR. Comme on peut le constater, la premie`re e´tape
+de l’algorithme glouton ne peut eˆtre supprime´e, quel que soit l’algorithme de se´lection,
+puisqu’elle seule permet de couvrir tous les nœuds isole´s. De plus, si on veut minimi-
+ser le nombre de MPR, cette e´tape doit eˆtre exe´cute´e en premier lieu. C’est pourquoi,
+toutes les variantes de cet algorithme ne portent en fait que sur la deuxie`me e´tape, ce
+qui laisse in fine une faible marge de manœuvre, comme nous allons le montrer.
+84 CHAPITRE 4. DIFFUSION
+  
+  
+  
+ l  b
+  
+  
+  
+  
+ k 
+  
+  
+ m 
+b   
+  
+ j               c
+  
+   i         
+      n
+n u d
+  
+t         u
+   d
+     
+   h
+     
+o
+      e e
+s    g  
+      f f
+p
+  
+ q 
+  
+   p
+ r    
+  
+  
+(a) Topologie globale - Les nœuds isole´s de u ap- (b) Topologie conside´re´e par u a` la fin
+paraissent en rouge et hachure´s horizontalement, les de la premie`re e´tape
+MPR1 de u apparaissent en bleu et hachure´s verti-
+calement.
+FIG. 4.10 – Illustration de l’algorithme de se´lection des MPR.
+4.6.2 Analyse
+Nous nous sommes inte´resse´s aux proprie´te´s d’un ensemble MPR se´lectionne´ par un
+nœud donne´. C’est pourquoi, dans notre analyse, nous ne conside´rons pas l’ensemble
+du re´seau mais un point particulier, ainsi que son voisinage a` 1 et 2 sauts. En effet,
+l’algorithme de se´lection de MPR est distribue´ et exe´cute´ inde´pendamment par chaque
+nœud a` partir de sa connaissance de son voisinage a` 1 et 2 sauts.
+Soit B(x,R) la boule de rayon R centrée en x. Nous distribuons un processus ponctuel
+de Poisson d’intensite´ λ > 0 dans B(0, 2R) et ajoutons un point 0 au centre de la
+boule. Le voisinage de 0 est donc, par de´finition, l’ensemble des points du processus
+se trouvant dans B(0, R)\0. C’est pour ce point 0 que nous e´tudions l’algorithme de
+se´lection des MPR.
+Re´sultats ge´ne´raux.
+Avant de donner les re´sultats concernant l’e´tude des MPR, nous donnons des re´sultats
+plus ge´ne´raux qui nous serviront pour les calculs suivants.
+Soit A(r) l’aire de l’intersection de deux boules de rayon R dont les centres sont dis-
+tants de r (figure 4.11(a)) :
+$$
+A(r) = 2R^2 \arccos\left(\frac{r}{2R}\right) - r\sqrt{R^2 - \frac{r^2}{4}}
+$$
+et A1(u, r, R) l’aire de l’union de deux disques de rayons respectifs R et u et dont les
+centres sont distants de r (figure 4.11(b)) :
+$$
+A_1(u, r, R) =
+rR\sqrt{1 - \left(\frac{R^2 - u^2 + r^2}{2Rr}\right)^2}
+- R^2 \arccos\left(\frac{u^2 - R^2 - r^2}{2Rr}\right)
+- u^2 \arccos\left(\frac{R^2 - u^2 - r^2}{2ur}\right)
+$$
+4.6. ANALYSE DE LA SE´LECTION DES MPR DANS OLSR 85
+                         
+                         
+ 
+                         
+                         
+                         
+                         
+                         
+R u RR                          
+                         
+                         
+                         
+                         
+                         
+                         
+                         
+                         
+r r
+(a) A(r) est l’aire en bleu : aire (b) A1(u, r, R) est l’aire hachure´e :
+de l’intersection de deux boules de union des aires de deux disques de rayons
+rayon R. R et u.
+FIG. 4.11 – Illustration des aires A(r) et A1(u, r, R).
+Nous sommes alors en mesure d’évaluer les valeurs moyennes de $d^+_0$, $d^-_0$, |Γ(0)| et
+|Γ2(0)| pour une distribution poissonnienne.
+Proposition 4 Soit u ∈ Γ(0) un point uniforme´ment distribue´ dans B(0, R).
+La valeur moyenne de d+0 (u) est donne´e par :
+$$E\left[d^+_0(u)\right] = \frac{\lambda}{\pi R^2} \int_0^{2\pi} \int_0^R \left(\pi R^2 - A(r)\right) r\,dr\,d\theta = \lambda R^2 \frac{3\sqrt{3}}{4}$$
+Pour obtenir la valeur moyenne de d+0 (u), l’ide´e est de compter le nombre moyen de
+points se trouvant dans l’aire de l’intersection de B(u,R) (1-voisinage de u) et de
+B(0, 2R)\B(0, R) (2-voisinage de 0) et de sommer pour tout point u ∈ Γ(0).
+Soit v ∈ Γ2(0) un point uniforme´ment distribue´ dans B(0, 2R)\B(0, R). La valeur
+moyenne de d−0 (v) est donne´e par :
+$$
+E\left[d^-_0(v)\right] = \frac{2\lambda}{3R^2} \int_R^{2R} A(r)\, r\,dr = \lambda R^2 \frac{\sqrt{3}}{4}
+$$
+Pour obtenir la valeur moyenne de d−0 (v), on compte le nombre de points se trou-
+vant dans l’intersection de B(v,R) (1-voisins de v) et de B(0, R) (1-voisins de 0)
+et on somme pour tout point v ∈ Γ2(0). On remarquera que v peut se trouver dans
+B(0, 2R)\B(0, R) sans pour autant eˆtre un 2-voisin de 0 dans le cas ou` 0 et v n’ont
+aucun voisin commun (si Γ(v) ∩ Γ(0) = ∅). Ainsi, pour obtenir le nombre moyen de
+2-voisins de 0, nous devons conditionner le nombre de points v dans B(R, 2R) par la
+probabilité que v soit un 2-voisin de 0, c.à.d. par la probabilité que {Γ(v) ∩ Γ(0) ≠ ∅}.
+Nous obtenons :
+$$
+E\left[d^-_0(v) \mid v \in \Gamma_2(0)\right] =
+\frac{E\left[d^-_0(v)\right]}{P\left(d^-_0(v) > 0\right)}
+$$
+86 CHAPITRE 4. DIFFUSION
+où
+$$P\left(d^-_0(v) > 0\right) = 1 - \frac{2}{3R^2} \int_R^{2R} \exp\{-\lambda A(r)\}\, r\,dr$$
+La taille moyenne du voisinage de 0 est donne´e par :
+$$\tilde{\delta}(0) = E\left[|\Gamma(0)|\right] = \lambda \pi R^2$$
+Le nombre moyen de voisins a` deux sauts de 0 (|Γ2(0)|) correspond au nombre de
+points v du processus se trouvant dans B(0, 2R)\B(0, R), conditionne´ par la proba-
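+bilité qu’il existe un voisin commun à chaque v et 0.
+On obtient :
+$$
+\begin{aligned}
+E\left[|\Gamma_2(0)|\right] &= 3\lambda\pi R^2\, P\left(d^-_0(v) > 0\right) \\
+&= 3\lambda\pi R^2 \left(1 - \frac{2}{3R^2} \int_R^{2R} \exp\{-\lambda A(r)\}\, r\,dr\right)
+\end{aligned}
+$$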
+Analyse de la premie`re e´tape de l’algorithme de se´lection des MPR.
+Nous nous inte´ressons maintenant plus particulie`rement a` la premie`re e´tape de l’al-
+gorithme de se´lection. Dans un premier temps, nous de´terminons le nombre moyen
+de points isole´s pour le point 0. Comme nous l’avons vu, l’unique voisin d’un point
+isole´ appartenant aussi a` Γ(0) est obligatoirement un MPR1. Cependant, le nombre
+de points isole´s ne nous donne pas directement le nombre de MPR1 mais une borne
+supérieure car un même MPR1 peut couvrir plusieurs points isolés. Par exemple, sur la
+figure 4.10(a), nous avons quatre MPR1 mais sept nœuds isole´s. Le MPR1 i permet
+de couvrir deux nœuds isole´s : les nœuds j et k.
+Par définition, les nœuds isolés sont les nœuds $v \in \Gamma_2(0)$ tels que $d^-_0(v) = 1$.
+Proposition 5 Soit v un point uniformément distribué dans B(0, 2R)\B(0, R) et D
+l’ensemble des points isolés v (tels que $d^-_0(v) = 1$). On obtient :
+$$P\left(d^-_0(v) = 1\right) = \frac{2}{3R^2} \int_R^{2R}
+\lambda A(r) \exp\{-\lambda A(r)\}\, r\,dr$$
+Tout comme dans la proposition 4, nous ne considérons que les nœuds v tels que v ∈
+Γ2(0) :
+$$
+P\left(d^-_0(v) = 1 \mid v \in \Gamma_2(0)\right) =
+\frac{P\left(d^-_0(v) = 1\right)}{P\left(d^-_0(v) > 0\right)}
+$$
+Nous pouvons alors déduire de cette probabilité le nombre moyen de points isolés :
+$$E\left[|D|\right] = 2\pi\lambda^2
+\int_R^{2R} A(r) \exp\{-\lambda A(r)\}\, r\,dr$$
+qui constitue une borne supe´rieure pour le nombre de MPR1 :
+E [|MPR1|] ≤ E [|D|]
+4.6. ANALYSE DE LA SE´LECTION DES MPR DANS OLSR 87
+Dans la proposition suivante, nous donnons une borne infe´rieure du nombre moyen de
+MPR1 :
+Proposition 6 Soit u un point uniforme´ment distribue´ dans B(0, R).
+$$
+P(u \in MPR_1) \geq \frac{2}{R^2}\, P\left(d^+_0(u) > 0\right)
+\int_0^R \int_R^{R+r} f(x, r, R)
+\exp\left\{-\lambda\left(2\pi R^2 - A_1(R, x, R)\right)\right\}
+r\,dx\,dr
+$$
+R2 0 R
+ou` f(x, r, R) est la fonction densite´ de probabilite´ :
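+$$f(x, r, R) = \frac{-\lambda\left[\frac{\partial}{\partial x} A_1(x, r, R) - 2\pi x\right]}
+{1 - \exp\left\{-\lambda\left(A_1(R, r, R) - \pi R^2\right)\right\}}
+\exp\left\{-\lambda\left(A_1(x, r, R) - \pi x^2\right)\right\}$$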
+De cette probabilite´, nous pouvons de´duire une borne infe´rieure pour le nombre moyen
+de MPR1 :
+$$
+E\left[|MPR_1|\right] \geq 2\lambda\pi\, P\left(d^+_0(u) > 0\right)
+\int_0^R \int_R^{R+r} f(x, r, R)
+\exp\left\{-\lambda\left(2\pi R^2 - A_1(R, x, R)\right)\right\}
+r\,dx\,dr
+$$
+Preuve 6 Pour e´tablir la borne infe´rieure de la probabilite´ qu’un point de Γ(0) soit un
+MPR1, nous nous basons sur une condition suffisante. Une condition suffisante pour
+que u ∈ MPR1 est que le point w de Γ(u) le plus e´loigne´ de 0 est un point isole´
+(d−0 (w) = 1).
+Connaissant r, la distance entre 0 et u, on est capable de calculer la distribution de la
+distance entre 0 et w (le point du voisinage de u qui est le plus e´loigne´ de 0). Sachant
+alors la distance x entre 0 et w, on calcule la probabilite´ qu’il n’existe qu’un seul
+point (le point u) dans l’intersection des voisinages de 0 et w. Cette dernie`re condition
+garantit que w est un point isole´ et que u ∈ MPR1. On inte`gre alors cette dernie`re
+probabilite´ par les distributions de r et de x pour obtenir le re´sultat final. Cette borne
+est tre`s fine puisque, dans la plupart des cas, les points isole´s sont les nœuds les plus
+éloignés de 0. □
+Nous nous sommes aussi inte´resse´s a` la distribution spatiale des MPR1. Nous avons
+pour cela calcule´ un encadrement de la probabilite´ qu’un point u ∈ Γ(0) a` distance
+r de 0 soit un MPR1 en fonction de sa distance a` 0. Pour cela, nous conside´rons un
+point u ∈ Γ(0) a` distance r (0 < r ≤ R) de 0. Nous fixons ces deux points (u et
+0) et distribuons les points du processus de Poisson dans B(0, 2R) inde´pendamment
+de ces deux points. Nous cherchons alors quelle est la probabilite´ que ce nœud soit
+un MPR1(0). Dans la proposition suivante, nous proposons un encadrement de cette
+probabilite´.
+88 CHAPITRE 4. DIFFUSION
+Proposition 7 Soit u un point à distance r (0 < r ≤ R) de 0.
+$$P(u \in MPR_1) \geq \left(1 - \exp\{-\lambda(\pi R^2 - A(r))\}\right) \int_R^{R+r} f(v, r, R) \exp\{-\lambda(2\pi R^2 - A_1(R, v, R))\} \, dv$$
+$$P(u \in MPR_1) \leq 1 - \left(1 - \exp\left\{-\lambda \frac{A(R+r)}{2}\right\}\right)^2$$
+Preuve 7 La borne infe´rieure est obtenue de la meˆme fac¸on que la borne infe´rieure
+du nombre de MPR1 donne´e dans la proposition 6, mais la distance entre 0 et u est
+cette fois fixe´e. La borne supe´rieure est obtenue a` partir de l’ide´e suivante. S’il existe
+des points v dans les deux demi-intersections de cercle illustre´s sur la figure 4.12, la
+plupart des voisins de u appartenant a` Γ(u) ∩ Γ2(0) sont couverts par ces points v
+(en plus de u) et ne sont donc pas isole´s. Concernant les points non couverts par les
+points v, nous pouvons montrer facilement que la meˆme borne reste valable. Cela nous
+donne une probabilite´ que u ne soit pas un MPR1, de laquelle nous pouvons de´duire
+la probabilite´ que u soit un MPR1. 
+Upper semi−intersection
+0 u
+Lower semi−intersection
+r R
+FIG. 4.12 – Les deux demi-intersections utilise´es dans la preuve de la proposition 7.
+4.6.3 Re´sultats nume´riques et simulations
+Afin d’estimer de fac¸on nume´rique les re´sultats obtenus pre´ce´demment, nous avons
+simule´ l’algorithme de se´lection des MPR. Nous utilisons le meˆme mode`le que celui
+e´tudie´ lors de l’analyse the´orique, a` savoir que les nœuds sont re´partis sur une boule
+B(0, 2) (R = 1) avec un processus ponctuel de Poisson d’intensite´ λ > 0. Nous
+ajoutons le point 0 au centre de la boule et e´tudions le nombre de MPR se´lectionne´s par
+ce point a` chaque e´tape de l’algorithme. La figure 4.13 repre´sente des e´chantillons du
+mode`le pour diffe´rentes valeurs de λ. Le point 0 pour lequel nous e´tudions l’algorithme
+est le point noir central. Les points à l’intérieur du cercle sont les points de Γ(0), les
+4.6. ANALYSE DE LA SE´LECTION DES MPR DANS OLSR 89
+(a) λπ = 6 (b) λπ = 45
+FIG. 4.13 – Sélection des MPR pour λπ = 6 et λπ = 45.
+plus gros e´tant les MPR1. Les points a` l’exte´rieur du cercle sont les voisins a` deux
+sauts de 0, les points bleus e´tant ceux couverts par les MPR1.
+On remarquera que dans les deux cas, la quasi-totalité du 2-voisinage de 0 est couverte
+par les MPR1. L’ajout d’un seul point MPR suffirait à couvrir l’intégralité de Γ2(0).
+Nous avons vu qu’il existe en moyenne un grand nombre de points isole´s, donnant
+naissance a` un grand nombre de MPR1. Ces MPR1 semblent eˆtre re´gulie`rement
+distribue´s pre`s de la frontie`re de B(0, R), ce qui confirme les re´sultats obtenus dans la
+proposition 7 et explique pourquoi ils couvrent une grande partie de Γ2(0).
+ 20
+analytic lower bound 1
+analytic upper bound
+18 number of MPR selected at the step 1 total number of MPR
+ 16 0,8
+ 14
+0,6
+ 12
+ 10
+0,4
+ 8
+ 6
+0,2
+ 4
+ 2 0
+0,2 0,3 0,4 0,5 0,6 0,7 0,8 0,9
+ 20  40  60  80  100  120
+mean number of neighbors distance from the origin
+(a) Nombre moyen de MPR et MPR1 obtenus par simulation et bornes analytiques du nombre de MPR1.
+(b) Bornes inférieure et supérieure de la probabilité pour un voisin de 0 d’être un MPR1(0) en fonction de la distance au point 0.
+FIG. 4.14 – Comparaison des re´sultats analytiques et de simulation.
+La figure 4.14(a) montre le nombre moyen de MPR et MPR1 obtenus par simulation
+ainsi que les bornes analytiques du nombre de MPR1. On observera qu’approxima-
+tivement 75% des MPR sont e´lus lors de la premie`re e´tape de l’algorithme (et sont
+number of MPR
+90 CHAPITRE 4. DIFFUSION
+des MPR1), ce qui confirme le fait que les MPR1 couvrent la quasi-totalite´ du 2-
+voisinage. Comme mentionne´ auparavant, la borne infe´rieure est une borne tre`s fine du
+nombre de MPR1 moyen.
+L’encadrement de la probabilité qu’un voisin de 0 soit élu comme MPR1(0) (donné
+dans la proposition 7) nous permet de montrer que les MPR1 sont répartis à proximité
+de la frontière de la portée radio R de 0. La figure 4.14(b) montre ces bornes pour une
+distance r entre les nœuds 0 et ses voisins variant de 0.2 a` 0.999 pour λ = 15. On
+remarque que ces re´sultats de´pendent de λ : plus λ augmente, plus la distance entre 0
+et ses MPR1 augmente aussi (puisque 0 a plus de chances d’avoir des voisins proches
+de la frontie`re).
+4.6.4 Conse´quences
+Comme nous l’avons vu dans les sections pre´ce´dentes, le but recherche´ en introduisant
+les MPR est de minimiser le nombre de relais lors de la diffusion du trafic de controˆle.
+Le nombre de MPR doit donc eˆtre aussi petit que possible. Bien que plusieurs travaux
+aient cherche´ a` optimiser l’algorithme glouton de se´lection des MPR, seule la seconde
+e´tape de l’algorithme peut eˆtre ame´liore´e puisque la premie`re est indispensable pour
+couvrir l’ensemble du 2-voisinage d’un nœud. Or, comme nous avons pu le constater
+au cours de nos analyses et simulations, cette premie`re e´tape me`ne a` la se´lection de
+plus de 75% des MPR. Cela signifie que les ame´liorations pouvant eˆtre apporte´es ne
+portent que sur 25% des MPR, ce qui explique que les variantes de l’algorithme de
+se´lection ne produisent aucune ame´lioration significative.
+Malheureusement, cette caracte´ristique peut e´galement eˆtre une source de proble`me de
+robustesse. En effet, si 75% des MPR de u couvrent au moins un nœud isolé, la perte
+d’un de ces nœuds engendre une forte probabilité qu’au moins un voisin v à 2 sauts de
+u ne reçoive plus un message envoyé par u. Il se peut bien sûr que v reçoive le message
+de u via un autre chemin mais ce dernier ne serait plus optimal comme le clame OLSR.
+De plus, si v est tel que v ∈ MPR(u) et v ∈/ MPR(w), il peut recevoir un message
+pour la premie`re fois par w plutoˆt que u mais ne le re-transmettra pas puisqu’il n’est
+pas un MPR de w. Cela peut conduire a` l’isolation de certaines parties du re´seau lors
+d’une diffusion, comme l’illustre la figure 4.15. Les nuages repre´sentent deux parties
+connexes du re´seau, connecte´es par les nœuds b et c. Comme le nœud e est un nœud
+isole´ pour a, a e´lit c en tant que MPR. Il ne choisit pas b puisque le nœud d couvert
+par b l’est e´galement par c. Supposons que le lien entre c et a tombe et que la diffusion
+se propage avant que a n’ait pu recalculer ses MPR. Bien que le re´seau soit encore
+connecte´, la partie droite du re´seau ne sera pas touche´e par la diffusion car b n’e´tant
+pas MPR de a, il ne re-transmettra pas le message. Ce phe´nome`ne peut expliquer les
+mauvais re´sultats obtenus par les MPR lors de l’e´tude de la robustesse des protocoles
+de diffusion en section 4.5. De plus, les liens entre un nœud et ses MPR ont de fortes
+probabilite´s de casser dans un environnement mobile puisque, comme nous avons pu le
+constater, les MPR sont situe´s a` proximite´ de la frontie`re de la porte´e de transmission
+des nœuds. Ils sont donc plus enclins a` basculer en dehors de la zone de transmission
+et ainsi a` casser le lien radio.
+4.7. CONCLUSION ET PERSPECTIVES 91
+b
+d
+a
+c e
+(a)
+FIG. 4.15 – Exemple.
+4.7 Conclusion et perspectives
+Dans ce chapitre, nous avons tire´ avantage de certaines caracte´ristiques des clusters
+forme´s par notre heuristique pour proposer une utilisation supple´mentaire de la struc-
+ture. En effet, la structure d’arbres sous-jacente des clusters permet l’application d’un
+protocole de diffusion aussi bien dans un cluster que sur l’ensemble du re´seau, ceci
+avec un couˆt faible et borne´ et une maintenance quasi-locale. Nous avons analyse´ de
+fac¸on the´orique le nombre de re´ceptions par nœud lors d’une diffusion. Puis, nous
+avons pu constater que notre algorithme de diffusion proposait le meilleur compromis
+couˆt en e´nergie - latence - robustesse parmi les protocoles de diffusion existant dans la
+litte´rature.
+Dans le futur, il serait inte´ressant d’e´tudier ce protocole dans un environnement plus
+mobile. Dans notre approche, nous conside´rons une couche MAC ide´ale afin de pouvoir
+comparer les protocoles de niveau 3 sans s’occuper des proble`mes qui peuvent surve-
+nir aux niveaux infe´rieurs et influer sur les performances de chacun de ces protocoles.
+Cependant, comme nous l’avons mentionne´, plus le nombre de messages e´change´s
+est important, plus fortes sont les collisions survenant aux niveaux infe´rieurs. Il sem-
+blerait donc inte´ressant d’e´tudier un protocole de diffusion qui ne soit pas cloisonne´
+a` la couche re´seau mais qui prenne en conside´ration les caracte´ristiques de plusieurs
+couches en meˆme temps, plutoˆt que de chercher a` optimiser un protocole a` un niveau
+particulier.
+92 CHAPITRE 4. DIFFUSION
+4.8 Publications
+1. Journaux et revues avec comite´ de lecture :
+(a) Efficient Broadcasting in Self-Organizing Sensor Networks. Nathalie Mit-
+ton, Anthony Busson et E´ ric Fleury. International Journal of Distributed
+Sensor Networks (IJDSN), Volume 1, Janvier 2006.
+2. Colloques et confe´rences internationaux avec comite´ de lecture :
+(a) Efficient Broadcasting in Self-Organizing Multi-Hop Wireless Network.
+Nathalie Mitton, Éric Fleury. Conference on AD-HOC Networks & Wire-
+less (Ad Hoc Now’05), 6-8 Octobre 2005, Cancún, Mexique. Sélectionné
+parmi les meilleurs papiers pour une soumission à un numéro spécial du
+journal JDA.
+(b) An analysis of the MPR selection in OLSR and consequences. Anthony
+Busson, Nathalie Mitton and E´ ric Fleury. Mediterranean Ad Hoc Net-
+working Workshop (MED-HOC-NET’05), Juin 2005, Ile de Porquerolles,
+France.
+(c) Broadcast Analysis in Multi-hop Wireless Networks. Nathalie Mitton, An-
+thony Busson and E´ ric Fleury. Invited Paper at Spatial Stochastic Modeling
+of Wireless Networks (SpasWIN’05), Avril 2005, Riva de Garda, Italie.
+(d) An analysis of the MPR selection in OLSR. Anthony Busson, Nathalie Mit-
+ton and E´ ric Fleury. Spatial Stochastic Modeling of Wireless Networks
+(SpasWIN’05), Avril 2005, Riva de Garda, Italie.
+3. Colloques et confe´rences nationaux :
+(a) Une analyse de la se´lection des MPR dans OLSR. Anthony Busson, Natha-
+lie Mitton et E´ ric Fleury. ALGOTEL’05, Mai 2005, Presqu’ıˆle de Giens,
+France.
+4. Rapports de recherche :
+(a) Broadcast in Self-organizing Wireless Multi-hop Network. Nathalie Mitton,
+Anthony Busson and E´ ric Fleury. RR-5487. Fe´vrier 2005.
+(b) An analysis of the MPR selection in OLSR. Anthony Busson, Nathalie Mit-
+ton and E´ ric Fleury. RR-5468. Janvier 2005.
+5. Journaux en cours de soumission :
+(a) Efficient Broadcasting and Self-Stabilization in Self-Organizing Multi-hop
+Wireless Networks. Nathalie Mitton, E´ ric Fleury, Isabelle Gue´rin-Lassous
+and Bruno Se´ricola and Se´bastien Tixeuil. ”Best Papers of Adhoc Now
+2005” special issue of the Journal of Discrete Algorithms (JDA).
+6. Se´minaires, pre´sentations, expose´s :
+(a) Diffusion efficace dans les re´seaux sans fil multi-sauts. Nathalie Mitton,
+E´ ric Fleury. Journe´es RESCOM - Villeneuve d’Ascq - France - 6-7 Mars
+2005.
+(b) An analysis of the MPR selection in OLSR. Anthony Busson, Nathalie Mit-
+ton, Eric Fleury. Se´minaire ACI FRAGILE - Aussois - France - 23-24 Mars
+2005.
+4.9. ANNEXES 93
+4.9 Annexes
+Nous pre´sentons ici les preuves des propositions 1 et 2 donnant le nombre de re´ceptions
+par nœud lors de la diffusion d’un message.
+Preuve de la proposition 1 Étant donné un processus ponctuel stationnaire Φ d’in-
+tensité λ (λ > 0), soit ΦRelay d’intensité λRelay un amincissement de Φ. Les points de
+ΦRelay représentent les relais. Nous supposons que ΦRelay est toujours un processus
+ponctuel stationnaire. On cherche à montrer que le nombre moyen de réceptions d’un
+même message par nœud r est :
+$$r = E^o_{\Phi}\left[\Phi_{Relay}(B'_0)\right]$$
+où $E^o_{\Phi}\left[\Phi_{Relay}(B'_0)\right]$ est l’espérance sous Palm par rapport au processus Φ (et donc la
+valeur moyenne du nombre de relais dans $B'_0$).
+Pour un point donne´, c.a`.d. le point 0 sous les probabilite´s de Palm, le nombre moyen
+de re´ceptions correspond au nombre moyen de points de ΦRelay dans le voisinage de 0
+(a` distance infe´rieure ou e´gale a` R).
+À partir de la formule de Mecke [76], on peut déduire que le nombre total de réceptions
+Z reçues par l’ensemble des nœuds d’une surface S est :
+$$Z = E\left[\int_S \Phi_{Relay}(B'_x)\,\Phi(dx)\right] = \lambda E^o_{\Phi}\left[\Phi_{Relay}(B'_0)\right]$$
+Par stationnarité des deux processus ponctuels Φ et ΦRelay, nous avons :
+$$E\left[\int_S \Phi_{Relay}(B'_x)\,\Phi(dx)\right] = E\left[\int_S \Phi(B'_x)\,\Phi_{Relay}(dx)\right]$$
+La partie gauche de l’e´quation est le nombre total de re´ceptions rec¸ues par les nœuds de
+la surface S, sachant que les nœuds en bordure peuvent recevoir le message depuis des
+nœuds en dehors de S. La partie droite de l’e´quation est le nombre de re´ceptions rec¸ues
+par l’ensemble des nœuds du processus Φ mais ge´ne´re´es uniquement par les relais se
+trouvant dans S. En appliquant la formule de Mecke de part et d’autre de l’e´quation,
+on obtient :
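+$$\lambda E^o_{\Phi}\left[\Phi_{Relay}(B'_0)\right] = \lambda_{Relay} E^o_{\Phi_{Relay}}\left[\Phi(B'_0)\right]$$
+d’où :
+$$r = E^o_{\Phi}\left[\Phi_{Relay}(B'_0)\right] = E^o_{\Phi_{Relay}}\left[\Phi(B'_0)\right] P^o_{\Phi}(0 \in \Phi_{Relay}) = \frac{\lambda_{Relay}}{\lambda} E^o_{\Phi_{Relay}}\left[\Phi(B'_0)\right]$$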
+94 CHAPITRE 4. DIFFUSION
+Preuve de la proposition 2 Étant donné un graphe aléatoire G(V,E) et un ensemble
+de relais Relay ⊂ V où les degrés des nœuds et des relais ainsi que le nombre de
+réceptions par nœud sont équi-distribués. On cherche à montrer que le nombre moyen
+de réceptions par nœud r s’écrit :
+$$r = E\left[\delta(v_1) \mid v_1 \in Relay\right] P(v_1 \in Relay) \qquad (4.2)$$
+Soient N une variable ale´atoire repre´sentant le nombre de sommets dans G (N = |V |)
+et Z le nombre total de re´ceptions induites sur les nœuds du re´seau par la diffusion.
+Pour tout u ∈ V , nous de´finissons δR(u) comme le nombre de relais dans le voisinage
+de u.
+Comme seuls les relais e´mettent le message, les liens e´tant bidirectionnels, le nombre
+de re´ceptions du message perc¸ues par un nœud (qu’il soit lui-meˆme relais ou non)
+correspond au nombre de relais dans son voisinage. Nous avons donc :
+r = E[δR(u)], ∀u ∈ V
+ou` E[δR(u)] est l’espe´rance de la variable δR(u) et correspond a` sa valeur moyenne.
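+Les liens étant bidirectionnels, Z peut s’écrire de deux façons :
+$$Z = \sum_{u \in V} \delta_R(u) \qquad (4.3)$$
+ou
+$$Z = \sum_{v \in Relay} \delta(v) = \sum_{v \in G} \delta(v)\,\mathbf{1}_{v \in Relay} \qquad (4.4)$$
+où $\mathbf{1}_{v \in Relay} = 1$ si v ∈ Relay et $\mathbf{1}_{v \in Relay} = 0$ sinon.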
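+À partir de la première formulation de Z (équation 4.3), on a
+$$\begin{aligned}
+E\left[\frac{Z}{N}\right] &= \sum_{k=1}^{+\infty} E\left[\left.\frac{\sum_{i=1}^{k} \delta_R(u_i)}{k} \,\right|\, N = k\right] P(N = k) \\
+&= \sum_{k=1}^{+\infty} \sum_{i=1}^{k} \frac{1}{k} E\left[\delta_R(u_i) \mid N = k\right] P(N = k) \\
+&= \sum_{k=1}^{+\infty} \frac{k}{k} E\left[\delta_R(u_1) \mid N = k\right] P(N = k) \\
+&= \sum_{k=1}^{+\infty} E\left[\delta_R(u_1) \mid N = k\right] P(N = k) \\
+&= E\left[\delta_R(u)\right]
+\end{aligned}$$
+Couplé à la définition de r donnée en équation 4.2, on a :
+$$r = E\left[\frac{Z}{N}\right]$$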
+4.9. ANNEXES 95
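+Cette dernière égalité nous permet de calculer la valeur moyenne de $\frac{Z}{N}$ : $E\left[\frac{Z}{N}\right]$ en
+utilisant cette fois la deuxième formulation de Z (équation 4.4). Nous conditionnons
+cette quantité par les différentes valeurs de N :
+$$\begin{aligned}
+r = E\left[\frac{Z}{N}\right] &= E\left[\frac{\sum_{v \in V} \delta(v)\,\mathbf{1}_{v \in Relay}}{N}\right] \\
+&= \sum_{k=1}^{+\infty} E\left[\left.\frac{\sum_{i=1}^{k} \delta(v_i)\,\mathbf{1}_{v_i \in Relay}}{k} \,\right|\, N = k\right] P(N = k) \\
+&= \sum_{k=1}^{+\infty} \sum_{i=1}^{k} \frac{1}{k} E\left[\delta(v_i)\,\mathbf{1}_{v_i \in Relay} \mid N = k\right] P(N = k) \\
+&= \sum_{k=1}^{+\infty} E\left[\delta(v_1)\,\mathbf{1}_{v_1 \in Relay} \mid N = k\right] P(N = k) \\
+&= E\left[\delta(v_1)\,\mathbf{1}_{v_1 \in Relay}\right] \\
+&= E\left[\delta(v_1) \mid v_1 \in Relay\right] P(v_1 \in Relay)
+\end{aligned}$$
+où v1 est un nœud choisi arbitrairement parmi les sommets de G.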
+96 CHAPITRE 4. DIFFUSION
+Chapitre 5
+Localisation et routage
+5.1 Introduction
+Nous avons propose´ un algorithme de clustering pour organiser le re´seau (chapitre 3)
+afin de pouvoir utiliser le re´seau sans fil multi-sauts sur de larges e´chelles. Nous avons
+vu comment une telle structure de clusters peut eˆtre utilise´e pour effectuer une dif-
+fusion efficace, aussi bien dans tout le re´seau que dans un cluster. Dans ce chapitre,
+nous expliquons comment nous comptons utiliser notre organisation de clusters pour
+le routage et permettre a` toute paire de nœuds de communiquer. Dans tout type de
+re´seau, pour router un message vers un nœud destination v, un nœud u doit avoir une
+information sur la position de v. Dans les re´seaux filaires, l’information de routage
+est encapsule´e dans l’adresse du nœud, celle-ci e´tant de´pendante de la topologie du
+re´seau. Par exemple, une adresse IP identifie un nœud et en meˆme temps permet de le
+situer puisque le pre´fixe du re´seau est inclus dans l’adresse IP. Dans les re´seaux sans fil,
+l’identifiant permanent du nœud ne peut inclure sa position du fait de sa mobilite´ et est
+donc inde´pendant de la topologie sous-jacente. Les protocoles de routage utilise´s dans
+les re´seaux filaires ne peuvent eˆtre applique´s. Une approche possible est d’utiliser un
+routage indirect. Une opération de routage est qualifiée d’indirecte si elle s’effectue
+en deux e´tapes : (i) le look-up qui permet de situer le nœud cible, puis, (ii) le routage
+qui permet a` la source de communiquer directement avec le nœud cible´. La figure 5.1
+illustre un routage indirect. Le nœud u veut communiquer avec le nœud v mais il doit
+d’abord le localiser. Pour cela, il effectue l’ope´ration de look-up : il demande a` une
+troisie`me entite´ (ici, le nœud w) ou` se trouve v. Cette entite´ est un point de rendez-
+vous : v enregistre re´gulie`rement sa position aupre`s de w qui garde une trace de la
+position de v. Une fois que w a répondu à u, u est en mesure de contacter directement
+v. Ce principe de routage est par exemple utilisé dans les réseaux de téléphonie GSM1
+ou dans le protocole Mobile IP2, où la position de la destination est préalablement de-
+mande´e respectivement aux HLR (Home Location Register) ou aux Home Agent avant
+1http ://www.gsm.org
+2http ://www.ietf.org/rfc/rfc2002.txt
+97
+98 CHAPITRE 5. LOCALISATION ET ROUTAGE
+d’e´tablir directement la communication entre le demandeur et la destination. Cepen-
+dant, un tel principe ne peut eˆtre mis en œuvre dans un re´seau sans fil de type ad hoc
+car tous les nœuds sont susceptibles de bouger, y compris les Home Agents potentiels.
+w
+2. V is at (X,Y)
+1:  Where is v? v
+3. Route towards v
+u
+FIG. 5.1 – Routage indirect : le nœud u veut communiquer avec le nœud v mais ne
+connaıˆt pas sa position. Il demande donc dans un premier temps a` une troisie`me entite´
+(ici, le nœud w) ou` se trouve v. w sait ou` se trouve v car v enregistre re´gulie`rement sa
+position aupre`s de w qui peut re´pondre a` u. u est alors en mesure de contacter v.
+Nous nous proposons d’appliquer un sche´ma de routage indirect pour router dans des
+re´seaux sans fil multi-sauts a` large e´chelle. Nous de´sirons une solution qui permette le
+passage a` l’e´chelle du re´seau et qui doit donc maintenir le moins d’information pos-
+sible sur les nœuds. Nous voulons e´galement e´viter les situations ou` la distance entre
+la source (le nœud u sur la figure 5.1) et le point de rendez-vous (le nœud w) est plus
+importante que la distance entre la source (le nœud u) et la destination (le nœud v).
+En effet, si la requeˆte de localisation doit traverser deux fois le re´seau avant qu’une
+communication entre deux nœuds qui peuvent eˆtre proches s’e´tablisse, nous occupons
+inutilement la bande passante et introduisons une forte latence, ce qui empeˆche le pro-
+tocole d’eˆtre extensible.
+Un moyen d’appliquer un routage indirect est d’utiliser une Table de Hachage Dis-
+tribue´e (DHT - Distributed hash table). L’imple´mentation des DHT dans les re´seaux
+sans fil a donne´ naissance a` de nouvelles proble´matiques [64]. De plus, un tel adres-
+sage offre une approche prometteuse pour permettre le passage a` l’e´chelle [30]. Les
+DHT fournissent une association ge´ne´rale entre une clef et toute sorte d’information
+(comme l’identite´ d’un nœud ou une position). Elles utilisent un espace d’adressage
+virtuel V . Des partitions de cet espace virtuel sont allouées aux nœuds du réseau.
+L’ide´e est d’utiliser une fonction depuis un espace re´el vers un espace virtuel V . Cette
+fonction, dite de hash, permet aux nœuds d’identifier certains points de rendez-vous
+aupre`s desquels ils enregistrent leur position. Cette fonction de hash est connue de tous
+les nœuds du re´seau et peut ensuite eˆtre utilise´e par un nœud source pour retrouver ces
+meˆmes points de rendez-vous et leur demander la position du nœud qu’ils recherchent.
+Une information connue de tous (comme le nom de notre destinataire) est hashe´e en
+une clef (hash(v) = clev) de l’espace d’adressage virtuel V . Les informations as-
+socie´es a` cette clef (comme la position des nœuds) sont ensuite stocke´es sur le (ou les)
+nœud(s) responsable(s) de la partition de l’espace virtuel auquel la clef appartient. Par
+exemple, sur la figure 5.1, nous avons hash(v) = Position nœud v ∈ I ⊂ V et
+le nœud w est responsable de l’intervalle I . En connaissant I , les nœuds v et u sont
+5.1. INTRODUCTION 99
+capables de trouver w soit pour s’enregistrer (pour le nœud v) soit pour lui demander
+ou` se trouve v (pour le nœud u). On remarque que les nœuds u et v n’ont pas besoin de
+connaître la vraie identité de w, mais juste son adresse virtuelle dans V . Cette opération
+retournant le(s) nœud(s) responsable(s) d’une certaine clef dans les syste`mes utilisant
+des DHT, est appele´e look-up. Plus de de´tails au sujet des ope´rations de look-up sont
+donne´s dans [10].
+Dans la litte´rature, les DHT sont utilise´es a` deux niveaux : au niveau de la couche appli-
+cation et au niveau de la couche re´seau. Les DHT sont utilise´es au niveau applicatif en
+particulier dans les syste`mes pair-a`-pair. La clef ”hache´e” dans ces syste`mes de partage
+de fichiers est l’identifiant d’un fichier (cle = hash(fichier)). L’information associe´e
+a` la clef et maintenue par le nœud responsable de cette clef est l’identite´ des nœuds
+du re´seau qui de´tiennent ce fichier. Les adresses virtuelles des nœuds (ou partitions de
+V dont ils sont responsables) forment un re´seau overlay (c.a`.d un re´seau virtuel base´
+sur le re´seau physique qui maintient des liens logiques entre les nœuds) sur lequel les
+requeˆtes sont route´es. Ce qui diffe´rencie majoritairement les diffe´rentes propositions
+de re´seaux pair-a`-pair dans la litte´rature est la ge´ome´trie de ce re´seau overlay. En effet,
+la forme de ce re´seau va de l’anneau (Chord [73]) au graphe de De Bruijn (D2B [33])
+en passant par des arbres (Tapestry [84], Kademlia [54]), des espaces d-dimensionnels
+(CAN [68]), des structures en forme de papillon [52] ou encore des structures hybrides
+arbres-anneaux (Pastry [70]).
+Lorsqu’elles sont utilise´es au niveau de la couche re´seau, les DHT distribuent les in-
+formations de position des nœuds a` travers le re´seau et sont utilise´es pour identifier
+un nœud pouvant fournir des informations permettant de joindre le nœud destination.
+C’est de cette fac¸on que nous nous proposons d’utiliser les DHT. Quand un nœud u
+doit envoyer une information a` v, il doit d’abord le localiser et pour cela, demander a`
+un nœud w, responsable de la clef k = hash(v). Parmi les DHT applique´es au niveau
+re´seau, le routage utilise´ dans les diffe´rentes propositions est de deux sortes : un rou-
+tage inde´pendant de la DHT (le routage n’utilise pas l’espace virtuel V) et un routage
+de´pendant de la DHT (le routage utilise l’espace virtuel V).
+Lorsque le routage est inde´pendant de la DHT, les nœuds disposent ge´ne´ralement de
+leurs coordonnées géographiques absolues (obtenues par exemple avec un GPS) ou re-
+latives (comme dans [17]). C’est cette information qu’ils associent a` la clef. En ef-
+fectuant hash(destination), un nœud u obtient des coordonne´es ge´ographiques d’une
+”zone rendez-vous” A. u peut alors appliquer un routage ge´ographique classique afin
+d’envoyer sa requeˆte vers un nœud v se trouvant dans la zone A et qui de´tient les
+coordonne´es ge´ographiques de la destination cherche´e par u. De la`, u effectue de nou-
+veau un routage ge´ographique mais cette fois, directement vers la destination. Ce type
+de routage inde´pendant de la DHT est utilise´ par exemple dans [6, 57, 58], dans les
+projets ”Terminodes” [15, 16] et ”Grid” [48]. Dans notre cas, les nœuds ne disposent
+d’aucune information concernant leur position ge´ographique et nous aimerions e´viter
+l’utilisation d’un GPS. De ce fait, nous ne pouvons utiliser ce type de routage indirect.
+Dans le cas où le routage est dépendant de la DHT, l’espace virtuel V qui lui est associé
+est utilise´ non seulement pour identifier les points de rendez-vous mais e´galement pour
+router vers ces points et vers la destination finale. Dans ce cas, l’adresse virtuelle d’un
+100 CHAPITRE 5. LOCALISATION ET ROUTAGE
+nœud de´pend de sa position. La cohe´rence du protocole de routage repose alors sur
+la cohe´rence de la distribution des partitions de l’espace virtuel V sur les nœuds du
+re´seau. Le routage est effectue´ sur la structure logique et ne tient plus compte du
+re´seau physique sous-jacent. Dans de tels scenarii, un nœud u cherchant le nœud w
+re´cupe`re l’adresse virtuelle du point de rendez-vous v avec la fonction de hachage
+hash(w) = Idvirtuel(v). Les requeˆtes de look-up sont route´es dans V jusqu’a` v qui
+retourne l’adresse virtuelle de w. De la`, u joint w en utilisant son adresse virtuelle et en
+routant dans V . Ge´ne´ralement, le routage dans l’espace virtuel est un routage glouton :
+”Transmet a` ton voisin dans V dont l’adresse virtuelle est la plus proche de l’adresse
+virtuelle de la destination”. C’est ce qu’on trouve par exemple dans Tribe [78, 79] ou
+L+ [22] sur lequel se base SAFARI [69]. La principale difficulte´ ici est de re´partir les
+partitions de l’espace virtuel V de fac¸on a` ce que les routes obtenues en routant dans V
+ne soient pas beaucoup plus longues que les routes physiques.
+5.2 Localisation et routage sur une structure de clus-
+ters
+Dans notre proposition, chaque nœud de´tient une information concernant sa position
+relative : l’identite´ de son cluster. C’est cette information que les nœuds vont associer
+a` la clef de hachage. Comme nous avons une structure d’arbres, nous proposons de
+partitionner l’espace virtuel V dans chaque arbre. V e´tant ainsi duplique´ autant de fois
+que l’on a de clusters, on retrouve un nœud responsable d’une clef donne´e dans chaque
+arbre/cluster. Chaque nœud enregistre alors sa position dans chaque espace virtuel et
+donc dans chaque arbre. De cette fac¸on, lorsqu’un nœud v recherche un nœud u dans le
+re´seau, il a juste a` chercher dans son propre cluster. Comme l’excentricite´ d’un nœud
+dans un cluster est faible (voir chapitre 3.6.2), la distance a` parcourir pour atteindre
+le nœud de rendez-vous est e´galement faible. Partitionner ainsi plusieurs fois l’espace
+virtuel plutoˆt qu’une seule fois sur tout le re´seau e´vite les situations ou` la distance
+entre la source et le point de rendez-vous est supe´rieure a` la distance entre la source et
+la destination, puisque la source et le point de rendez-vous appartiennent toujours au
+meˆme cluster alors que la destination peut eˆtre n’importe ou` dans le re´seau.
+Pour distribuer les partitions de l’espace virtuel V de la DHT de telle fac¸on que, e´tant
+donne´e une adresse virtuelle, un nœud u soit en mesure de joindre le nœud en question
+sans information supple´mentaire, nous utilisons un sche´ma d’e´tiquetage d’arbre (tree
+Interval Labeling Scheme) pour ensuite permettre un routage par intervalle sur notre
+structure logique.
+Dans les diverses propositions de DHT que nous avons pre´sente´es, les deux phases du
+routage indirect (look-up et routage) sont toujours du meˆme type : inde´pendantes de
+la DHT et effectue´es dans l’espace physique ou de´pendantes de la DHT et effectue´es
+sur l’espace logique. Dans notre approche, les deux e´tapes de routage indirect sont ef-
+fectue´es diffe´remment. Le look-up est effectue´ en utilisant un routage par intervalle sur
+les adresses virtuelles des points de rendez-vous alors que l’e´tape de routage s’effectue
+dans l’espace physique, inde´pendamment de V .
+5.2. LOCALISATION ET ROUTAGE 101
+Le routage par intervalle s’est ave´re´ tre`s attractif de par sa simplicite´. Il a e´te´ introduit
+dans les re´seaux filaires par Santoro et Khatib dans [72] dans le but de re´duire la taille
+des tables de routage. L’ide´e est de repre´senter la table de routage de chaque nœud
+de manie`re compacte, en agre´geant l’ensemble des adresses destination qui peuvent
+eˆtre atteintes en utilisant le meˆme port de sortie, au moyen d’intervalles d’adresses
+conse´cutives. Par exemple, si l’on conside`re le graphe repre´sente´ sur la figure 5.2(a), le
+nœud 0 doit utiliser le port a pour atteindre les nœuds 4, 5 et 6, le port b pour atteindre
+1 et 2 et le port c pour atteindre 3. Plutoˆt que de cre´er une entre´e dans sa table de
+routage par nœud destination, il cre´e une entre´e par port de sortie et plutoˆt que de lister
+tous les nœuds accessibles via ce port, il stocke seulement l’intervalle contenant les
+adresses de ces nœuds : [4, 6] pour le port a, [1, 2] pour le port b et [3] pour le port
+c. Le principal avantage de ce type de routage est qu’il ne´cessite peu de me´moire sur
+les nœuds puisque la taille de la table de routage d’un nœud u est en O(δ(u)). Le
+routage est exe´cute´ de fac¸on distribue´e : a` chaque nœud interme´diaire x, si x n’est pas
+le nœud destination y, le message est transfe´re´ sur le port de sortie dont l’e´tiquette est
+un ensemble d’intervalles I tel que y ∈ I .
+Un Interval Labeling Scheme (ILS) est la fac¸on d’allouer les e´tiquettes des nœuds
+(adresses virtuelles) pour pouvoir de´finir les intervalles a` assigner aux areˆtes de chaque
+nœud, de fac¸on a` pouvoir effectuer un routage par intervalle efficace avec des routes
+aussi courtes que possible. Les auteurs de [77] ont montre´ qu’un arbre non-oriente´
+supportait un routage par intervalle avec de plus courts chemins (dans l’arbre) et en
+n’utilisant qu’un intervalle par areˆte sortante a` condition de distribuer les e´tiquettes
+(ILS) en effectuant un parcours en profondeur de l’arbre.
+Dans les réseaux filaires, dans un arbre, les nœuds doivent stocker un intervalle pour cha-
+cune des arêtes sortantes. La taille de la table de routage d’un nœud u est en O(δ(u)).
+Dans un environnement sans fil, l’émission d’un message atteint tous les nœuds se trou-
+vant à portée radio de l’émetteur. Les arêtes du graphe sont en réalité des hyper-arêtes
+(voir figure 5.2). La proble´matique est donc un peu diffe´rente puisque une requeˆte
+e´mise sera entendue par tous les voisins de la source, qu’elle leur soit destine´e ou pas.
+Comme les nœuds n’ont qu’une hyper-areˆte sortante, ils peuvent ne stocker qu’un seul
+intervalle. Nous proposons ici de tirer avantage de la nature diffusante du me´dium ra-
+dio. Les nœuds stockent l’intervalle global pour lequel leur sous-arbre est responsable
+et non plus un intervalle pour chaque voisin. Par exemple, si on conside`re la figure 5.2,
+le nœud 0 ne ge`re plus 3 intervalles mais un seul : [0, 6]. Cela donne une taille de table
+de routage en O(1) par nœud. Quand une requeˆte est envoye´e, tous les nœuds a` porte´e
+radio la rec¸oivent mais seuls ceux concerne´s y re´pondent.
+5.2.1 Re´sume´ et analyse de complexite´
+Pour re´sumer, nous proposons d’appliquer un routage indirect sur la structure en arbres
+de notre re´seau auto-organise´, en utilisant une DHT qui associe chaque nœud a` sa
+position dans le re´seau : son cluster. L’ensemble des adresses virtuelles V de la DHT
+est partitionne´ et re´parti sur les nœuds de chaque cluster. Comme le nombre de clusters
+102 CHAPITRE 5. LOCALISATION ET ROUTAGE
+6
+[1,5] a
+[6]
+6
+b a[6] [5] 5 [5]
+[6,4] 54 c [4,6] 4
+a [0,3]
+[1 2] [0,6]
+[1,2] a [4,6]
+0
+1
+b [3,0] [3]
+1 0b [3] [2] 3a c 2
+[2]
+[3,1] [4,2]
+a a2 3
+(a) Routage en environnement filaire. Les nœuds stockent un intervalle par arête sortante.
+(b) Routage en environnement sans fil. Les nœuds stockent un seul intervalle (un par hyper-arête).
+FIG. 5.2 – Areˆtes dans un re´seau filaire (a) Vs hyper-areˆtes dans un re´seau sans fil (b).
+est borne´ par une constante et que les clusters sont homoge`nes (chapitre 3), chaque
+nœud maintient finalement O(1) informations de position.
+Quand un nœud u doit joindre un nœud v, il obtient l’adresse virtuelle d’un point de
+rendez-vous en utilisant la fonction de hash : hash(v) = keyv ∈ V . Puis, a` partir
+de cette adresse, en appliquant un routage par intervalle sur l’espace virtuel V de son
+propre arbre, il re´cupe`re la position C(v) de v. Comme les intervalles des voisins de u
+ne sont pas maintenus par u, u stocke uniquement l’intervalle dont son arbre est res-
+ponsable. La taille de la table de routage de u est en O(1). Une fois que u connaıˆt C(v),
+il peut atteindre C(v) en employant un routage pro-actif entre clusters puis un routage
+re´actif pour joindre v une fois que le cluster destination est atteint. Comme le nombre
+de clusters est borne´ par une constante, chaque cluster a O(1) routes a` maintenir vers
+les autres clusters.
+5.3 Notre proposition
+5.3.1 Pre´liminaires
+Chaque nœud u posse`de deux adresses :
+– Une adresse universelle Id(u) ∈ ℝ (souvent notée u par la suite). Cette adresse est
+unique dans le réseau et ne change jamais. Elle est le « vrai » nom de u.
+– Une adresse logique i(u) ∈ V . Cette adresse est unique dans un cluster. Elle peut
+changer a` chaque re-distribution des partitions de V parmi les nœuds d’un cluster.
+Elle identifie le nœud u dans son espace logique.
+5.3. NOTRE PROPOSITION 103
+Soit I(u) la partition de V assignée au nœud u. I(u) est telle que I(u) = [i(u), ...[
+où i(u) est l’adresse logique de u dans V . i(u) dépend donc de I(u). On note
+$I_{tree}(s^T(u)) = \bigcup_{v \in s^T(u)} I(v)$ l’intervalle/partition de V pour lequel le sous-arbre
+de racine u est responsable. |I| désigne la taille de l’intervalle I.
+5.3.2 Distribution des partitions de l’espace virtuel - ILS
+Comme mentionne´ dans la section 5.2, une distribution optimale des intervalles sur un
+arbre est obtenue via une nume´rotation des nœuds obtenue par un parcours en profon-
+deur ILS (Depth First Search DFS-ILS).
+Comme dans tout ILS traditionnel, les partitions de V sont attribue´es a` chaque nœud
+u ∈ V de sorte que :
+– Les intervalles des nœuds de sT (u) forment un intervalle continu.
+– La taille de l’intervalle dont un sous-arbre est responsable est proportionnelle a` la
+taille de ce sous-arbre : |Itree(sT (u))| ∝ |sT (u)|. Et donc, pour tout nœud v ∈
+sT (u), |Itree(sT (u))| ≥ |Itree(sT (v))|.
+– V est entièrement distribué parmi les nœuds du cluster : $V = \bigcup_{v \in C(u)} I(v)$.
+– Les différents intervalles s’excluent mutuellement : $\forall v \in C(u), \forall w \in C(u), v \neq w \Rightarrow$
+$I(v) \cap I(w) = \emptyset$.
+Nous proposons une re´partition des intervalles distribue´e, qui s’effectue en paralle`le sur
+chaque branche de chaque arbre. Chaque nœud u ne´cessite des informations pouvant
+se trouver jusqu’a` dtree(u,H(u)) sauts de lui ou` dtree(u,H(u)) est le nombre de sauts
+dans l’arbre entre u et son cluster-headH(u). La distance dtree(u,H(u)) est borne´e par
+la hauteur des arbres qui est elle-meˆme borne´e par une constante (voir chapitre 3.6.2).
+Cette distribution peut donc eˆtre qualifie´e de quasi-locale selon la taxonomie e´tablie
+en [81], ce qui implique une maintenance rapide du processus.
+Notre algorithme s’exe´cute en deux temps : une premie`re phase pendant laquelle les
+nœuds remontent des informations depuis les feuilles de l’arbre jusqu’a` sa racine et une
+seconde phase ou` les nœuds internes distribuent re´cursivement les intervalles parmi
+leurs fils. La distribution des intervalles s’effectue en paralle`le sur chaque branche de
+chaque arbre, chaque phase ayant une complexite´ temporelle en O(Tree depth). La
+complexite´ temporelle totale de l’algorithme de distribution des intervalles pour un
+cluster est donc de 2 × (Tree depth). Comme la hauteur des arbres Tree depth est
+borne´e par une constante, la complexite´ temporelle devient O(1).
+La figure 5.3 illustre cette distribution d’intervalles pour V = [1, 17[.
+E´ tape 1. Comme nous l’avons de´ja` vu dans le chapitre 3.6.2, chaque nœud u est en
+mesure de savoir en un temps borne´ qui l’a choisi comme pe`re parmi ses voisins et
+donc connaıˆt son nombre de fils. Si un nœud est feuille, la taille de son sous-arbre
+est 1. De`s qu’un nœud interne a rec¸u la taille des sous-arbres de chacun de ses fils, il
+calcule la taille de son propre sous-arbre qui est la somme de la taille des sous-arbres de
+chacun de ses fils plus 1 : $|s^T(u)| = |\{u\} \cup \bigcup_{v \in Ch(u)} s^T(v)| = 1 + \sum_{v \in Ch(u)} |s^T(v)|$.
+Chaque nœud envoie la taille de son sous-arbre a` son pe`re et ainsi de suite jusqu’a`
+atteindre le cluster-head. C’est ce qu’illustre la figure 5.3(a).
+104 CHAPITRE 5. LOCALISATION ET ROUTAGE
+E´ tape 2. Une fois que le cluster-head connaıˆt la taille des sous-arbres de chacun de ses
+fils, il partage V équitablement entre lui-même et ses fils. Chaque fils v se voit attribuer
+une partition de V , Itree(sT (v)), de taille proportionnelle à la taille de son sous-arbre.
+Chaque nœud interne re-distribue alors l’intervalle qu’on lui a alloue´ entre lui et ses
+fils, et ainsi de suite, jusqu’a` atteindre les extre´mite´s des branches de l’arbre. Cette
+e´tape est illustre´e sur la figure 5.3(b).
+Ainsi, une fois les deux e´tapes de l’algorithme accomplies, chaque nœud est respon-
+sable d’une partition de V qui est de taille e´gale pour tous les nœuds d’un meˆme cluster.
+La figure 5.3(c) illustre le re´sultat d’une distribution des intervalles. Le nœud u se voit
+attribuer l’intervalle I(u) et est de´sormais responsable des clefs contenues dans cet
+intervalle et il doit stocker les positions des nœuds v tels que hash(v) ∈ I(u). On
+remarque qu’il peut exister plusieurs nœuds vi tels que hash(vi) = hash(vj).
+Chaque nœud interne u garde e´galement en me´moire l’intervalle alloue´ a` son sous-
+arbre Itree(sT (u)), sans pour autant stocker les informations associe´es a` toutes les
+clefs de Itree(sT (u)). Cela lui servira lors du routage des requêtes, comme nous le
+verrons dans la section 5.3.6.
+Comme nous l’avons mentionne´ dans le chapitre 3.6.2, un nœud interne a en moyenne
+peu de fils a` qui distribuer une partie de V . Cette ope´ration ne ge´ne`re donc que peu de
+calcul sur chaque nœud.
+5.3.3 Enregistrement
+Afin d’eˆtre localise´ par la suite, chaque nœud u doit enregistrer sa position (l’identite´
+de son cluster) aupre`s de chaque nœud responsable de la clef hash(u) dans son cluster,
+mais e´galement dans les autres clusters du re´seau. Pour s’enregistrer dans son propre
+cluster, u a juste besoin d’envoyer une requeˆte d’enregistrement ou Registration Re-
+quest, comme nous le de´taillerons plus tard dans la section 5.3.6. Pour s’inscrire dans
+les autres clusters, u doit tout d’abord joindre un nœud vi dans chaque cluster Ci. Puis,
+chaque vi envoie une Registration Request dans son propre cluster Ci au nom de u. Les
+nœuds vi peuvent eˆtre trouve´s via un routage pro-actif vers le cluster Ci, comme de´crit
+plus tard dans la section 5.3.7.
+Les nœuds s’enregistrent toutes les ∆(t) unite´s de temps. Une approche commune´ment
+adopte´e dans la litte´rature [1, 35, 56] est que les informations de localisation sont mises
+a` jour sur les points de rendez-vous en fonction de la distance de ces points de rendez-
+vous a` la source. Plus la distance est courte, plus les mises a` jour sont fre´quentes.
+5.3.4 De´parts et arrive´es
+Quand un nœud arrive dans un cluster, il n’est responsable d’aucun intervalle pour un
+certain temps.
+Quand un nœud disparaıˆt, les informations dont il e´tait en charge sont perdues (mais
+toujours disponibles dans les autres clusters). Chaque nœud interne u est constamment
+5.3. NOTRE PROPOSITION 105
+1 [1, 17[   
+    2
+   
+   
+4 [3, 5[        [13, 17[
+   
+   
+      
+    [6, 13[
+      
+   
+   
+          
+   
+      
+   
+   
+   
+      
+       1     2                              
+   
+   
+1        [7, 9[     [9, 13[ [15, 17[
+          
+   
+   
+      
+      
+          
+   
+      
+   
+      
+   
+   
+      
+      
+   
+      
+   
+      
+   
+   
+1              [11, 13[
+      
+      
+      
+      
+      
+      
+      
+(a) Étape 1 : chaque nœud envoie la taille de son sous-arbre à son père. Les
+feuilles (nœuds jaunes hachurés verticalement) envoient 1. Les nœuds internes
+(nœuds oranges hachurés horizontalement) rassemblent les informations de
+tous leurs fils et calculent la taille de leur propre sous-arbre avant de l’envoyer à
+leur propre père, et ainsi de suite, jusqu’à atteindre la racine (le cluster-head), nœud
+rouge hachuré en diagonale.
+(b) Étape 2 : chaque nœud interne partage l’intervalle donné par son père entre
+lui-même et ses fils, proportionnellement à la taille des sous-arbres de chacun. Les
+intervalles notés sur les flèches correspondent à ce qui est alloué par un nœud
+à ses fils, c.à.d l’intervalle dont le sous-arbre de chacun est en charge.
+[1, 3[
+   
+   
+   
+   
+   
+   
+      
+   
+   
+   
+   
+       [13, 15[
+   
+   
+[3, 5[     [5, 7[              
+   
+      
+   
+          
+      
+   
+          
+      
+[7, 9[    [9, 11[       [15, 17[
+      
+      
+      
+[11, 13[
+(c) Re´sultat : chaque nœud se voit attri-
+buer un intervalle de V dont il est respon-
+sable.
+FIG. 5.3 – Distribution des partitions de l’espace virtuel.
+106 CHAPITRE 5. LOCALISATION ET ROUTAGE
+au courant des arrive´es et de´parts de ses fils graˆce aux paquets HELLO. S’il constate
+des changements trop importants parmi eux, il peut de´cider localement de redistri-
+buer l’intervalle Itree(sT (u)) dont son sous arbre est en charge entre lui-meˆme et ses
+fils. Plus un nœud interne est proche du chef de cluster, plus les re´-attributions qui
+de´couleront de sa de´cision seront importantes, puisqu’elles se re´percutent de pe`re en
+fils jusqu’a` atteindre les feuilles. De plus, une nouvelle attribution des intervalles im-
+plique un changement d’adresse logique pour les nœuds. Cependant, comme constate´
+pre´ce´demment, plus un nœud est proche du chef de cluster, plus son voisinage est
+stable.
+Lorsque les intervalles sont re-distribue´s, chaque nœud u qui e´tait pre´alablement res-
+ponsable de l’intervalle Iold et qui se voit de´sormais attribuer la partition Inew ne
+conserve que les informations relatives aux clefs de Iold ∩ Inew . De fac¸on a` ne pas
+perdre pour autant les informations associe´es aux clefs de Iold \ Inew , u envoie des
+Registration Request au nom de tous les nœuds v dont il n’est plus en charge c.a`.d les
+nœuds v tels que hash(v) ∈ Iold \ Inew.
+5.3.5 Ajouter de la redondance et de la robustesse
+Comme mentionne´ dans la section 5.3.4, quand un nœud u disparaıˆt d’un cluster C(u)
+ou quitte le re´seau, les informations dont il e´tait responsable sont perdues dans ce clus-
+ter jusqu’au prochain enregistrement des nœuds. De fac¸on a` pallier cet inconve´nient,
+un nœud peut enregistrer sa position d fois dans chaque cluster, d e´tant une constante.
+Pour cela, l’espace virtuel V doit eˆtre distribue´ d fois dans chaque cluster, chaque nœud
+se voyant de´sormais attribuer d partitions inde´pendantes de V et posse´dant alors d
+diffe´rentes adresses logiques. Comme d est une constante, la taille me´moire requise
+sur les nœuds reste en O(1) puisque, en moyenne, si c est le nombre de clusters, un
+nœud devra stocker d ∗ c positions au lieu de c (c et d e´tant deux constantes). Ainsi,
+meˆme lorsqu’un nœud meurt, la position d’un nœud dont il e´tait responsable a tou-
+jours des chances d’eˆtre trouve´e dans le meˆme cluster. Cependant, cela ge´ne`re plus de
+messages puisque les requeˆtes devront de´sormais suivre d routes, une pour chaque oc-
+currence de V . Dans le pire cas, le routage des requeˆtes dans l’espace virtuel conduira
+a` une diffusion dans un cluster. Mais, comme nous l’avons e´tudie´ dans le chapitre 4,
+une telle diffusion peut s’effectuer en suivant les branches des arbres de fac¸on efficace
+et peu couˆteuse.
+5.3.6 Ope´ration de look-up : Routage dans l’espace virtuel V de la
+DHT
+Nous de´taillons ici comment les requeˆtes sont route´es dans les arbres sur la base
+d’un routage par intervalle. Ceci correspond a` la premie`re e´tape du routage indirect,
+l’ope´ration de look-up.
+Chaque nœud u a un identifiant unique Id(u). Comme dans tout sche´ma base´ sur une
+DHT, chaque nœud connaıˆt une fonction spe´cifique hash qui associe a` chaque adresse
+universelle une adresse logique de l’espace virtuel V .
+5.3. NOTRE PROPOSITION 107
+$hash : \mathbb{R} \rightarrow V$
+$Id(u) \mapsto hash(u)$
+Plusieurs nœuds peuvent avoir la meˆme valeur retourne´e par la fonction hash.
+Les informations de ces nœuds seront stocke´es sur le meˆme nœud de rendez-vous.
+Dans la suite, nous utilisons la clef suivante pour identifier un nœud x : key =
+{hash(x), id(x)}.
+Une requeˆte est route´e dans l’espace virtuel jusqu’a` atteindre un nœud v responsable
+de la clef key contenue dans la requeˆte : v est tel que key ∈ I(v). Une requeˆte peut
+eˆtre de trois types :
+– u veut enregistrer une position :
+u doit enregistrer sa propre position ou, s’il est un nœud frontie`re, il peut vouloir
+enregistrer un nœud u′ d’un autre cluster qui lui en a fait la demande. u doit donc
+trouver le nœud responsable de sa propre adresse logique hash(u) ou de celle de u′,
+hash(u′) : key = {hash(u), u} (resp. key′ = {hash(u′), u′}).
+Dans ce cas, u utilise une Registration Request (RR) 〈RR, key, C(u), flag〉 (resp.
+〈RR, key′, C(u′), flag〉).
+– u doit localiser x :
+Dans ce cas, u cherche le nœud responsable de l’adresse logique de x : hash(x).
+Il utilise une Location Request (LR) 〈LR, key = {hash(x), x} , i(u), flag〉.
+L’adresse logique de u, i(u), est ensuite utilise´e pour envoyer la requeˆte de re´ponse
+a` u.
+– u doit re´pondre a` une requeˆte LR concernant une clef dont il est responsable
+(key ∈ I(u)) :
+u a rec¸u une requeˆte de type Location Request :
+〈LR, key = {hash(x), x} , i(w), flag〉 envoyée par le nœud w et contenant
+une clef telle que key ∈ I(u). u doit répondre à w.
+Dans ce cas, il utilise une requête de type Location Reply (Reply)
+〈Reply, key = {i(w),−1} , C(x), flag〉. On remarque qu’ici la clef key n’a
+pas besoin de contenir l’adresse réelle de w.
+Pour chaque type de requeˆte, le champ flag est mis a` 1 par le nœud faisant suivre la
+requeˆte si la clef key appartient a` l’intervalle de son sous-arbre, a` 0 sinon. Comme nous
+le verrons par la suite, ce champ est utilise´ pour prendre des de´cisions de routage.
+On remarque qu’un nœud u connaıˆt de´ja` la position (ou cluster) de ses voisins, de son
+chef de cluster et des nœuds dont il est responsable. Ainsi, pour un nœud v tel que
+v ∈ {H(u)} ∪ Γ1(u) ou hash(v) ∈ I(u), u n’a pas besoin d’effectuer la procédure de
+look-up et peut directement envoyer le message à v, en suivant la procédure de routage
+dans le réseau physique, comme décrite dans la section 5.3.7.
+Du fait de la nature diffusante du me´dium radio, un nœud rec¸oit toutes les requeˆtes
+e´mises par ses voisins, meˆme celles ne le concernant pas. Les requeˆtes de look-up
+suivent uniquement les areˆtes de l’arbre de clustering, donc un nœud ne sera pas
+108 CHAPITRE 5. LOCALISATION ET ROUTAGE
+concerne´ par une requeˆte de look-up provenant d’un de ses voisins qui ne sera ni son
+pe`re ni l’un de ses fils. Les nœuds prennent la de´cision de re´-e´mettre une requeˆte de
+look-up en se basant non-seulement sur la cle´ et le champ flag contenus dans la requeˆte
+mais e´galement sur l’identite´ de leur voisin qui leur l’a transmise. Le champ flag est
+renseigné à chaque ré-émission de la requête par un nœud. Le processus de routage
+d’une requête est le même quel que soit son type (LR, RR ou Reply). Il est décrit par
+l’algorithme 1.
+Vu que le routage des requeˆtes de look-up est ope´re´ sur l’espace virtuel V , il ne
+ne´cessite pas la connaissance des adresses universelles des nœuds, il n’a besoin que
+des adresses logiques.
+Sur réception d’un message M (RR, LR ou Reply) contenant la clef key =
+{hash(x), x} provenant du nœud u (u ∈ Γ1(v)), le nœud v arrête le processus s’il
+est responsable de la clef key (donc si key ∈ I(v)) ou s’il est lui-meˆme le nœud
+cherche´ (si key = {hash(v), v}). Ce second cas arrive ne´anmoins rarement vu qu’il
+implique que l’initiateur de la requeˆte x soit dans le meˆme cluster que v (C(x) = C(v))
+et que v se trouve sur la route suivie par la requeˆte de x vers le nœud responsable de la
+clef.
+Lorsqu’une requête de type RR 〈RR, key = {hash(u), u} , C(u), flag〉 atteint sa des-
+tination v, v met à jour la position du nœud u dans sa table. Lorsqu’une requête
+de type Reply 〈Reply, key = {i(u),−1} , C(x), flag〉 arrive à sa destination u, u
+est alors capable d’entamer la seconde étape du routage indirect. Enfin, lorsqu’une
+requête de type LR 〈LR, key = {hash(x), x} , i(w), flag〉 atteint sa destination v
+(en charge de hash(x)), v répond à l’initiateur de la requête par une requête Reply :
+〈Reply, {i(w),−1} , C(x), flag〉.
+Si key ≠ {hash(v), v}, le nœud v ré-émet M dans les trois cas suivants :
+– Si u = P(v) et key ∈ Itree(sT (v)) (M a été transmis à v par son père et le sous-
+arbre de v contient la clé de la requête). Voir figure 5.4(a).
+– Si u ∈ Ch(v) (M a été transmis à v par un de ses fils u), v ré-émet M si :
+– Si key ∉ Itree(sT (v)) (le sous-arbre de v n’est pas responsable de la clef du
+message), le message doit poursuivre son chemin en remontant dans l’arbre vers
+la racine. Voir figure 5.4(b).
+– Si key ∈ Itree(sT (v)) et key ∉ Itree(sT (u)) (flag = 0) (le sous-arbre de v
+contient la clef mais pas celui de u), v doit ré-émettre M afin que le message
+redescende sur une autre branche du sous-arbre de v. Voir figure 5.4(c).
+La requête est ignorée dans tous les autres cas, c’est-à-dire :
+– Si u ∉ P(v) ∪ Ch(v) (la requête arrive par un lien n’étant pas dans l’arbre). Voir
+figure 5.5(a).
+– Si u ∈ Ch(v) et key ∈ Itree(sT (u)) (flag = 1) (le message parvient à v par un de
+ses fils dont le sous-arbre est responsable de la clef). Grâce au champ flag mis à 1,
+v sait que le sous-arbre de l’émetteur est en charge de la clef et donc ne s’en occupe
+pas. La requête redescend le sous-arbre de v. Voir figure 5.5(b).
+– Si u = P(v) et key ∉ Itree(sT (v)) (v reçoit M depuis son père et son sous-arbre
+n’est pas en charge de la clef). v n’est pas concerné par la requête, il l’ignore. Un de
+ses frères s’en chargera. Voir figure 5.5(c).
+5.3. NOTRE PROPOSITION 109
+a  I(a) = [0, 8[ a  I(a) = [0, 8[
+q = <6, a, 1>
+q = <1,  e,  0 >
+b  I(b) = [1, 3[ d  I(d) = [3, 8[ b  I(b) = [1, 3[ d  I(d) = [3, 8[
+c  I(c) = [2, 3[ e  I(e) = [5, 8[ f  I(f) = [4, 5[ c  I(c) = [2, 3[ e  I(e) = [5, 8[ f  I(f) = [4, 5[
+g  I(g) = [6, 7[ g  I(g) = [6, 7[
+h  I(h) = [7, 8[ h  I(h) = [7, 8[
+(a) Cas 1 : le message descend dans l’arbre. a cherche le nœud responsable de la clef 6.
+(b) Cas 2 : le message remonte. e cherche le nœud en charge de la clef 1.
+a  I(a) = [0, 8[
+b  I(b) = [1, 3[ d  I(d) = [3, 8[ q = <4, e,  0>
+c  I(c) = [2, 3[ e  I(e) = [5, 8[ f  I(f) = [4, 5[
+g  I(g) = [6, 7[
+h  I(h) = [7, 8[
+(c) Cas 3 : le message remonte dans une
+branche pour re-descendre dans une autre. e
+cherche le nœud en charge de la clef 4.
+FIG. 5.4 – Diffe´rents cas de figures ou` une requeˆte rec¸ue par d est re´-e´mise.
+110 CHAPITRE 5. LOCALISATION ET ROUTAGE
+a  I(a) = [0, 8[ a  I(a) = [0, 8[
+q = <key, b, flag>
+q = <7,  e,  1 >
+b  I(b) = [1, 3[ d  I(d) = [3, 8[ b  I(b) = [1, 3[ d  I(d) = [3, 8[
+c  I(c) = [2, 3[ e  I(e) = [5, 8[ f  I(f) = [4, 5[ c  I(c) = [2, 3[ e  I(e) = [5, 8[ f  I(f) = [4, 5[
+g  I(g) = [6, 7[ g  I(g) = [6, 7[
+h  I(h) = [7, 8[ h  I(h) = [7, 8[
+(a) Cas 1 : le message ne provient pas d’une branche de l’arbre.
+(b) Cas 2 : e cherche le nœud en charge de la clef 7. Le message monte et redescend les
+branches du sous-arbre de e en étant entendu
+par d qui ignore la requête.
+a  I(a) = [0, 8[
+q = <2, a, 1>
+b  I(b) = [1, 3[ d  I(d) = [3, 8[
+c  I(c) = [2, 3[ e  I(e) = [5, 8[ f  I(f) = [4, 5[
+g  I(g) = [6, 7[
+h  I(h) = [7, 8[
+(c) Cas 3 : a cherche le nœud en charge de
+2. Cette clé n’est pas dans le sous-arbre du nœud d.
+FIG. 5.5 – Diffe´rents cas de figures ou` un message est entendu par le nœud d et ignore´. Les
+fle`ches pointille´es repre´sentent un chemin possible suivi par la requeˆte dans ces cas. Les areˆtes
+pointille´es repre´sentent les liens du graphe G non contenus dans l’arbre T .
+5.3. NOTRE PROPOSITION 111
+Algorithm 1 Routage dans l’espace virtuel
+Pour tout nœud u, sur re´ception d’une requeˆte 〈Type, key = {hash(x), x} , X, flag〉,
+X de´pendant du type de requeˆte, provenant d’un nœud v ∈ Γ1(u) et initie´e par le
+nœud y :
+if (key ∈ u ∪ I(u)) then
+⊲ u est responsable de la clef. La requeˆte a atteint sa destination.
+if (Type = LR) then
+Re´pond en envoyant 〈Reply, {X = i(y),−1} , C(x), flag〉. Exit
+end
+if (Type = RR) then Enregistre la position de x. Exit end
+if (Type = Reply) then
+Route vers le cluster destination X. Exit
+end
+end
+if (v = P(u)) then
+⊲ Le message descend les branches de l’arbre.
+if (key ∈ Itree(sT (u))) then
+⊲ ∃w ∈ sT (u) tel que key ∈ I(w). cf. figure 5.4(a).
+Met le champ flag a` 1.
+Re´-e´met.
+else
+Ignore.
+⊲ cf. figure 5.5(c).
+end
+else
+if (v ∈ Ch(u)) then
+⊲ La requeˆte remonte les branches de l’arbre depuis un fils de u.
+if (key ∉ Itree(sT (u))) then
+Met le champ flag a` 0.
+Re´-e´met.
+⊲ cf. figure 5.4(b).
+else
+⊲ ∃w ∈ sT (u) \ {u, v} tel que key ∈ I(w).
+if (flag = 0) then
+Met le champ flag a` 1.
+Re´-e´met.
+⊲ key ∉ Itree(sT (v)) mais puisque key ∈ Itree(sT (u)), u doit transmettre
+la requête à ses autres fils. Celle-ci redescend l’arbre par une autre branche de u.
+Cf. figure 5.4(c).
+else
+⊲ La requête transite par v avant de redescendre. Cf. figure 5.5(b).
+Ignore.
+end
+end
+else Ignore.
+⊲ Cf. figure 5.5(a).
+end
+end
+112 CHAPITRE 5. LOCALISATION ET ROUTAGE
+5.3.7 Routage sur le re´seau physique
+Dans cette section, nous explicitons la seconde phase du routage indirect : le routage
+dans l’espace physique. Comme nous l’avons de´ja` mentionne´, nous proposons une
+approche hie´rarchique base´e sur la structure de clusters dans laquelle nous appliquons
+un protocole pro-actif entre les clusters (comme par exemple OLSR [25]) et re´actif
+a` l’inte´rieur des clusters (comme par exemple DSR [43] ou AODV [62]). Comme le
+nombre de clusters est constant quand la densite´ des nœuds augmente, le nombre de
+nœuds par cluster augmente aussi (O(n) nœuds par cluster). Comme le nombre de
+clusters est constant, il en est de meˆme pour le nombre de routes entre ces clusters et
+chaque cluster a O(1) routes a` maintenir vers les autres clusters. Bien que le nombre
+de nœuds augmente, l’excentricite´ moyenne des nœuds dans un cluster reste faible et
+constante (entre 3 et 4 sauts en moyenne). Ainsi, une route re´active dans un cluster peut
+eˆtre trouve´e a` la demande sans trop de latence et avec un faible nombre de sauts.
+Un routage pro-actif entre clusters signifie que chaque cluster ou nœud maintient en
+permanence la liste des clusters a` traverser pour aller d’un cluster A vers un cluster B.
+Il reste maintenant a` de´finir qui, dans un cluster maintient ces routes pro-actives vers les
+autres clusters. L’approche la plus commune´ment admise est la suivante. Si tre`s peu de
+messages sont route´s vers les autres clusters, seul le chef de cluster ou quelques nœuds
+peuvent me´moriser ces routes et les fournir sur demande aux autres nœuds du cluster.
+Si au contraire, cela arrive plus fre´quemment, la table de routage entre clusters peut
+eˆtre distribue´e a` tous les nœuds en appliquant par exemple l’algorithme de diffusion
+efficace dans un cluster introduit en section 4.4.
+Supposons que le nœud u cherche a` joindre le nœud v. Si v est le chef de cluster de u
+ou un de ses voisins (v ∈ Γ1(u) ∪ {H(u)}), u sait de´ja` comment joindre v et n’a donc
+pas besoin de faire appel a` la fonction de look-up. Dans le cas contraire, u doit d’abord
+localiser v (connaıˆtre C(v)) avant de pouvoir ensuite lui envoyer un message suivant
+le processus de routage illustre´ sur la figure 5.6. Si C(v) = C(u), alors u initialise un
+routage de type re´actif dans son cluster pour joindre v. Sinon, graˆce au routage pro-actif
+entre clusters, u connaıˆt la liste des clusters a` traverser pour atteindre C(v). Soit C(w)
+le premier cluster a` traverser. u initialise un routage re´actif vers un nœud x ∈ C(u) qui
+est un nœud frontière avec C(w) : x tel que x ∈ C(u) et ∃y ∈ Γ1(x) ∩ C(w).
+x fait alors suivre le message de u a` l’un de ses voisins y se trouvant dans C(w). y
+re´ite`re alors le meˆme processus de routage, et ainsi de suite, jusqu’a` joindre le cluster
+de la destination C(v).
+Ce processus de routage est donne´ dans l’algorithme 2. Nous notons
+Next Hop(cluster1, cluster2) la fonction qui retourne le prochain cluster a`
+traverser pour atteindre le cluster2 depuis le cluster1. Cette fonction illustre le
+routage pro-actif entre clusters et est connue par tous les nœuds.
+5.3. NOTRE PROPOSITION 113
+Cluster B
+4
+Cluster C
+Cluster A 2 Y 3 Z T 5X V
+1
+U
+FIG. 5.6 – u souhaite joindre le nœud v. Graˆce a` l’ope´ration de look-up, il sait que
+C(v) = C. Il connaıˆt le prochain cluster a` traverser pour atteindre C : le cluster B. Il
+joint le nœud x, voisin de B avec un protocole re´actif (fle`che 1). x transmet le message
+a` son voisin y du cluster B (fle`che 2). y sait que les clusters B et C sont voisins,
+il transmet le message a` un nœud z de son cluster, voisin du cluster C (fle`che 3). z
+transmet a` son voisin t dans C (fle`che 4) qui joint finalement v graˆce a` un routage
+re´actif dans son cluster (fle`che 5).
+Algorithm 2 Routage hie´rarchique
+Pour un message M envoye´ par le nœud x ∈ C(x) au nœud y ∈ C(y)
+Ccurrent = C(x)
+Cnext = C(x)
+while (Cnext ≠ C(y)) do
+Cnext = Next Hop(Ccurrent, C(y))
+Envoie M avec un routage re´actif vers le nœud u ∈ Ccurrent tel que ∃v ∈ Γ1(u) ∩
+Cnext.
+u envoie M a` son voisin v.
+Ccurrent = Cnext
+end
+⊲ Le message a atteint le cluster destination.
+Envoie M avec un routage re´actif vers le nœud destination y.
+end
+Enregistrer la position d’un nœud . Si le nœud u souhaite seulement enregistrer sa
+position dans un autre cluster que le sien, il utilise le meˆme sche´ma. Par exemple,
+si u souhaite s’enregistrer dans C, il exe´cute l’algorithme 2 (sans avoir a` effectuer
+l’ope´ration de look-up vu qu’il connaıˆt de´ja` le nom des clusters existants ainsi que la
+liste des clusters a` traverser pour les joindre) jusqu’a` atteindre un nœud dans C, quel
+qu’il soit (le nœud t dans notre exemple). t envoie alors une Registration Request :
+〈RR, key = {hash(u), u} , A, flag〉 dans C. On remarque que, comme la requête
+passe par le nœud y dans le cluster B, y peut faire de même et enregistrer u dans B
+en même temps.
+114 CHAPITRE 5. LOCALISATION ET ROUTAGE
+5.4 Simulations
+Comme nous l’avons de´ja` mentionne´, il n’a e´te´ propose´, a` notre connaissance, qu’un
+autre protocole de routage hie´rarchique qui propose une approche re´active a` l’inte´rieur
+des clusters et pro-active entre les clusters : le protocole SAFARI [69]. Dans cette
+section, nous e´valuons par simulation notre algorithme de localisation/routage sur notre
+structure de clusters en la comparant aux performances de SAFARI.
+5.4.1 SAFARI
+SAFARI propose une organisation hie´rarchique de l niveaux, c.a`.d que les clusters
+(appele´s cellules dans SAFARI) sont re´cursivement re-groupe´s en clusters de niveaux
+supe´rieurs et ainsi de suite. Les simples nœuds sont conside´re´s comme des clus-
+ters/cellules de niveau 0. Le nombre de niveaux s’e´tablit automatiquement en fonction
+de la taille et de la densite´ du re´seau.
+Le rayon des cellules de SAFARI est de´fini a priori. Le rayon D1 des cellules de ni-
+veau 1 (e´quivalentes aux clusters de notre algorithme, e´galement appele´es cellules fon-
+damentales) est fixe´ et les rayons Di des niveaux supe´rieurs sont de´finis re´cursivement
+a` partir de D1. La hie´rarchie de cellules construite par SAFARI se base sur une
+auto-se´lection des nœuds en tant que drums (cluster-heads). Un drum de niveau i est
+e´galement un drum de tout niveau infe´rieur j tel que 0 ≤ j ≤ i. Un drum de niveau i
+de´cide d’augmenter ou de de´cre´menter son niveau en fonction du nombre de drums de
+niveaux i+ 1 et i se trouvant a` une certaine distance de lui. Si un drum de niveau i n’a
+aucun drum de niveau i + 1 parmi ses voisins a` moins de Di sauts, il incre´mente son
+niveau et s’auto-de´clare drum de niveau i+ 1. Si deux drums de niveau i sont distants
+de moins de Di sauts, seul le drum de plus grand identifiant reste drum de niveau i,
+l’autre de´cre´mente son niveau et devient drum de niveau i− 1.
+Cette hiérarchie attribue à chaque nœud un ancêtre (chef) unique à chaque niveau. À
+partir de cet algorithme de clustering hiérarchique, chaque nœud se voit attribuer
+une adresse/coordonne´e logique (qui sera son adresse dans l’espace de la DHT). La
+coordonne´e d’un nœud de niveau i est la concate´nation de la coordonne´e de son drum
+de niveau i+ 1 et d’un nombre ge´ne´re´ ale´atoirement.
+Soient COORD(di) la coordonne´e d’un drum di de niveau i, PARENT (di) le pe`re
+de di (le drum de niveau i+ 1 de di) et Rand un nombre ale´atoire. La coordonne´e de
+di est comme suit :
+$COORD(d_i) = \begin{cases} COORD(PARENT(d_0)) & \text{pour } i = 0 \\ COORD(PARENT(d_i)).Rand & \text{pour } 0 < i \end{cases}$
+Les drums de niveau 0 (les simples nœuds) sont des feuilles dans cet arbre de coor-
+donne´es. Tous les nœuds d’une meˆme cellule fondamentale ont la meˆme coordonne´e
+logique.
+Chaque drum de niveau i envoie un paquet appele´ beacon toutes les Ti unite´s de
+temps, Ti de´pendant du niveau i. Plus le niveau hie´rarchique est e´leve´, plus la pe´riode
+5.4. SIMULATIONS 115
+d’e´mission des beacons correspondants est grande. Un beacon de niveau i envoye´ par
+le drum di est transmis a` tous les nœuds de la cellule de di ainsi qu’a` tous les nœuds
+se trouvant dans une cellule de niveau i dont le drum de niveau i + 1 est le pe`re de
+di. Par exemple, sur la Figure 5.4.3, les beacons de niveau 1 envoye´s par le drum de
+niveau 1 de la cellule F seront envoye´s a` tous les nœuds des cellules F et G, puisque
+ces deux cellules appartiennent à la même cellule de niveau 2. Chaque nœud stocke
+tous les beacons qu’il relaie dans une table appelée Drum Ad Hoc Routing Table
+(DART) en leur associant la date de réception et le nœud par lequel ils ont été reçus.
+Les coordonne´es des nœuds forment l’espace d’adressage de la DHT de SAFARI.
+La fonction de hachage retourne k diffe´rentes coordonne´es de points de rendez-vous
+pour chaque niveau i. Contrairement a` notre heuristique ou` les points de rendez-vous
+se trouvent dans le meˆme cluster que le demandeur, les points de rendez-vous dans
+SAFARI sont re´partis sur l’ensemble du re´seau. Le look-up se base sur l’ide´e qu’en
+ge´ne´ral, les nœuds communiquent plus avec les entite´s proches d’eux. Lorsqu’un nœud
+x veut s’enregistrer, il hache son identifiant et obtient k coordonne´es pour chaque ni-
+veau i (0 ≤ i ≤ l) par la DHT. x va s’inscrire k fois dans chaque niveau. Pour chacune
+de ces coordonne´es c retourne´e par la DHT, il va s’enregistrer aupre`s du nœud qu’il
+trouve qui a la coordonne´e la plus proche possible de la coordonne´e c. Pour cela, il
+envoie sa requeˆte d’enregistrement au nœud u se trouvant dans sa DART et dont la co-
+ordonne´e est la plus proche de la coordonne´e c. u fait de meˆme et transmet la requeˆte
+de u au nœud de sa propre DART dont la coordonne´e est la plus proche de c et ainsi de
+suite jusqu’a` atteindre un nœud d’une cellule fondamentale (tous les nœuds de la meˆme
+cellule fondamentale ont la meˆme coordonne´e) qui n’a aucune entre´e dans sa DART
+avec une coordonnée plus proche de c qu’il ne l’est lui-même. Ce nœud³ devient le
+nœud auprès duquel le nœud u enregistre sa position. Lorsqu’un nœud x veut récupérer
+la coordonne´e d’un nœud y, il va d’abord chercher dans les cellules de niveau 1 appar-
+tenant a` la meˆme cellule de niveau 2 que lui. S’il ne trouve pas, il cherchera au niveau
+supe´rieur et ainsi de suite : il cherche dans toutes les cellules de niveau i appartenant a`
+la meˆme cellule de niveau i+ 1 que lui, jusqu’a` atteindre l’ensemble du re´seau. Lors-
+qu’un nœud x veut récupérer les coordonnées d’un nœud y, il hache l’identifiant de
+y et envoie sa requeˆte au nœud u se trouvant dans sa DART et dont la coordonne´e est
+la plus proche de la coordonne´e retourne´e par la DHT pour le niveau conside´re´, et ainsi
+de suite, jusqu’a` atteindre un nœud r. Si r connaıˆt les coordonne´es de y, il les retourne
+a` x qui pourra alors joindre y de la meˆme fac¸on qu’il a joint r. Si r ne de´tient pas la
+coordonne´e de y, x re´-ite`re sa requeˆte au niveau supe´rieur. x peut donc envoyer jusqu’a`
+l requeˆtes de look-up pour localiser y. Nous verrons par la suite que meˆme au bout de l
+fois, le look-up de SAFARI peut échouer. Dans nos simulations, k est fixé à 3, comme
+le suggèrent les auteurs de SAFARI.
+Nous nous sommes inte´resse´s dans un premier temps a` la formation des clusters de
+chacun des deux algorithmes, puis, nous avons e´value´ les performances du look-up et
+du routage de chacun des protocoles.
+3Tous les nœuds d’une cellule fondamentale ayant la meˆme coordonne´e, plusieurs nœuds peuvent poten-
+tiellement stocker la position de u mais SAFARI n’explicite pas s’il s’agit du drum ou d’un nœud particulier
+de la cellule
+116 CHAPITRE 5. LOCALISATION ET ROUTAGE
+5.4.2 Comparaison des structures
+Comme notre heuristique construit des clusters de rayon compris entre 3 et 4 sauts
+(chapitre 3), nous avons fixe´ D1 a` 3 dans SAFARI, de fac¸on a` pouvoir comparer les
+cellules fondamentales de SAFARI aux clusters de notre algorithme. C’est d’ailleurs la
+valeur choisie par les auteurs de SAFARI dans leurs simulations.
+La diffe´rence principale entre les deux heuristiques est que SAFARI construit l ni-
+veaux hie´rarchiques de cellules alors que notre algorithme ne forme qu’un seul niveau
+de clusters. Le nombre de niveaux établi par SAFARI s’adapte automatiquement en
+fonction du diamètre du réseau. La table 5.1 donne le nombre de niveaux construits par
+SAFARI sur diffe´rentes topologies. Nous verrons par la suite que le nombre de niveaux
+impacte les performances du look-up de SAFARI.
+Topologie Nombre de niveaux
+10× 10 Grille a` 4 voisins entre 3 et 4
+15× 15 Grille a` 4 voisins 4
+Chaıˆne de 50 nœuds entre 4 et 5
+Chaıˆne de 75 nœuds 5
+Chaıˆne de 100 nœuds 6
+Topologie Poisson λ = 500, R ≤ .1 entre 3 et 4
+Topologie Poisson λ = 500, R < .1 entre 2 et 3
+TAB. 5.1 – Nombre de niveaux de cellules construits par SAFARI en fonction de la
+topologie sous-jacente.
+Bien que le diame`tre du re´seau intervienne sur le nombre de niveaux hie´rarchiques, seul
+le degre´ des nœuds influence les caracte´ristiques des clusters, tout comme dans notre
+algorithme, les heuristiques e´tant locales et distribue´es. Les re´sultats de la table 5.2
+montrent que les clusters construits par les deux heuristiques ont des caracte´ristiques
+moyennes e´quivalentes (nous ne conside´rons que les clusters de niveau 1 pour SA-
+FARI). Cependant, comme le montre l’e´cart type du nombre de nœuds par cluster, les
+clusters de SAFARI sont moins homoge`nes que ceux de notre heuristique.
+Comme nous l’avons e´tudie´ dans le chapitre 3, lorsqu’un nœud inte`gre le re´seau or-
+ganise´ avec notre algorithme, il ve´rifie son voisinage, calcule sa densite´ et se choisit
+un père. L’algorithme se stabilise rapidement, en un temps proportionnel à la hauteur de
+l’arbre. Dans SAFARI, lors de la phase d’initialisation, les nœuds attendent un temps
+ale´atoire avant de prendre la de´cision d’e´ventuellement augmenter leur niveau. Cette
+de´cision est base´e sur les informations contenues dans la DART de chaque nœud. Le
+temps de stabilisation de SAFARI est donc lie´ a` la pe´riode initiale d’attente ale´atoire et
+a` la fre´quence Ti d’e´mission des beacons (donc a` T1 pour les cellules fondamentales).
+Dans nos simulations, les nœuds tirent un temps ale´atoire uniforme´ment entre 0 et 5
+unite´s de temps et T1 = 2 unite´s de temps, comme le sugge`rent les auteurs de SAFARI.
+De fac¸on a` comparer e´quitablement les deux heuristiques, nous supposons que les bea-
+cons de niveau 1 sont e´change´s a` la meˆme fre´quence que les paquets Hello dans notre
+5.4. SIMULATIONS 117
+heuristique (T1).
+λ 500 600 700
+Densite´ SAFARI Densite´ SAFARI Densite´ SAFARI
+Nb clusters 11.70 16.2 10.08 12.6 8.06 11.4
+Taille clusters 39.91 32.58 45.64 39.76 54.43 43.57
+σ(taille) 18.66 13.88 17.88 17.83 16.59 20.28
+Diame`tre 4.99 4.67 5.52 4.62 5.50 4.76
+CH/drum excen. 3.01 2.69 3.09 2.67 3.37 2.80
+Temps stab. 5.27 107.67 5.34 113.41 5.33 91.95
+σ(Temps stab) 0.63 132.41 0.74 135.56 0.85 123.69
+λ 800 900 1000
+Densite´ SAFARI Densite´ SAFARI Densite´ SAFARI
+Nb clusters 7.03 9.10 6.15 8.10 5.57 7.40
+Taille clusters 61.23 54.80 70.41 60.58 73.72 66.21
+σ(taille) 15.59 23.20 15.29 25.01 14.27 26.61
+Diame`tre 5.65 4.83 6.34 4.77 6.1 4.73
+CH/drum excen. 3.17 2.77 3.19 2.72 3.23 2.82
+Temps stab. 5.34 90.55 5.43 60.61 5.51 61.97
+σ(Temps stab) 0.99 111.18 1.21 115.58 1.44 118.69
+TAB. 5.2 – Caracte´ristiques des clusters pour chaque heuristique pour R = .1.
+Le temps de stabilisation des algorithmes est pre´sente´ dans la table 5.2. Parfois, nous
+avons pu remarquer qu’au bout de 350 unite´s de temps (temps sugge´re´ par les au-
+teurs de SAFARI), la structure de SAFARI n’e´tait pas e´tablie. Dans ces cas, SAFARI
+ne converge pas. Nous n’avons pris en compte dans ces statistiques que les cas ou`
+SAFARI converge. On remarque que l’intensite´ des nœuds n’influence pas le temps
+de stabilisation des deux protocoles. SAFARI est beaucoup plus long a` stabiliser que
+notre algorithme et son temps de stabilisation est loin d’eˆtre re´gulier comme le montre
+l’e´cart type σ. Certaines instances du protocole convergent tre`s rapidement alors que
+d’autres n’ont toujours pas converge´ apre`s un temps de 350 unite´s de temps. En effet,
+un nœud peut osciller entre diffe´rents e´tats en fonction des valeurs ale´atoires choisies.
+La figure 5.7 donne un exemple dans lequel SAFARI ne converge pas. Dans la fi-
+gure 5.7(b), le re´seau est en phase d’initialisation. La pe´riode d’attente ale´atoire du
+nœud 3 est la premie`re a` expirer : le nœud 3 devient le premier drum de niveau 1. Puis,
+les pe´riodes d’attente de plusieurs nœuds expirent. Ceux parmi eux qui entendent un
+drum de niveau 1 a` moins de D1 = 3 sauts s’attachent a` lui. Les autres s’auto-e´lisent
+drum de niveau 1. Dans notre exemple, la pe´riode du nœud 1 a expire´ avant celles de 4,
+12 et 25 et celle de 6 a expire´ avant celles des nœuds 23, 8, 26 et 16. Si au contraire, la
+pe´riode du nœud 23 avait expire´ avant celle du nœud 6, par exemple, 23 aurait cre´e´ son
+propre cluster et 6 se serait ensuite rattache´ a` 23. D’un autre coˆte´, on peut remarquer
+que si la pe´riode du nœud 19 expire avant celle du nœud 1, 19 s’attache dans un premier
+temps au drum 3 avant de s’attacher a` 1 lorsque celui-ci se de´clare drum. Ainsi, sur la
+118 CHAPITRE 5. LOCALISATION ET ROUTAGE
+figure 5.7(c), les nœuds 6 et 1 deviennent des drums de niveau 1, les nœuds 23, 8, 26
+et 16 s’attachent au nœud 6, les nœuds 21, 19, 12, 4 et 25 s’attachent au nœud 1 et les nœuds
+0, 7 et 9 s’attachent à 3. Ceci montre l’importance du temps d’attente aléatoire dans la
+formation des clusters de SAFARI. Comme il n’existe aucun drum de niveau 2 a` moins
+de D2 = 6 sauts du nœud 3, celui-ci devient ensuite un drum de niveau 2. Les cellules
+de niveau 1 des drums 1 et 6 s’attachent a` la cellule de niveau 2 de 3 (figure 5.7(d)).
+Puis, la pe´riode d’attente du nœud 17 expire. Comme celui-ci n’entend aucun drum de
+niveau 1 a` moins de D1 sauts, il devient un drum de niveau 1. Lorsque les autres nœuds
+se re´veillent, ils s’attachent a` lui. Comme le drum 17 de niveau 1 n’entend aucun drum
+de niveau 2 dans son voisinage a` D2 sauts, il devient un drum de niveau 2. Sa cellule de
+niveau 2 ne se compose que d’une seule cellule de niveau 1. De la meˆme fac¸on, comme
+le drum 3 de niveau 2 n’entend aucun drum de niveau 3 dans son voisinage a` D3 sauts,
+il devient un drum de niveau 3. C’est ce que l’on peut voir sur la figure 5.7(f). Dans
+SAFARI, si un drum de niveau i n’entend pas au moins deux drums de niveaux i− 1,
+il baisse son niveau. Ainsi, dans notre exemple, comme le drum 3 de niveau 3 n’entend
+qu’un seul drum de niveau 2 (le drum 17), il re-devient un drum de niveau 2. De meˆme,
+comme le drum 17 de niveau 2 n’entend aucun drum de niveau 1, il re-devient drum de
+niveau 1. C’est a` dire que nous revenons a` la structure de la figure 5.7(e). La structure
+va ensuite e´voluer pour re-devenir celle illustre´e par la figure 5.7(f) et ainsi de suite.
+Un cycle apparaıˆt et SAFARI ne converge jamais.
+5.4.3 Look-up et routage
+Cette section analyse les performances du look-up effectue´ dans chaque algorithme
+ainsi que le routage qui s’ensuit.
+Dans notre algorithme, les requeˆtes de look-up sont route´es a` l’inte´rieur d’un cluster
+en effectuant un routage par intervalle sur l’espace virtuel de la DHT (Section 5.3). Les
+diame`tres des clusters e´tant relativement petits, la requeˆte ne parcourra qu’un nombre
+de sauts borne´ pour atteindre le nœud rendez-vous. Ceci n’est pas le cas dans SAFARI
+ou` les nœuds rendez-vous se trouvent dans la plupart des cas dans d’autres clusters.
+De plus, comme nous l’avons de´ja` e´voque´, dans un cas de re´seau statique, avec une
+couche MAC ide´ale, tous les look-ups de notre algorithme re´ussiront, ce qui n’est pas
+le cas dans SAFARI. Et meˆme lorsqu’un look-up de SAFARI re´ussit, il peut avoir
+utilise´ plusieurs requeˆtes alors qu’une seule suffit a` notre algorithme. Cela s’explique
+par le phe´nome`ne suivant. Les drums de niveau i de SAFARI envoient leurs beacons
+aux nœuds des cellules de niveau i ayant le meˆme drum i+ 1 qu’eux. Donc, dans une
+hie´rarchie de 3 niveaux ou plus, tous les nœuds ne recevront pas les beacons de tous
+les drums. Si on prend l’exemple de la figure 5.8, le drum de la cellule fondamentale
+B envoie ses beacons aux nœuds des cellules A, B et C mais les nœuds des cellules D
+ou E ne les rec¸oivent pas.
+Quand le nœud d cherche a` s’enregistrer, il hache son identifiant et regarde dans sa
+table DART quel nœud v a la coordonne´e la plus proche de la valeur retourne´e par la
+DHT. En effectuant le look-up sur son propre identifiant, d finit par s’enregistrer aupre`s
+d’un nœud h. Cependant, il faut noter que h est le nœud trouve´ a` partir de la DART
+5.4. SIMULATIONS 119
+21 1
+0
+19
+25 11
+drum de niveau 0 (simple noeud) 3 9
+4
+22
+7 24
+5 12 15 20
+drum de niveau 1 2 18cellule fondamentale 14 8 26
+23 17
+drum de niveau 2 cellule de niveau 2 6 16 10 13
+drum de niveau 3 cellule de niveau 3
+(a) Le´gende (b)
+21 1 21 1
+0
+19 11 0 19 11
+3 9 4
+25
+9 4 2522 3
+7 22
+5 12 15
+24 7
+20 5 12 15
+24
+20
+14 2 26 188 14 2 8 26
+18
+23 17 23 17
+6 16 10 13 6 16 10 13
+(c)
+(d)
+21 1
+21 1
+0
+19
+25 11 0
+3 9 4 19 1122 9 4 253
+7 24 22
+5 12 15 7 2420 5 12 15 20
+14 2 8 26
+18
+14 2 18
+23 17 8 2623 17
+6 16 10 13 6 16 10 13
+(e) (f)
+FIG. 5.7 – Exemple ou` SAFARI oscille et ne converge jamais.
+120 CHAPITRE 5. LOCALISATION ET ROUTAGE
+de d. h n’a pas toujours exactement la meˆme coordonne´e que celle retourne´e par la
+DHT, il est juste un nœud dont la coordonne´e est proche. Le proble`me vient alors du
+fait que les nœuds posse`dent une table DART diffe´rente les uns des autres lorsque le
+cluster est organise´ en plus de 2 niveaux hie´rarchiques. En effet, quand un nœud s veut
+envoyer un message a` d, il hache l’identifiant de d et ainsi obtient des coordonne´es. Il
+va alors envoyer sa requeˆte aux nœuds de sa DART dont les coordonne´es sont les plus
+proches de celles retourne´es par la DHT. Il va atteindre un nœud n. Or d ne s’est pas
+enregistré auprès de n car n ne figure pas dans la DART de d et n’est pas atteignable
+depuis la DART de d. De même, les nœuds h auprès desquels d s’est enregistré ne
+sont pas toujours contenus dans la table DART de s et dans ces cas-là, le look-up ne
+peut réussir. Ainsi, plus le nombre de niveaux hiérarchiques est élevé, plus le taux de
+re´ussite des look-ups de SAFARI est faible.
+level−0 drum (regular node)
+1
+level−1 drum
+level−2 drum d
+level−3 drum C h
+fundamental cell B
+level−2 cell
+level−3 cell F A D
+G 2
+n
+E s
+FIG. 5.8 – Exemple de clusters de SAFARI.
+La table 5.3 pre´sente diffe´rentes valeurs que nous avons releve´es lors de nos simu-
+lations de look-up et routage de chacun des deux algorithmes. La` encore, les valeurs
+concernant SAFARI ne sont prises en compte que lorsque l’algorithme converge.
+Le champ ”Nb de requeˆtes” indique le nombre de requeˆtes qu’un nœud u doit envoyer
+en moyenne avant de joindre un nœud qui de´tient l’information recherche´e (avant de
+re´ussir le look-up). Ce champ est toujours e´gal a` 1 pour notre heuristique puisqu’une
+seule requeˆte est ne´cessaire.
+Le champ ”Longueur du Look-up” donne le nombre de sauts que parcourt une requeˆte
+de look-up en moyenne dans chaque algorithme. Les nœuds de rendez-vous de notre
+algorithme e´tant toujours dans le meˆme cluster que la source de la requeˆte et ceux de
+SAFARI e´tant distribue´s sur l’ensemble du re´seau, les routes sont e´videmment plus
+courtes dans notre heuristique. A` cela s’ajoute que SAFARI peut lancer une requeˆte de
+plus en plus loin en augmentant le niveau apre`s un e´chec de requeˆte de look-up. Ces
+valeurs sont influence´es par la densite´ locale du re´seau (degre´ des nœuds) puisque les
+5.4. SIMULATIONS 121
+λ 500 600 700
+Densite´ SAFARI Densite´ SAFARI Densite´ SAFARI
+Nb de requeˆtes 1 1.71 1 1.82 1 1.78
+Taux de re´ussite 100% 95.70% 100% 92.20% 100% 90.90%
+Longueur du Look-up 3.02 14.94 3.07 12.56 3.15 10.68
+Longueur des chemins 6.31 7.28 6.67 5.87 6.37 6.17
+Longueur globale 12.39 37.16 12.81 30.99 12.67 27.53
+λ 800 900 1000
+Densite´ SAFARI Densite´ SAFARI Densite´ SAFARI
+Nb de requeˆtes 1 1.79 1 1.58 1 1.54
+Taux de re´ussite 100% 85.80% 100% 90.50% 100% 91.00%
+Longueur du Look-up 3.16 10.36 3.21 8.63 3.24 5.04
+Longueur des chemins 6.75 5.88 6.61 5.73 6.66 5.09
+Longueur globale 13.07 26.60 13.03 22.99 13.14 15.17
+TAB. 5.3 – Comparaison de notre algorithme et de SAFARI.
+caracte´ristiques des clusters en de´coulent. Cependant, ce facteur de´pend e´galement de
+l’e´talement du re´seau pour SAFARI car plus le re´seau est e´tendu, plus le nœud rendez-
+vous peut eˆtre e´loigne´.
+Le champ ”Longueur des chemins” donne le nombre de sauts a` parcourir dans la
+deuxie`me phase du routage indirect, en suivant les sche´mas de routage propose´s dans
+chacun des algorithmes. Le champ ”Longueur globale” donne le nombre moyen de
+sauts a` parcourir avant d’atteindre enfin le nœud destination. Il est e´gal a` la longueur
+des routes de la deuxie`me e´tape plus deux fois la longueur des routes du look-up car la
+requeˆte de look-up doit effectuer un aller-retour.
+On remarque que les chemins de look-up dans SAFARI sont plus longs que les chemins
+emprunte´s par les messages lors de la deuxie`me phase du routage indirect, ce qui peut
+induire une latence importante. Ce n’est pas le cas dans notre approche ou` les requeˆtes
+de look-up sont contenues dans un cluster et donc suivent un chemin dont la taille est
+borne´e par le diame`tre des clusters, lui-meˆme borne´ par une constante. (Cf. chapitre 3).
+Les longueurs des routes (suivies par les requeˆtes de look-up et par les messages de
+donne´es) de´pendent bien suˆr de la densite´ locale du re´seau comme toutes les autres
+caracte´ristiques e´tudie´es pour ces deux protocoles. Cependant, les routes emprunte´es
+dans la deuxie`me phase du routage indirect de´pendent e´galement de l’e´talement du
+re´seau. Plus le re´seau est grand, plus la distance se´parant deux nœuds du re´seau est
+grande. Dans SAFARI, il en est de meˆme pour la taille des routes suivies par les
+requeˆtes de look-up. Dans notre approche, la longueur des routes du look-up reste
+constante lorsque le re´seau s’e´tale car elle est limite´e par le diame`tre des clusters qui
+lui-meˆme reste constant. Ainsi, meˆme si pour les re´sultats de simulation obtenus, la
+longueur des routes de look-up dans notre approche repre´sente pre`s de la moitie´ de
+la taille du chemin global, elle tend a` devenir ne´gligeable devant la taille des routes
+vers le nœud destination lorsque le re´seau s’e´tale, ce qui n’est pas le cas de SAFARI
+pour lequel le ratio $\frac{\text{longueur look-up}}{\text{longueur totale}}$ reste constant avec l’étalement du réseau. Les
+122 CHAPITRE 5. LOCALISATION ET ROUTAGE
+comparaisons mene´es ici peuvent sembler avoir e´te´ mene´es sur un re´seau trop peu
+e´tendu. Cependant, le but recherche´ ici e´tait de comparer notre algorithme a` SAFARI
+et pour un re´seau plus large, SAFARI construit un plus grand nombre de niveaux et ne
+converge plus. C’est pourquoi, nous n’avons pu simuler le routage sur un re´seau plus
+e´tendu qu’avec notre me´trique. Les re´sultats donne´s dans la table 5.4 sont obtenus sur
+un re´seau ou` le degre´ moyen des nœuds (et donc l’intensite´ λ du processus de Poisson)
+est constant mais avec une taille de re´seau de plus en plus importante. Les re´sultats sont
+donne´s pour λ = 500 (δ ≈ 15.7) mais le comportement de l’algorithme est le meˆme
+quelle que soit l’intensite´ conside´re´e.
+Les re´sultats montrent qu’effectivement, bien que le re´seau grandisse, la longueur des
+routes emprunte´es par les requeˆtes de look-up reste constante et que seule la longueur
+totale des routes pour joindre le nœud destinataire augmente.
+Les routes emprunte´es lors de la deuxie`me phase du routage indirect ne sont pas op-
+timales dans la mesure ou` elles ne sont pas calcule´es sur la topologie des nœuds mais
+sur la topologie de clusters. On retrouve le même principe que dans BGP⁴ où les
+se´quences des AS (Autonomous System) ne donnent pas toujours le nombre de sauts
+optimal entre clusters. Le champ ”Étirement” donne l’écart en nombre de sauts entre
+la longueur des routes emprunte´es lors de la deuxie`me phase du routage indirect et la
+longueur des routes dans le graphe (plus courts chemins) en nombre de sauts. On re-
+marque que le facteur d’e´tirement survenant dans la seconde phase du routage indirect
+est ne´gligeable devant la longueur totale des routes. Seul l’ajout des sauts ne´cessaires
+au look-up importe.
+Nb de nœuds 500 600 700 800 900 1000
+Nb de Clusters 11.70 14.20 15.80 17.50 21.42 24.30
+Longueur du Look-up 3.02 2.97 3.07 3.05 2.99 3.07
+Longueur des chemins 6.31 6.88 7.08 8.06 8.69 9.05
+E´ tirement 0.69 0.74 0.78 0.82 0.86 0.92
+Longueur globale 12.39 12.90 13.55 13.97 14.98 15.43
+TAB. 5.4 – Proprie´te´s de notre approche de routage avec λ = 500 (degre´ moyen des
+nœuds constant δ = 15.7) lorsque le re´seau s’e´tale.
+5.5 Conclusion
+Dans ce chapitre, nous avons propose´ un protocole de routage hie´rarchique pou-
+vant s’appliquer sur notre organisation de cluster. Cette approche hiérarchique suit le
+schéma inverse de ceux communément décrits dans la littérature. En effet, nous pro-
+posons d’appliquer un protocole de routage re´actif a` l’inte´rieur des clusters et pro-actif
+entre les clusters. Une telle approche suppose un routage indirect utilisant une table de
+4www.freesoft.org/CIE/RFC/1772/
+5.5. CONCLUSION 123
+hachage distribue´e. Notre approche tire avantage des caracte´ristiques intrinse`ques du
+me´dium radio et des clusters pour a` la fois proposer un sche´ma d’e´tiquetage efficace
+des sommets des arbres de clustering pour distribuer les partitions de l’espace logique
+d’adressage de la DHT et permettre un routage global impliquant une taille me´moire
+sur les nœuds en O(1). Les requeˆtes de look-up peuvent ensuite eˆtre route´es graˆce a`
+un routage par intervalle sur cet espace. La deuxie`me phase du routage indirect se fait
+alors dans l’espace physique avec des chemins quasi-optimaux.
+Afin d’e´valuer les performances de notre algorithme, nous l’avons compare´ au
+seul autre protocole de notre connaissance qui utilise le meˆme sche´ma de routage
+hie´rarchique : SAFARI. Il s’est ave´re´ que notre approche offre de meilleures ca-
+racte´ristiques sur diffe´rents crite`res : temps de stabilisation, succe`s des look-ups, taille
+des chemins, etc. Cependant, ces re´sultats sont a` mode´rer de par le fait qu’il n’existe
+encore que tre`s peu de protocoles proposant cette approche de routage hie´rarchique.
+Dans la continuite´ de cette approche, nous souhaiterions analyser plus en profondeur
+les pe´riodes de rafraıˆchissement des enregistrements des nœuds, en fonction de leur
+mobilite´. Comme les algorithmes pre´sente´s dans cette the`se peuvent eˆtre qualifie´s de
+”quasi-locaux” et que la structure de clusters sous-jacente a pre´sente´ de bons compor-
+tements face a` la mobilite´ des nœuds, nous espe´rons qu’il en sera de meˆme pour le
+protocole de localisation/routage.
+Comme nous l’avons vu, seulement peu de propositions utilisent une approche pro-
+active entre les clusters et re´active a` l’inte´rieur des clusters. Nous avons compare´
+notre approche a` une autre qui utilisait ce meˆme mode`le. Cependant, il peut e´galement
+s’ave´rer inte´ressant d’e´tablir des comparaisons avec une approche ”classique” de la
+littérature, c.-à-d. qui propose un routage réactif entre clusters et pro-actif au sein d’un
+cluster.
+124 CHAPITRE 5. LOCALISATION ET ROUTAGE
+5.6 Publications
+1. Journaux et revues avec comite´ de lecture :
+(a) Distributed Node Location in clustered multi-hop wireless networks. Na-
+thalie Mitton et Éric Fleury. GESTS International Transaction on Computer
+Science and Engineering, Volume 21, Décembre 2005.
+2. Colloques et confe´rences internationaux avec comite´ de lecture :
+(a) Distributed Node Location in clustered multi-hop wireless networks. Na-
+thalie Mitton, E´ ric Fleury. Asian Internet Engineering Conference (AIN-
+TEC’05), 13-15 De´cembre 2005, Bangkok, Thailande.
+(b) Distributed Node Location in clustered multi-hop wireless networks. Na-
+thalie Mitton, E´ ric Fleury. LOCALITY’05, 26 Septembre 2005, Cracovie,
+Pologne.
+3. Rapports de recherche :
+(a) Distributed Node Location in clustered multi-hop wireless networks. Na-
+thalie Mitton et E´ ric Fleury. RR-5723. Octobre 2005.
+4. Se´minaires, pre´sentations, expose´s :
+(a) Localisation dans les re´seaux sans fil multi-sauts grandes e´chelles. Natha-
+lie Mitton, E´ ric Fleury. Se´minaire ACI Pair a` Pair - Arcachon - France - 5-6
+Septembre 2005.
+Chapitre 6
+Conclusion et perspectives
+6.1 Conclusion
+Mon objectif, au travers de cette the`se, a e´te´ de de´velopper une solution d’utilisation
+des re´seaux sans fil sur de larges e´chelles afin de re´pondre aux besoins naissants de
+notre socie´te´. Pour cela, il me paraissait important d’e´tudier les diffe´rentes contraintes
+de tels re´seaux avant de pouvoir proposer une solution viable et fonctionnelle, meˆme
+sur de grandes e´chelles.
+J’ai pour cela propose´ une solution distribue´e qui se de´compose en plusieurs e´tapes.
+Chacune des e´tapes re´pond a` une application de tels re´seaux tout en en conside´rant
+les contraintes. Chaque algorithme est ne´ d’une e´tude des contraintes ou des structures
+et se compose d’algorithmes distribue´s, auto-stabilisants et robustes, ne´cessitant peu
+de ressources en e´nergie, bande passante ou taille me´moire. Toutes ces e´tapes ont e´te´
+e´tudie´es analytiquement et par simulation. Chaque solution a e´te´ compare´e a` d’autres
+solutions propose´es dans la litte´rature et s’ave`re soit offrir de meilleurs re´sultats, soit
+de meilleurs compromis.
+La premie`re e´tape permet de structurer logiquement le re´seau en clusters. A partir de
+l’e´tude de la structure ainsi forme´e, plusieurs caracte´ristiques ont pu eˆtre de´gage´es. Ces
+caracte´ristiques ont alors guide´ la conception des algorithmes des e´tapes suivantes. La
+seconde e´tape a cre´e´ des liens entre ces clusters afin de pouvoir effectuer des diffusions
+ge´ne´rales d’information de fac¸on efficace. L’algorithme de diffusion en soi est simple,
+il se´lectionne un sous-ensemble de nœuds autorise´s a` relayer le message. Cette sim-
+plicite´ intrinse`que est d’autant plus riche qu’elle utilise une structure existante, sans
+en cre´er de nouvelles. L’algorithme de diffusion e´conomise ainsi des messages et des
+ressources.
+Enfin, la dernie`re e´tape permet a` deux entite´s individuelles de communiquer, quelles
+que soient leurs positions dans le re´seau. Ce processus de routage pre´sente plusieurs
+originalite´s. En effet, dans un premier temps, il conside`re une approche inverse a`
+125
+126 CHAPITRE 6. CONCLUSION ET PERSPECTIVES
+celle propose´e jusqu’a` maintenant afin de pre´server une faible taille me´moire sur les
+nœuds. Ensuite, il emprunte des solutions algorithmiques a` d’autres domaines comme
+les tables de hachage distribue´es issues du domaine du Pair a` Pair et le routage par
+intervalle issu des re´seaux filaires.
+6.2 Perspectives
+Les diffe´rents algorithmes propose´s dans chaque e´tape de ma proposition pre´sentent
+tous des caracte´ristiques qui peuvent eˆtre e´tudie´es plus en profondeur ou des points
+qui me´riteraient certaines optimisations. Par exemple, le comportement de chaque al-
+gorithme pourrait eˆtre analyse´ dans un environnement plus mobile. Un autre point im-
+portant est que toutes les analyses re´alise´es sur les diffe´rents algorithmes de ma propo-
+sition ont e´te´ conduites en supposant une couche MAC ide´ale et un mode`le ”Unit Disk
+Graph” pour de´finir le voisinage des nœuds. Conside´rer une couche MAC ide´ale per-
+met de n’e´tudier que les caracte´ristiques propres a` l’algorithme conside´re´, ce qui e´tait le
+but recherche´ dans cette the`se. Cependant, un protocole de niveau 3 est utilise´ conjoin-
+tement avec des protocoles de niveaux infe´rieurs. De meˆme, l’aire de transmission d’un
+nœud est rarement un cercle puisque la propagation des ondes de´pend du milieu et des
+obstacles que peut rencontrer le signal. Il serait donc inte´ressant d’e´valuer les diffe´rents
+algorithmes propose´s dans ce manuscrit, en conside´rant diffe´rents protocoles pour les
+couches infe´rieures et diffe´rents modes de propagation des ondes suivant les environ-
+nements, aussi bien en ce qui concerne les analyses par simulation que les analyses
+the´oriques. En effet, dans nos analyses the´oriques, nous avons e´galement conside´re´ le
+mode`le ”Unit Disk Graph” mais d’autres mode`les d’e´tude ont e´te´ propose´s comme par
+exemple dans [27] ou [9] qui conside`re le mode`le CDMA utilise´ dans 802.11. De plus,
+comme dans un environnement sans fil re´el, de nombreux parame`tres d’environnement
+entrent en jeu pour assurer ou non l’existence d’un lien, on peut e´galement conside´rer
+un mode`le ou` un lien existe avec une certaine probabilite´.
+Par ailleurs, les re´seaux sans fil couvrent une large famille de re´seaux, comme les
+re´seaux ad hoc ou les re´seaux de capteurs. Bien que posse´dant tous des caracte´ristiques
+semblables, chacun a une utilisation plus pre´cise et des proprie´te´s supple´mentaires. La
+solution d’utilisation grande e´chelle que j’ai de´crite ici est ge´ne´rique et peut s’appliquer
+a` tout type de re´seau sans fil. Cependant, il me semble que pour concevoir un re´seau
+efficace, il faut e´galement conside´rer l’application du re´seau. Ainsi, j’aimerais par la
+suite conside´rer plusieurs applications plus cible´es et un type de re´seau plus pre´cis
+comme par exemple les re´seaux de capteurs.
+En effet, les re´seaux de capteurs offrent un certain nombre de de´fis et de verrous scienti-
+fiques. Ils sont le reflet de l’e´volution a` la fois des syste`mes, des re´seaux, de leurs com-
+posants mais aussi de leur organisation et des inter-actions et communications entre
+syste`mes. Malgre´ des tailles souvent petites, ils inte`grent une forte complexite´, notam-
+ment de par l’infrastructure logicielle qui se retrouve distribue´e a` une grande e´chelle et
+qui se doit d’offrir des services d’auto-adaptabilite´.
+6.2. PERSPECTIVES 127
+Les re´seaux de capteurs sont de plus en plus de´ploye´s et offrent des perspectives nou-
+velles chaque jour. Aujourd’hui, on cherche a` de´ployer un re´seau de capteurs pour la
+surveillance des feux de forêts par exemple, afin de prévenir un incendie et d’inter-
+venir avant qu’il n’ait cause´ trop de de´gaˆts. A` moyen terme, on cherche a` inte´grer ces
+capteurs dans les structures des baˆtiments et ne les faire s’activer que si le baˆtiment
+s’e´croule afin de guider les secours. Les contraintes de base restent les meˆmes : e´nergie
+et bande passante limite´es. Cependant, avec les nouvelles applications et le de´ploiement
+de re´seaux de plus en plus grands, d’autres points sont a` conside´rer, comme la mobilite´
+des capteurs (un re´seau de capteurs peut eˆtre embarque´ dans une voiture par exemple
+ou servir a` traquer des animaux), la robustesse de la structure globale (il faut s’assurer
+que le re´seau de base soit stable avant de penser a` l’e´tendre) ou encore la se´curite´. Pour
+une meilleure optimisation, tous ces aspects se doivent d’eˆtre e´tudie´s conjointement.
+La solution que j’ai de´veloppe´e dans cette the`se reste applicable, meˆme si les capteurs
+pre´sentent des proprie´te´s supple´mentaires par rapport au mode`le ge´ne´rique des re´seaux
+sans fil. Par exemple, lorsque l’on conside`re un re´seau de capteurs, bien que la topolo-
+gie reste dynamique du fait des apparitions ou disparitions de capteurs dues a` la mort, a`
+l’endormissement ou au re´veil des entite´s, les capteurs ne se de´placent pas toujours. De
+même, les modèles de communication sont différents dans un réseau de capteurs. Deux
+capteurs n’ont ge´ne´ralement pas besoin de communiquer directement. On observe sur-
+tout des communications de la station de base vers l’ensemble des entite´s (pour une
+synchronisation par exemple) ou des entite´s vers la station de base (pour retourner une
+mesure prise par un capteur par exemple). Les algorithmes que j’ai propose´s peuvent
+eˆtre optimise´s en fonction de ces caracte´ristiques plus pre´cises.
+Les contraintes a` e´tudier, quelles qu’elles soient, doivent eˆtre conside´re´es dans toutes
+les couches de communication, qu’il s’agisse de la conception au niveau signal, liaison
+de donne´es ou routage. Tous les niveaux doivent conside´rer que les capteurs ont des
+capacite´s limite´es en e´nergie et en taille me´moire, et non pas seulement la couche
+re´seau. Tous ces de´fis rencontre´s dans de tels re´seaux ont e´te´ traite´s a` diffe´rents niveaux.
+Les diffe´rentes propositions de protocoles de niveau physique cherchent a` minimiser
+l’e´nergie de´pense´e en e´mission et en re´ception. Les protocoles de niveau MAC e´tudient
+des re`gles d’endormissement des nœuds afin de ne faire travailler qu’un sous-ensemble
+de capteurs a` la fois. Les protocoles de routage cherchent a` minimiser les inondations
+de de´couverte et maintenance des routes et a` limiter le nombre de nœuds participant a`
+ces diffusions. Cependant, toutes ces recherches d’optimisation restent inde´pendantes
+les unes des autres et ne sont pas toujours compatibles. Par exemple, les protocoles de
+routage peuvent avoir de´signe´ certains capteurs pour diffuser un message que la couche
+MAC aura endormis. Dans ce cas, les messages ne seront pas relaye´s, ce qui peut avoir
+de graves conse´quences suivant l’usage du re´seau de capteurs. De la meˆme fac¸on, la
+couche la plus haute et la couche la plus basse ne peuvent eˆtre totalement de´corre´le´es,
+les capteurs physiques devant re´pondre aux contraintes des applications.
+Ainsi, chaque couche a besoin des informations des autres couches. Pour optimiser
+au maximum les communications dans les réseaux de capteurs, toutes ces couches ne
+peuvent rester indépendantes les unes des autres et travailler seules. Il faudrait parvenir
+à supprimer ce découpage en couche et à fusionner les qualités logicielles et matérielles
+des capteurs. Le routage et les applications doivent pouvoir être déterminés en fonction
+128 CHAPITRE 6. CONCLUSION ET PERSPECTIVES
+des capacités physiques des capteurs et vice-versa. Les applications du réseau de cap-
+teurs doivent également guider les fonctionnalités qui doivent apparaître aux niveaux
+inférieurs. Ceci sera d’autant plus important quand on en viendra à faire communi-
+quer des objets hétérogènes qui auront des fonctions de surveillance différentes dans
+le réseau. En effet, il faudra maintenir l’inter-opérabilité entre les composants et le bon
+fonctionnement global du réseau. Si toutes les couches sont fusionnées, les différences
+entre ces objets seront masquées à la vue des capteurs.
+Bibliographie
+[1] I. Abraham, D. Malkhi, and O. Dobzinski. LAND : Locality Aware Networks
+for Distributed Hash Tables. In ACM-SIAM Symposium on Discrete Algorithms
+(SODA’04), New Orleans, LA, USA, 2004.
+[2] K. Alzoubi, P. Wan, and O. Frieder. New distributed algorithm for connected
+dominating set in mobile ad hoc networks. In 35th Annual Hawaii International
+Conference on System Sciences (HICSS’02), Hawaii, USA, January 2002.
+[3] A. Amis and Prakash. Load-balancing clusters in wireless ad hoc networks. In
+ASSET, Richardson, Texas, USA, March 2000.
+[4] A. Amis, R. Prakash, T. Vuong, and D. Huynh. Max-Min d-cluster formation in
+wireless ad hoc networks. In INFOCOM, Tel-Aviv, Israël, March 2000. IEEE.
+[5] B. An and S. Papavassiliou. A mobility-based clustering approach to support
+mobility management and multicast routing in mobile Ad-hoc wireless networks.
+International Journal of Network Management, 11(6) :387–395, November 2001.
+[6] F. Araujo, L. Rodrigues, J. Kaiser, L. Changling, and C. Mitidieri. CHR : A Distri-
+buted Hash Table for Wireless Ad Hoc Networks. In 4th International Workshop
+on Distributed Event-based Systems (DEBS’05), Columbus, Ohio, USA, June
+2005.
+[7] E. Baccelli. OLSR trees : A simple clustering mechanism for OLSR. In MED-
+HOC-NET 05, Porquerolles, France, June 2005.
+[8] E. Baccelli and P. Jacquet. Flooding techniques in mobile Ad-Hoc networks.
+Technical Report RR-5002, INRIA, 2003.
+[9] F. Baccelli, B. Błaszczyszyn, and M. Karray. Up and downlink admis-
+sion/congestion control and maximal load in large homogeneous CDMA networks.
+In Proc. of WiOpt, Sophia Antipolis, France, 2003. to appear in MONET Special
+Issue on Optimization of Wireless and Mobile Networks 10(2), April 2005.
+[10] H. Balakrishnan, M. F. Kaashoek, D. Karger, R. Morris, and I. Stoica. Looking
+up data in P2P systems. Communications of the ACM, 46(2) :43–48, February
+2003.
+[11] S. Banerjee and S. Khuller. A clustering scheme for hierarchical control in multi-
+hop wireless networks. In INFOCOM, Anchorage, Alaska, USA, April 2001.
+129
+130 BIBLIOGRAPHIE
+[12] S. Basagni. Distributed clustering for ad hoc networks. In International Sym-
+posium on parallel architectures algorithms and networks (I-SPAN’99), pages
+310–315, Fremantle, Australia, June 1999.
+[13] P. Basu, N. Khan, and T. Little. A mobility based metric for clustering in mobile
+ad hoc networks. In Distributed Computing Systems Workshop (DISC), 2001.
+[14] D. Bertsekas and R. Gallager. Data Networks. Prentice-Hall, 1987.
+[15] L. Blazevic, L. Buttyan, S. Capkun, S. Giordano, and J.-Y. Le Boudec. Self-
+organization in mobile ad-hoc networks : the approach of Terminodes. IEEE
+Communications Magazine, 39(6) :166–174, June 2001.
+[16] L. Blazevic, S. Giordano, and J.-Y. Le Boudec. Self-organized Terminode rou-
+ting. Journal of Cluster Computing, 5(2), April 2002.
+[17] S. Capkun, M. Hamdi, and J.-P. Hubaux. GPS-free positioning in mobile ad-hoc
+networks. In Proceedings of The 34th Hawaii International Conference on System
+Sciences (HICSS-34), Maui, Hawaii, USA, January 2001.
+[18] J. Cartigny. Contributions à la diffusion dans les réseaux ad hoc. PhD thesis,
+LiFL, Lille, December 2003.
+[19] J. Cartigny, F. Ingelrest, and D. Simplot-Ryl. RNG relay subset flooding protocol
+in mobile ad-hoc networks. IJFCS, pages 253–265, 2003.
+[20] M. Chatterjee, S. K. Das, and D. Turgut. WCA : A weight based distributed
+clustering algorithm for mobile ad hoc networks. Journal of Cluster Computing
+(Special Issue on Mobile Ad hoc Networks), 5(2) :193–204, April 2002.
+[21] G. Chelius, E. Fleury, B. Sericola, and L. Toutain. On the NAP Protocol. Techni-
+cal Report 5701, INRIA, 2005.
+[22] B. Chen and R. Morris. L+ : Scalable landmark routing and address lookup for
+multi-hop wireless networks. MIT LCS technical report 837, MIT, March 2002.
+[23] G. Chen, F. Garcia, J. Solano, and I. Stojmenovic. Connectivity-based k-hop
+clustering in wireless networks. In 35th Annual Hawaii International Conference
+on System Sciences (HICSS’02), Hawaii, USA, January 2002.
+[24] C. Chiang, H. Wu, W. Liu, and M. Gerla. Routing in clustered multihop, mobile
+wireless networks with fading channel. In ICCS/ISPACS’96, Singapore, Novem-
+ber 1996.
+[25] T. Clausen, P. Jacquet, A. Laouiti, P. Muhlethaler, A. Qayyum, and L. Viennot.
+Optimized Link State Routing Protocol, October 2003. RFC 3626.
+[26] F. Dai and J. Wu. Distributed dominant pruning in ad hoc networks. In ICC’03,
+Anchorage, Alaska, USA, May 2003.
+[27] O. Dousse, F. Baccelli, and P. Thiran. Impact of interferences on the connectivity
+of Ad Hoc networks. In Proc. of IEEE INFOCOM, San Francisco, USA, 2003. to
+appear in IEEE Transactions on Networking.
+[28] A. Ephremides, J. Wieselthier, and D. Baker. A design concept for reliable mobile
+radio networks with frequency hopping signaling. In IEEE 75, pages 56–73, 1987.
+[29] P. Erdös and A. Renyi. On Random Graphs. Publicationes Mathematicae, 1959.
+BIBLIOGRAPHIE 131
+[30] J. Eriksson, M. Faloutsos, and S. Krishnamurthy. Scalable ad hoc routing : The
+case for dynamic addressing. In INFOCOM, Hong Kong, China, March 2004.
+[31] L. M. Feeney and M. Nilsson. Investigating the energy consumption of a wi-
+reless network interface in an ad hoc networking environment. In INFOCOM,
+Anchorage, Alaska, USA, April 2001.
+[32] Y. Fernandess and D. Malkhi. k-clustering in wireless ad hoc networks. In ACM
+international workshop on Principles of mobile computing, Toulouse, France,
+2002.
+[33] P. Fraigniaud and P. Gauron. An overview of the content-addressable network
+D2B. In Proceedings of the 22nd ACM Symposium on Principles of Distributed
+Computing (PODC’03). ACM, July 2003.
+[34] M. R. Garey and D. S. Johnson. Computers and intractability : a guide to the
+theory of NP-completeness. W.H. Freeman & Company, New York, 1979.
+[35] M. Gerla and G. Pei. Fisheye State Routing Protocol (FSR). DRAFT draft-ietf-
+manet-fsr-02.txt, IETF, December 2001.
+[36] M. Gerla and J. T.-C. Tsai. Multicluster, mobile, multimedia radio network.
+ACM/Baltzer Journal of Wireless Networks, 1(3) :255–265, July 1995.
+[37] P. Gupta and P. Kumar. The capacity of wireless network. IEEE Trans. On
+Information Theory, 46(2) :388–404, March 2000.
+[38] T. Herman and S. Tixeuil. A distributed TDMA slot assignment for wireless
+sensor networks. In Proceedings of the First Workshop on Algorithmic Aspects of
+Wireless Sensor Networks (AlgoSensors’2004), number 3121 in Lecture Notes in
+Computer Science, Turku, Finland, July 2004. Springer-Verlag.
+[39] T.-C. Hou and T.-J. Tsai. An access-based clustering protocol for multihop wi-
+reless ad hoc networks. IEEE Journal on Selected Areas in Communications,
+19(7) :1201–1210, July 2001.
+[40] P. Jacquet, A. Laouiti, P. Minet, and L. Viennot. Performance analysis of OLSR
+multipoint relay flooding in two ad hoc wireless network models. Technical Re-
+port RR-4260, INRIA, September 2001.
+[41] P. Jacquet, A. Laouiti, P. Minet, and L. Viennot. Performance of multipoint re-
+laying in ad hoc mobile routing protocols. In Networking, Pisa, Italy, 2002.
+[42] M. Jiang, J. Li, and Y. Tay. Cluster Based Routing Protocol (CBRP). DRAFT
+draft-ietf-manet-cbrp-spec-01.txt, IETF, July 1999.
+[43] D. Johnson, D. A. Maltz, and Y.-C. Hu. Dynamic Source Routing (DSR), Fe-
+bruary 2003.
+[44] L. Kai and L. Jiandong. Mobile cluster protocol in wireless ad hoc networks. In
+International Conference on Communication Technology (ICCT’2000) Procee-
+dings, August 2000.
+[45] P. Krishna, N. H. Vaidya, M. Chatterjee, and D. K. Pradhan. A cluster based
+approach for routing in dynamic networks. In ACM SIGCOMM, pages 49–65.
+ACM, April 1997.
+132 BIBLIOGRAPHIE
+[46] B.-J. Kwak, N.-O. Song, and L. Miller. On the scalability of ad hoc networks.
+Communications Letters, IEEE, 8 :503– 505, 2004.
+[47] T. J. K. Kwon and M. Gerla. Efficient flooding with passive clustering (PC) - an
+overhead-free selective forward mechanism for ad hoc/sensor networks. Procee-
+dings of IEEE, 91 :1210–1220, 2003.
+[48] J. Li, R. Morris, J. Jannotti, D. S. Decouto, and D. R. Karger. A scalable location
+service for geographic ad hoc routing. In Proceedings of the 6th ACM Internatio-
+nal Conference on Mobile Computing and Networking (Mobicom’00), pages 120
+– 130. ACM, August 2000.
+[49] H. Lim and C. Kim. Multicast tree construction and flooding in wireless ad hoc
+networks. In ACM MSWiM Workshop at MobiCom 2000, Boston, MA, USA,
+August 2000.
+[50] C. R. Lin and M. Gerla. Adaptive clustering for mobile wireless networks. IEEE
+Journal of Selected Areas in Communications, 15(7) :1265–1275, 1997.
+[51] H.-C. Lin and Y.-H. Chu. A clustering technique for large multihop mobile wi-
+reless networks. In Vehicular Technology Conference (VTC’00), Tokyo, Japan,
+May 2000.
+[52] D. Malkhi, M. Naor, and D. Ratajczak. Viceroy : A scalable and dynamic emula-
+tion of the butterfly. In Proceedings of the 21st ACM Symposium on Principles of
+Distributed Computing (PODC’02), 2002.
+[53] B. Mans and N. Shrestha. Performance evaluation of approximation algorithms
+for multipoint relay selection. In The Third Annual Mediterranean Ad Hoc Net-
+working Workshop, MED-HOC-NET 04, Bodrum, Turkey, June 2004.
+[54] P. Maymounkov and D. Mazières. Kademlia : A peer-to-peer information system
+based on the XOR metric. In Electronic Proceedings for the 1st International
+Workshop on Peer-to-Peer Systems (IPTPS ’02), MIT Faculty Club, Cambridge,
+MA, USA, March 2002.
+[55] N. Mitton, E. Fleury, I. Guérin-Lassous, B. Séricola, and S. Tixeuil. On fast
+randomized colorings in sensor networks. Research Report LRI-1416, LRI, June
+2005.
+[56] R. Morris, J. Jannotti, L. Jinyang, and D. S. J. Decouto. Carnet : A scalable ad
+hoc wireless network system. In Proceedings of the 9th ACM SIGOPS European
+Workshop : Beyond the PC : New challenges for the operating system, September
+2000.
+[57] E. T. Ng and H. Zhang. Predicting Internet network distance with coordinates-
+based approaches. In INFOCOM, New-York, USA, June 2002.
+[58] D. Niculescu and B. Nath. Ad hoc positioning system (APS). In Proceedings of
+GLOBECOM’01, November 2001.
+[59] N. Nikaein, H. Labiod, and C. Bonnet. DDR-distributed dynamic routing algo-
+rithm for mobile ad hoc networks. In MobiHoc, Boston, MA, USA, November,
+20th 2000.
+BIBLIOGRAPHIE 133
+[60] T. Ohta, S. Inoue, and Y. Kakuda. An adaptive multihop clustering scheme for
+highly mobile ad hoc networks. In IEEE International Symposium on Autono-
+mous Decentralized Systems (ISADS’03), pages 293–300, April 2003.
+[61] C. Perkins. Ad hoc networking. Addison-Wesley, 2001.
+[62] C. Perkins, E. Belding-Royer, and S. Das. Ad hoc On-demand Distance Vector
+Routing, July 2003. RFC 3561.
+[63] J. Polastre, R. Szewczyk, and D. Culler. Telos : Enabling ultra-low power wireless
+research. In IPSN/SPOTS’05, Los Angeles, CA, USA, April 2005.
+[64] H. Pucha, S. M. Das, and Y. C. Hu. Ekta : An efficient DHT substrate for dis-
+tributed applications in mobile ad hoc networks. In WMCSA, pages 163–173,
+2004.
+[65] A. Qayyum, L. Viennot, and A. Laouiti. Multipoint relaying : An efficient tech-
+nique for flooding in mobile wireless networks. In HICSS’02, Hawaii, USA,
+January 2002.
+[66] R. Rajaraman. Topology control and routing in ad hoc networks : a survey. ACM
+SIGACT News, 33(2) :60–73, June 2002.
+[67] A. Ramalingam, S. Subramani, and K. Perumalsamy. Associativity-based clus-
+ter formation and cluster management in ad hoc networks. In 9th International
+conference on high performance computing (HiPC’02), Bangalore, India, De-
+cember 2002.
+[68] S. Ratnasamy, P. Francis, M. Handley, R. Karp, and S. Schenker. A scalable
+content-addressable network. In Proceedings of the 2001 conference on applica-
+tions, technologies, architectures, and protocols for computer communications,
+pages 161–172. ACM Press, 2001.
+[69] R. Riedi, P. Druschel, Y. C. Hu, D. B. Johnson, and R. Baraniuk. SAFARI : A self-
+organizing hierarchical architecture for scalable ad hoc networking.
+Research report TR04-433, Rice University, February 2005.
+[70] A. Rowstron and P. Druschel. Pastry : Scalable, distributed object location
+and routing for large-scale peer-to-peer systems. In Proceedings of the 18th
+IFIP/ACM International Conference on Distributed Systems Platforms (Middle-
+ware 2001), Heidelberg, Germany, November 2001.
+[71] C. Santivanez, B. McDonald, I. Stavrakakis, and R. R. Ramanathan. On the sca-
+lability of ad hoc routing protocols. In INFOCOM, New-York, USA, June 2002.
+[72] N. Santoro and R. Khatib. Labeling and implicit routing in networks. The com-
+puter Journal, 28 :5–8, 1985.
+[73] I. Stoica, R. Morris, D. Karger, M. F. Kaashoek, and H. Balakrishnan. Chord : A
+scalable peer-to-peer lookup service for Internet applications. In Proceedings of
+the 2001 conference on applications, technologies, architectures, and protocols
+for computer communications (Sigcomm’01), pages 149–160. ACM Press, 2001.
+[74] I. Stojmenovic, M. Seddigh, and J. Zunic. Dominating sets and neighbor
+elimination-based broadcasting algorithms in wireless networks. IEEE TPDS,
+13(1), January 2002.
+134 BIBLIOGRAPHIE
+[75] I. Stojmenovic and J. Wu. Broadcasting and activity scheduling in ad hoc net-
+works. IEEE Mobile Ad Hoc Networking, pages 205–229, 2004.
+[76] D. Stoyan, S. Kendall, and J. Mecke. Stochastic geometry and its applications,
+second edition. John Wiley & Sons, 1995.
+[77] J. Van Leeuwen and R. Tan. Interval routing. The computer Journal, 30 :298–307,
+1987.
+[78] A. C. Viana, M. Dias de Amorim, S. Fdida, and J. Ferreira de Rezende. Indirect
+routing using distributed location information. In PERCOM ’03 : Proceedings of
+the First IEEE International Conference on Pervasive Computing and Communi-
+cations, page 224, Washington, DC, USA, 2003. IEEE Computer Society.
+[79] A. C. Viana, M. Dias de Amorim, S. Fdida, and J. Ferreira de Rezende. Self-
+organization in spontaneous networks : the approach of DHT-based routing pro-
+tocols. Ad Hoc Networks Journal, 2005.
+[80] J. Wu and H. Li. A dominating set based routing scheme in ad hoc wireless
+networks. Telecommunication Systems, pages 13–36, 2001.
+[81] J. Wu and W. Lou. Forward node set based broadcast in clustered mobile ad
+hoc networks. Wireless Communications and Mobile Computing, 3(2) :141–154,
+2003.
+[82] J. Y. Yu and P. H. Chong. 3hBAC (3-hop between adjacent clusterheads) : A novel
+non-overlapping clustering algorithm for mobile ad hoc networks. In PacRim’03,
+Victoria, Canada, August 2003.
+[83] H. Zhai, Y. Kwon, and Y. Fang. Performance analysis of IEEE 802.11 MAC
+Protocols in wireless LANs. Wireless communications and mobile computing,
+4 :917–931, 2004.
+[84] B. Y. Zhao, L. Huang, J. Stribling, S. C. Rhea, A. D. Joseph, and J. Kubiatowicz.
+Tapestry : A resilient global-scale overlay for service deployment. IEEE Journal
+on Selected Areas in Communications, 22(1), January 2004.
diff --git a/examples/theses/Thesis_Calligari.pdf b/examples/theses/Thesis_Calligari.pdf
new file mode 100644
index 00000000..03a8dda1
Binary files /dev/null and b/examples/theses/Thesis_Calligari.pdf differ
diff --git a/examples/theses/Thesis_Calligari/fulltext.pdf b/examples/theses/Thesis_Calligari/fulltext.pdf
new file mode 100644
index 00000000..03a8dda1
Binary files /dev/null and b/examples/theses/Thesis_Calligari/fulltext.pdf differ
diff --git a/examples/theses/Thesis_Calligari/fulltext.pdf.txt b/examples/theses/Thesis_Calligari/fulltext.pdf.txt
new file mode 100644
index 00000000..c389c8da
--- /dev/null
+++ b/examples/theses/Thesis_Calligari/fulltext.pdf.txt
@@ -0,0 +1,5930 @@
+Signature of protein adaptation to warm deep sea
+environments: the case of Initiation Factor 6 studied by
+molecular simulation and neutron scattering.
+Paolo Calligari
+To cite this version:
+Paolo Calligari. Signature of protein adaptation to warm deep sea environments: the case of
+Initiation Factor 6 studied by molecular simulation and neutron scattering.. Biological Physics.
+Université Pierre et Marie Curie - Paris VI, 2008. English. <tel-00368866>
+HAL Id: tel-00368866
+https://tel.archives-ouvertes.fr/tel-00368866
+Submitted on 17 Mar 2009
+HAL is a multi-disciplinary open access archive for the deposit and dissemination of
+scientific research documents, whether they are published or not. The documents may come from
+teaching and research institutions in France or abroad, or from public or private research centers.
+L’archive ouverte pluridisciplinaire HAL, est destinée au dépôt et à la diffusion de documents
+scientifiques de niveau recherche, publiés ou non, émanant des établissements d’enseignement et de
+recherche français ou étrangers, des laboratoires publics ou privés.
+THÈSE DE DOCTORAT DE
+L’UNIVERSITÉ PIERRE ET MARIE CURIE - PARIS 6
+Spécialité:
+interfaces de la biologie avec la physique, la chimie et
+l’informatique
+Pour obtenir le grade de
+Docteur de l’Université Pierre et Marie Curie
+Présenté par:
+paolo calligari
+SIGNATURE DE L’ADAPTATION DES PROTÉINES
+À L’ENVIRONNEMENT DES FONDS MARINS CHAUDS :
+le cas du Facteur d’Initiation 6 étudié par simulation moléculaire et diffusion de neutrons
+Paris, 18 Décembre 2008
+Devant le jury composé par:
+Prof. Cristian Micheletti (Rapporteur)
+Prof. Roger Fourme (Rapporteur)
+Prof. Françoise Gaill (examinatrice)
+Dr. Joel Pothier (examinateur)
+Dr. Giuseppe Zaccai (examinateur)
+Prof. Mark Johnson (examinateur)
+Prof. Gerald R. Kneller (directeur de thèse)
+
+thèse préparée au sein de:
+INSTITUT LAUE LANGEVIN (Grenoble)
+et
+LABORATOIRE LEON BRILLOUIN (CEA Saclay, Gif-sur-Yvette)
+
+Dedicated to Francesca Romana.
+
+ABSTRACT
+Signature of protein adaptation to warm deep sea environments: the case of Initiation Fac-
+tor 6 studied by molecular simulation and neutron scattering.
+The protein Initiation Factor 6 (IF6) takes part in the protein synthesis regulation of several
+organisms. It was also found in archaebacteria such as Methanococcus jannaschii, which lives in
+the deep sea near hydrothermal vents where temperature reaches 80°C and pressure is between
+250 bar and 500 bar. The aim of this work was to study for the first time the dynamical and
+structural properties of IF6 produced by M. jannaschii and to compare them with those of
+the IF6 homologue present in Saccharomyces cerevisiae, which lives at "normal" environmental
+conditions (27°C and 1 bar).
+Molecular simulation gave here new insights into the adaptation of these two proteins to their
+respective physiological conditions and showed that the latter induced similar dynamical and
+structural properties: in their respective "natural" conditions, IF6s show very similar structural
+fluctuations and the characteristic relaxation times which define their dynamical properties
+show similar changes when comparing unfavorable conditions to physiological ones. The
+creation of these corresponding states between the two homologues has been interpreted by
+the fractional Brownian dynamics model and by a novel method for the characterization of
+protein secondary structures. The latter is presented here in detail together with some exam-
+ples of other applications. Experimental data obtained from quasi-elastic neutron scattering
+seemed to support the results obtained by molecular simulations.
+Keywords : Initiation Factor 6, molecular dynamics, neutron scattering, pressure, fractional
+Brownian dynamics model, warm deep sea, protein secondary structure
+vii
+RÉSUMÉ
+Signature de l’adaptation des protéines à l’environnement des fonds marins chauds: le
+cas du Facteur d’Initiation 6 étudié par simulation moléculaire et diffusion de neutrons.
+Le Facteur d’Initiation 6 (IF6) est une protéine qui participe, dans plusieurs organismes, à
+la régulation de la synthèse des autres protéines. Elle a été trouvée aussi dans l’archaebactérie
+Methanococcus jannaschii qui vit au fond de la mer, près des cheminées hydrothermales, où la
+température atteint 80◦C et la pression hydrostatique est entre 250 et 500bar. L’objectif de ce
+travail a été celui d’étudier pour la première fois les propriétés dynamiques et structurales de
+la IF6 issue du M.Jannaschii en comparaison avec celles de son homologue présent dans le
+Saccharomyces cerevisiae qui vit dans des conditions environnementales "normales" (27◦C et
+1bar).
+La simulation moléculaire nous a permis de montrer que l’adaptation de ces deux protéines
+aux conditions physiologiques induit des propriétés dynamiques et structurales similaires:
+dans leurs conditions "naturelles" respectives, les deux protéines montrent des fluctuations
+structurales très similaires et les temps caractéristiques qui identifient leurs propriétés dy-
+namiques subissent les mêmes changements dans la transition d’une condition défavorable
+vers la condition physiologique.
+Cette création d’ "états correspondants" entre les deux protéines a été étudiée par le modèle
+de dynamique Brownienne fractionnaire et par une nouvelle méthode pour la caractérisation
+des structures secondaires des protéines. Cette dernière est présentée en détail avec de brefs
+exemples d’autres applications. Les données préliminaires obtenues par diffusion de neutrons
+semblent confirmer les résultats issus des simulations moléculaires.
+Mots clés : Facteur d’Initiation 6, dynamique moléculaire, diffusion de neutrons, pression,
+modèle Brownien fractionnaire, fonds marins chauds, structure secondaire des protéines.
+viii
+PUBLICATIONS
+Some ideas and figures have appeared previously in the following publications:
+1) Calligari P.A. et al., Inhibition of viral group-1 and group-2 neuraminidases by oseltamivir:
+a comparative structural analysis by the ScrewFit algorithm. Biophysical Chemistry, accepted
+for publication (2008).
+2) Calligari P.A. and Kneller G.R., ScrewFit : a novel approach for continuum protein sec-
+ondary structure assessments. Submitted (2008).
+3) Calandrini V., Hamon V., Hinsen K., Calligari P., Bellissent-Funel M.-C. and Kneller G.R.,
+Relaxation dynamics of lysozyme in solution under pressure: combining molecular dynamics
+and quasielastic neutron scattering. Chemical Physics, 345, 289-297 (2008).
+4) Hamon V., Calligari P., Hinsen K., Kneller G.R. Simulation studies of structural changes and
+relaxation processes in lysozyme under pressure, J. of Non-Crystalline Solids, 352, 4417-4423
+(2006).
+5) Kneller G.R. and Calligari P., Efficient characterisation of protein secondary structure in
+terms of screw motions. Acta Crystallographica D62, 302-311, (2006).
+ix
+
+Il est certain que beaucoup de choses vont bien dans la nature,
+c’est-à-dire vont en sorte de pouvoir durer et se conserver, ce
+qu’elles ne pourraient faire autrement. Mais une infinité d’autres
+vont mal (et peut-être un plus grand nombre), sont mal organisées,
+moralement et physiquement, avec un immense inconvénient pour
+les créatures; ces choses auraient pu à peu de différence près être bien organisées.
+— Giacomo Leopardi, Zibaldone di pensieri [N. 4248]
+REMERCIEMENTS
+Ce travail de thèse a été effectué à l’Institut Laue Langevin de Grenoble et au Laboratoire
+Léon Brillouin au Commissariat à l’Energie Atomique de Saclay, sous la direction du
+professeur Gerald KNELLER à qui s’adressent mes premiers remerciements pour m’avoir
+accueilli dans son équipe et pour avoir su équilibrer, dès le premier jour, mon enthousiasme
+envers la biologie avec de bonnes doses de physique théorique. Je lui serai toujours
+reconnaissant de ne pas m’avoir laissé oublier mes origines de physicien.
+Je suis pareillement reconnaissant envers Mark JOHNSON, qui a co-dirigé ma thèse. À lui
+vont mes remerciements pour avoir suivi et coordonné mon travail en me laissant toute la
+liberté d’expérimenter, d’essayer et de me planter devant les problèmes comme le font les
+"vrais" chercheurs. Je lui dois toute ma gratitude pour la confiance qu’il m’a réservée ainsi que
+pour son support dans les moments les plus difficiles.
+Envers mes deux directeurs un remerciement supplémentaire pour avoir su être amis en
+outre que simples "chefs"...
+Je voudrais aussi exprimer ma gratitude envers les membres du jury: la présidente
+Françoise GAILL, Cristian MICHELETTI et Roger FOURME qui ont accepté d’être
+rapporteurs de mon mémoire, Giuseppe ZACCAI et Joel POTHIER.
+Je tiens ensuite à remercier les collaborateurs du professeur Kneller, Vania CALANDRINI
+et Konrad HINSEN pour tout ce qu’ils m’ont appris et pour leur aide précieuse dans mon
+travail partagé entre les neutrons et les simulations numériques.
+xi
+Je suis particulièrement reconnaissant envers Jacques OLLIVIER et Jean-Baptiste ARTERO
+qui ont partagé avec moi "la quotidienneté" de mon travail (et notamment des expériences de
+laboratoire, pas toujours encourageantes...!). Je remercie Jacques pour ce qu’il m’a appris, pour
+sa patience envers les côtés les plus étranges (surtout au monde des neutrons) de mon projet de
+thèse et pour m’avoir accompagné dans nos expériences de diffusion de neutrons au Paul
+Scherrer Institut (Zurich, Switzerland) et au NIST (Maryland, USA).
+Une partie fondamentale de ce projet a été possible seulement grâce aux enseignements
+de Jean-Baptiste qui m’a guidé dans le monde de la biologie moléculaire et dans les
+expériences lourdes et souvent peu généreuses d’expression et de purification des protéines. Je
+sais qu’il a dû éprouver un goût très particulier en voyant un pauvre physicien faire des
+bêtises sur la paillasse mais moi j’ai trouvé ma "vengeance" avec la coupe du monde de
+football....."Campioni del mondo!!!"
+Je ne peux pas oublier les autres collègues des laboratoires qui ont vu ma présence, souvent
+fugace, durant mon séjour à Grenoble: j’ai parcouru ma mémoire des deux années passées et
+je vous ai tous retrouvés pour votre amitié, vos encouragements, votre patience (je pense
+surtout aux collègues du DEUTERATION LAB !! ), votre aide directe et constante, pour avoir
+supporté mon travail et pour beaucoup d’autres choses.... Merci!
+A mes amis et ma famille:
+A Paris: Andrea et Adrien, merci pour les discussions hors cerveau et/ou hors logique, elles
+ont souvent sauvé ma stabilité mentale. A Grenoble: Mauro, merci pour nos nombreuses
+pauses café à mi-chemin entre nos rêves et nos ambitions. Merci à Giada, Bea, Fabrizio, i
+Fratini pour les beaux moments. Un merci général à tous mes amis pour avoir supporté ma
+passion pour l’évolutionnisme et pour avoir écouté avec patience mes contes sur l’histoire du
+pauvre Kiwi.
+Un merci à ma famille et à mes amis à Rome qui ont vécu et participé à distance mes petits
+succès et faillites...
+Enfin, en dehors de toute cette liste, une seule personne n’a pas besoin d’être remerciée ici
+parce qu’elle a vécu tout ce que j’ai vécu et elle sait bien que tout cela n’aurait jamais pu
+être sans sa présence, son support, sa compréhension et sa confiance pleins d’amour. Cette
+personne est devenue, au fil de cette thèse, mon épouse et c’est à elle que toutes ces années de
+travail sont dédiées: "grazie amore".
+xii
+Part I
+RÉSUMÉ SUBSTANTIEL
+
+RÉSUMÉ SUBSTANTIEL
+0.1 introduction
+Dès le début du dernier siècle, les acquis sur la matière inanimée ont amené les physiciens
+à se demander comment ces connaissances pouvaient être aussi appliquées à la matière
+biologique. La matière vivante présentait aux chercheurs une hétérogénéité et une complexité de
+cas qu’ils n’avaient jamais rencontrées en physique. Elle a ainsi donné naissance à un nouveau
+filon de recherche interdisciplinaire qui, alliant les domaines de la physique, la chimie et la
+biologie, a fourni des résultats très importants et utiles pour des applications successives en
+médecine et en biotechnologie.
+Ce travail de thèse puise ses sources dans le considérable progrès fait dans le domaine de la
+physique biologique notamment en ce qui concerne le développement de nouvelles méthodes
+de calcul, ainsi qu’à l’application des techniques de spectroscopie sur des échantillons
+biologiques.
+0.1.1 Organismes adaptés aux environnements extrêmes
+Organisms are integrated entities, not collections of discrete objects 1
+Les effets de la pression et de la température sur les propriétés structurales des protéines
+sont visibles à plusieurs échelles, des interactions non-covalentes de très courte portée, telles
+que les liaisons hydrogène, jusqu’aux interactions à plus longue portée comme les interactions
+électrostatiques. Tout changement dû à une variation des variables thermodynamiques peut
+être interprété par le principe de Le Chatelier, selon lequel toute perturbation sur un système
+à l’équilibre provoque une réaction contraire de façon à diminuer l’effet de cette perturbation.
+Dans le cas considéré, l’application de la pression à une protéine favorise des processus
+qui s’accompagnent d’une diminution du volume. Ces processus agissent directement sur
+la structure de la protéine, entraînant des changements des interactions non-covalentes
+1 "Les organismes sont des entités intégrées, ils ne sont pas des collections d’objets discrets". The spandrels of San Marco
+and the Panglossian paradigm: a critique of the adaptationist programme, S.J. Gould and R.C. Lewontin, Proc.
+Royal Soc. London B, 205, 581-598, (1979).
+xv
+qui se forment ou se défont à l’intérieur de la structure. Ces changements produisent des
+effets différents sur les trois niveaux de structuration des protéines (secondaire, tertiaire et
+quaternaire)[144].
+Dans cette thèse nous avons abordé les effets de la pression et de la température dans
+un contexte particulier, celui des environnements des fonds marins près des cheminées
+hydrothermales où l’on trouve normalement des pressions et des températures très hautes. En
+outre, comme suggéré par la phrase citée au début de cette section, nous voulons souligner le
+fait que l’étude de l’adaptation des protéines aux environnements extrêmes pourrait être
+largement améliorée par la connaissance du cadre général de l’adaptation cellulaire. Dans le
+texte de cette thèse nous avons donné un bref aperçu du sujet tout en renvoyant à d’autres
+publications pour des approfondissements de l’argument [85, 93, 182, 158, 107, 151, 191, 58].
+La biosphère, c’est-à-dire la surface de la Terre connue comme lieu accueillant la vie,
+varie entre les régions abyssales des fonds marins et les hauteurs de l’Himalaya et offre une
+grande variété d’exemples d’organismes adaptés aux conditions extrêmes. D’un point de
+vue qualitatif, les limites physiques et chimiques pour accueillir des formes de vie sont les
+suivantes[92]:
+• −40◦C < T < 115◦C
+• P < 1.2kbar
+• ∼ 1 < pH < 11
+D’un point de vue évolutionniste, les organismes qui vivent dans des conditions proches de
+ces limites ont dû trouver des façons pour compenser tous les effets chimiques et physiques
+que ces limites mêmes peuvent générer sur l’ensemble de structures constituant les cellules.
+Autrement dit, les organismes qui sont devenus extrêmophiles ont trouvé des stratégies pour
+protéger leur système de vie des dégâts produits par l’environnement. D’après le peu qu’on
+connaît sur le fonctionnement de ces mécanismes, il y a deux démarches principalement
+suivies par les organismes. La première est la compensation des processus de dégradation
+à travers un réglage fin des taux de synthèse des biomolécules de façon qu’ils soient
+compatibles avec le temps moyen de survie des molécules. La deuxième est l’incorporation
+de mutations ponctuelles dans les séquences des protéines afin d’augmenter leur stabilité
+structurale, leur permettant de fonctionner plus longtemps. Apparemment, cette stratégie ne
+produit pas de différences remarquables dans la distribution globale des acides aminés dans
+xvi
+des protéines extrêmophiles par rapport à celles mesophiles, c’est à dire issues d’organismes
+vivant dans des conditions dites normales (température à 300 K et pression à 1 bar) [48].
+Par conséquent, il semble assez évident que l’adaptation des biomolécules doit être liée à
+la présence de différents motifs locaux dans les séquences des acides aminés entraînant une
+réorganisation des interactions faibles non-covalentes qui règlent la stabilité et la flexibilité
+des protéines. Le new deal pour la stabilité des protéines extrêmophiles se fait donc par une
+réorganisation des mécanismes sensibles aux changements environnementaux. D’un point de
+vue physique, une mesure quantitative de la stabilité des protéines peut être obtenue par
+les différences d’énergie libre de Gibbs, ∆G(T ,P,N), entre l’état le plus stable et les minima
+locaux les plus proches. Jaenicke et Böhm [96] ont montré que les protéines mesophiles
+et extrêmophiles partagent un ∆G du même ordre de grandeur ($\sim 50\ \mathrm{kJ\,mol^{-1}}$) même si
+les extrêmophiles montrent une plus large variabilité dans l’intervalle $10$–$100\ \mathrm{kJ\,mol^{-1}}$.
+Les différences trouvées entre les protéines mesophiles et extrêmophiles correspondent à
+l’énergie nécessaire à la formation ou à la rupture de quelques interactions non-covalentes, ce
+qui confirme le rôle fondamental que ces dernières jouent dans le contexte de l’adaptation
+moléculaire [157, 147, 151, 158].
+Le point central dans l’adaptation des biomolécules reste, de toute façon, la conservation
+des fonctionnalités biologiques représentant un compromis bien équilibré entre stabilité
+et flexibilité [197, 92]. Le processus d’adaptation se manifeste, donc, sous forme d’une
+transformation des propriétés des protéines mesophiles vers les conditions extrêmes, c’est à
+dire, vers des conditions physiologiques qui rendent les propriétés moléculaires des variétés
+extrêmophiles très similaires à celles des mesophiles. Cette translation est obtenue par la
+réorganisation des liaisons non-covalentes. Plusieurs expériences ont mis en évidence ce
+processus [217] et elles ont montré que les propriétés dynamiques de quelques enzymes
+mesophiles à une température de 25◦C sont très similaires à celles de leurs homologues
+extrêmophiles à 70◦C. Des résultats analogues ont été obtenus par une étude de simulation
+de dynamique moléculaire sur les différents homologues de la rubredoxine [69].
+Dans ce contexte Jaenicke [93] a supposé que l’adaptation moléculaire à des environnements
+extrêmes puisse fonctionner grâce à un maintien d’états correspondants entre les environ-
+nements natifs, en tenant compte de la topologie générale, de la flexibilité et de l’hydratation
+des protéines. Même si cette idée a trouvé plusieurs confirmations dans le passé, des études
+récentes ne semblent pas la confirmer entièrement[158].
+xvii
+0.1.2 L’environnement typique des fonds marins chauds
+Contrairement à l’opinion générale, les environnements terrestres, où la pression est d’environ
+1bar, occupent seulement 1% du volume total de la biosphère. Une partie considérable de la
+surface terrestre (70%) est couverte par les océans qui ont une profondeur moyenne de 3800
+mètres et donc une pression moyenne de 380bar. Plus du 60% de la biosphère marine est à
+1000 mètres sous le niveau de la mer. La vie au dessous de cette profondeur, normalement
+considérée comme la limite pour les environnements dits fonds marins, doit faire face à
+plusieurs conditions défavorables liées aux changements de la pression (de 1 à 1.1 kbar) et de
+la température (de 1 à 110◦C) qui ont des impacts très importants sur les mécanismes vitaux.
+Une nouvelle ligne de recherche sur les organismes qui vivent dans les sédiments marins
+a été entreprise entre le XIXème et le XXème siècle par Certes[30, 29] suivi par ZoBell et
+Johnson [220] dont les recherches ont mieux éclairé les stratégies de survie employées par
+les organismes pour faire face aux conditions extrêmes.
+Grâce à ce courant de recherche nous pouvons aujourd’hui distinguer les organismes en
+fonction de leur capacité d’adaptation aux hautes pressions: les barophiles (ou piezophiles)
+qui ont une croissance optimale à des pressions supérieures à celle atmosphérique; les
+barotolerants (ou piezotolerants) qui sont des organismes capables de vivre à hautes pressions
+tout en ayant leur taux de croissance optimale à pression atmosphérique; enfin, les organismes
+piezosensibles qui se distinguent des autres parce que leur croissance est très sensible aux
+pressions élevées.
+A la fin des années 70, les premières colonies d’organismes dans les fonds marins ont été
+trouvées à proximité des cheminées hydrothermales, des courants qui se forment où la lave
+extrudée se refroidit en se contractant et permet à l’eau de mer d’entrer dans les fissures
+des rochers basaltiques à peine formées. L’eau de mer est ensuite expulsée très enrichie de
+métaux lourds formant des courants à très haute température [98].
+La vie autour des cheminées hydrothermales est devenue très rapidement l’un des sujets les
+plus intrigants dans le domaine de la biologie des fonds marins et la plupart des organismes
+barophiles connus à ce jour sont de facto aussi thermophiles, c’est à dire ils ont montré un
+plus haut taux de croissance à des températures plus élevées (typiquement entre 50 et 90◦C)
+que celles caractéristiques des fonds marins (environ 2◦C) [1].
+xviii
+Cet environnement des fonds marins chauds a introduit sous le plan biologique et
+évolutionniste plusieurs questions de grand intérêt qui ont demandé aussi des nouvelles
+explications par la biochimie et la physique.
+methanococcus jannaschii Cette thèse a comme objet l’étude d’une protéine
+produite par une archaebacterie, le Methanococcus Jannaschii, qui vit près des cheminées
+hydrothermales. Cet organisme, découvert en 1983 [102], vit normalement à des températures
+entre 48 et 94 ◦C, avec une température optimale de 85◦C, et à des pressions supérieures aux
+200 bar (profondeur in situ 2600 mètres).
+Le génome du M Jannaschii a été le premier parmi les génomes des archaebacteries dont on
+a obtenu le sequençage complet [18] ce qui révéla des relations évolutives complexes entre
+les archaea, les eucaryotes et les bactéries: seulement moins de la moitié des gènes trouvés
+dans son génome pouvait, en fait, être reliée à ceux des autres organismes. Dans le cadre de
+cette thèse, d’un point de vue de la biologie moléculaire, la propriété la plus intéressante
+de cet organisme est due au fait que tout en partageant les mécanismes de biosynthèse des
+eucaryotes, le M.Jannaschii possède des gènes pour la fonction d’initiation du processus de
+traduction homologues soit à ceux des eucaryotes soit à ceux des bactéries. Cette fonction est
+une partie fondamentale de la traduction de l’ARN messager et sera présentée en détail plus
+avant dans le texte.
+Des études ont montré que le métabolisme du M Jannaschii et sa croissance à haute
+température sont favorisés par la pression jusqu’à 750 bar et que les limites pour la croissance
+sont atteintes à 90◦C soit à basse ou à haute pression [102]. Ces résultats suggèrent que le
+M.Jannaschii est effectivement un organisme barophile et pas seulement barotolerant. Cette
+conclusion semble être aussi confirmée par des études de réaction enzymatique qui ont montré
+que l’application d’une pression de 500bar peut augmenter jusqu’à cinq fois le temps moyen
+de vie de l’hydrogènase du M.Jannaschii à 90◦C [74] et jusqu’à 3 fois celui de la protease à 125
+◦C [138]. Néanmoins, des études récentes ont montré que la pression inhibait la fonction du
+20S proteasome du M Jannaschii [55], suggérant ainsi que dans certains cas la moindre activité
+d’une protéine à la pression native pourrait être un mécanisme de régulation conférant des
+avantages à la cellule entière. Par conséquent, un comportement bien plus complexe de la
+cellule par rapport aux hautes pressions et aux hautes températures devra être envisagé.
+xix
+0.1.3 Le facteur d’anti-association
+Nous présentons ici une brève introduction sur la protéine qui fait l’objet de ce travail de
+thèse, appelée Facteur d’anti-association [170, 199].
+Le facteur d’anti-association fait partie de la famille des facteurs d’initiation et il prend aussi
+le nom de Facteur d’initiation 6 (IF6).
+Le IF6, comme les autres facteurs d’initiation, prend part aux premières étapes du processus
+de traduction ARN-messager des ribosomes. Le rôle du IF6 dans l’initiation de la traduction
+est bien plus complexe que celui des autres facteurs d’initiation parce qu’il engendre diverses
+fonctions qu’on connaît très mal. D’abord, IF6 n’agit pas comme un vrai facteur d’initiation
+parce qu’il ne forme aucun complexe d’initiation, c’est à dire qu’il ne forme pas de complexe
+macromoléculaire avec les mARN, tARN et les sous-unités du ribosome dans les premières
+étapes de la traduction. Ceci est prouvé par le fait que la déplétion du IF6 ne bloque pas la
+traduction du mARN in vitro [178].
+Les fonctions principales de cette protéine peuvent être résumées comme suit:
+- IF6 est requis dans la biogenèse de la sous-unité ribosomale 60S aussi bien dans les archaebac-
+téries que dans les eukaryotes [173, 178, 177, 212]
+- elle agit de facto comme un facteur qui règle l’association des sous-unités ribosomales
+60S et 40S dans le cytoplasme [178, 28]
+Ces fonctions, conservées dans plusieurs organismes, ont été prouvées par un grand
+nombre d’études et sont vérifiées par la présence de cette protéine dans le cytoplasme et dans
+le noyau des cellules. Dans le cadre de ce travail de thèse il est important aussi de noter que
+le IF6 a été montré comme très sensible aux hautes températures : dans certains homologues
+eukaryotes[178, 10], l’activité du IF6 a affiché un optimum autour de 37◦C alors qu’elle était
+totalement absente entre 50 et 60 ◦C. A l’état actuel, il parait très difficile d’établir si cet arrêt
+des fonctions du IF6 correspond aussi à une dénaturation.
+D’un point de vue moléculaire, les IF6 sont des protéines d’environ 26kDa qui partagent une
+séquence conservée de 224 résidus avec une similarité de 30%. Toutes les formes eukaryotes
+de la IF6, contiennent une partie carboxy-terminale de 21 acides aminés. Même si cette queue
+ne semble pas être directement impliquée dans la fonction d’anti-association du IF6[66], il a
+été prouvé qu’elle était reliée à cette dernière[28].
+En 2000, les premières structures moléculaires du IF6 ont été résolues par des études
+de cristallographie par rayons X [66]. Il s’agit des structures de deux homologues du IF6:
+xx
+celui du M.Jannaschii et celui du Saccharomyces cerevisiae. Les deux structures ont révélé une
+pseudo-symétrie interne créée par la disposition, autour d’un centre commun, de cinq copies
+d’un domaine α/β d’environ 45 résidus. Chaque domaine contient: une longue hélice α,
+une autre plus courte ou une hélice $3_{10}$ et trois brins β. Contrairement à la structure des
+premiers 224 résidus qui est connue et a été prouvée par homology modeling être conservée
+évolutivement[66], très peu a été révélé sur la structure de l’extension C-terminale de 21
+acides aminés.
+D’un point de vue structural, il faut aussi remarquer que les cinq domaines sont disposés
+d’une façon qui ne crée pas un centre hydrophobique. Au contraire, dans leur association, ils
+produisent un "tore" hydrophobe qui, à son tour, forme un centre creux dans la structure de la
+protéine. Cette cavité est assez large pour faire passer plusieurs molécules d’eau. Seize de ces
+molécules ont été trouvées aussi dans les structures cristallographiques, dans une configuration
+très ordonnée à couches pentagonales et dont les hydrogènes interagissent avec les oxygènes
+carbonyles des résidus dans les brins β voisins. Dans l’homologue provenant de la levure
+(Saccharomyces cerevisiae), le IF6 montre cette cavité fermée par une arginine (résidu 61) dont
+le groupement guanidinium forme plusieurs liaisons hydrogènes avec les glycines des courtes
+hélices α de chaque domaine.
+0.2 matériels et méthodes
+Cette section propose un bref aperçu des techniques utilisées pour la préparation des échan-
+tillons qui ont été étudiés par diffusion des neutrons et de ceux qui ont été simulés par
+dynamique moléculaire. Pour une présentation complète du cadre théorique dans lequel
+ces techniques ont été appliquées nous renvoyons au deuxième chapitre de la thèse et aux
+références [3, 56, 13, 129].
+Dans le texte qui suit, les deux IF6 homologues seront indiqués par les acronymes suivants:
+- aIF6: IF6 extremophile produit par Methanococcus Jannaschii
+- eIF6: IF6 mésophile produit par Saccharomyces cerevisiae
+0.2.1 Production des échantillons expérimentaux
+Les échantillons expérimentaux étudiés ici par diffusion de neutrons, ont été produits à
+travers des étapes préliminaires qui demandaient notamment des connaissances en biologie
+xxi
+moléculaire. Cette thèse rapporte un protocole développé pour le IF6 qui vise à obtenir un
+rendement suffisant et compatible avec les quantités d’échantillons requis par les expériences
+de diffusion de neutron. Ce protocole suit le schéma usuel pour la production de protéines et
+qui peut être résumé comme suit:
+- Clonage de la partie de l’ADN génomique de Methanococcus Jannaschii et Saccharomyces
+cerevisiae qui codifie le IF6.
+- Expression du gène identifié dans un organisme hôte, dans le cas considéré ici le E.coli,
+afin de produire une grande quantité de protéines.
+- Purification de la protéine produite par l’organisme hôte afin de la séparer des autres
+protéines et d’obtenir une solution assez pure ne contenant que la IF6.
+Afin d’améliorer le rendement du protocole de purification, nous avons utilisé une queue
+polyhistidine N-terminale (H-Tag) qui a permis de maintenir une concentration suffisante
+aussi pour des expériences de diffusion de neutrons à hautes pressions, ce qui, comme
+on le verra après, demande l’utilisation de grands volumes de solution. Néanmoins, des
+raisons techniques ont fortement limité le clivage de cette queue "marqueur" du IF6 en
+grands volumes de solution. Pour cette raison, ce clivage a été fait seulement à pression
+ambiante où les expériences pouvaient être faites avec des volumes adaptés. Il a été montré
+que la présence de la H-Tag n’a pas d’effets significatifs sur la structure des protéines [23]
+mais, vu son exposition au solvant qui entoure les protéines, elle pourrait avoir un effet
+dynamique important. Pour cette raison, afin de vérifier les effets produits dans le cas du
+IF6, des simulations de dynamique moléculaire ont été réalisées aussi sur un modèle du aIF6
+joint à la H-Tag.
+clivage du fragment c-terminal du eif6 Pendant les tests préliminaires pour
+l’optimisation du protocole ( cfr. ci-dessus) un clivage protéolytique du eIF6 a été observé
+(voir Figure 13, dans le texte de cette thèse, pour vérification SDS-PAGE) soit dans la partie
+soluble soit dans celle insoluble des fractions de purification du lysate cellulaire. A cause de
+son poids moléculaire modéré, le fragment clivé a été supposé être le même trouvé par Groft
+et al. [66]. Ces derniers ont rapporté le fait que les tentatives d’expression et purification du
+eIF6 étaient rendues très difficiles par le clivage protéolytique du fragment C-terminal.
+La partie clivée du eIF6 est formée de 21 acides aminés avec une séquence, affichée dans
+le Tableau 1, présente uniquement dans les homologues eukaryotes du IF6 dont on sait
+xxii
+très peu. En outre, une caractérisation par alignement multiple avec des bases de données
+d’autres séquences connues a montré que ce fragment n’est présent que dans les IF6, ce qui
+prouve son importance pour la fonctionnalité du IF6 même ou bien pour son histoire évolutive.
+Table 1: La séquence du fragment C-terminal du eIF6 (CTAIL). La numérotation suit celle utilisée dans
+le PDB 1G62.
+Glu225 Asp226 Ala227 Gln228 Pro229 Glu230 Ser231 Ile232
+Ser233 Gly234 Asn235 Leu236 Arg237 Asp238 Thr239 Leu240
+Ile241 Glu242 Thr243 Tyr244 Ser245
+Afin de mieux comprendre la structure native de cette queue C-terminale, nous avons
+examiné sa structure secondaire à l’aide d’outils de prédiction qui ont vérifié la probable
+présence d’une hélice-α dans la partie finale du fragment, la région DTLIE. Ce résultat a
+été confirmé par l’inspection du profil hydrophobe du fragment à l’aide de l’échelle de
+Kyte/Doolittle [122] qui montre une augmentation de l’hydrophobicité dans la même région.
+Finalement, cette étude préliminaire nous a convaincus que le fragment C-terminal du
+eIF6 joue un rôle significatif soit dans la dynamique soit dans la structure du eIF6 et donc
+aussi dans sa fonction. Cette idée est renforcée par d’autres résultats qui indiquent que les
+domaines C-terminaux contribuent à la localisation du eIF6 dans le noyau cellulaire [6]. Ces
+conclusions nous suggèrent l’importance d’exprimer et de purifier le eIF6 avec la queue
+C-terminale de 21 acides aminés et à ce propos plusieurs tests ont été mis en place pour
+réduire le clivage pendant les différentes phases de production. Le protocole présenté dans
+ce texte a donné les meilleurs résultats avec un clivage réduit d’environ 30% (voir la Figure
+14 dans le texte pour une vérification par spectrométrie de masse MALDI).
+stabilité du eif6 Afin d’aborder une étude visant les effets des conditions extrêmes
+sur les propriétés d’une protéine, il est nécessaire, tout d’abord, d’établir quelles sont les
+limites qui définissent les conditions normales pour la même protéine. Dans le cas des IF6, la
+connaissance de ces limites est très limitée à cause d’un manque d’études approfondies sur
+les propriétés chimiques de cette protéine. Ainsi, si pour le aIF6 on peut facilement supposer
+xxiii
+au moins une réponse réversible aux hautes pressions et températures, les conclusions sur les
+eIF6 sont très limitées.
+Dans notre démarche, nous avons d’abord procédé à un examen préliminaire afin de
+vérifier la stabilité de eIF6 aux hautes températures. Pour cela, nous avons fait référence au
+travail de Valenzuela et al. qui a montré la cessation de l’activité du eIF6 à des températures
+au-delà de 60 ◦C. Une étude par diffusion de lumière, réalisée pour vérifier les conclusions
+de Valenzuela et al., a montré l’augmentation irréversible du rayon hydrodynamique des
+molécules au delà de la température de 50◦C. Ce résultat semble indiquer pour le eIF6 des
+conditions non dénaturantes à des températures inférieures à 50◦C. Cette limitation a été
+tenue en compte dans les mesures expérimentales, toutefois, des simulations de dynamique
+moléculaire ont été quand même réalisées afin de vérifier la présence effective d’un processus
+de dénaturation ou simplement son amorce.
+echantillons finaux Afin de pouvoir réaliser les expériences de diffusion des neu-
+trons sur aIF6 et eIF6, les deux protéines ont été préparées dans des solutions deutérées
+avec une concentration d’environ 40 mg/ml et un pD de 7.0. La concentration finale de
+ces solutions a été vérifiée avec des mesures d’absorption UV-VIS à une longueur d’onde de
+280nm. Cette mesure a donné cependant des résultats très imprécis à cause du nombre réduit
+de chromophores (qui normalement absorbent les UV à 280nm) dans les acides aminés de
+la séquence des IF6. Le manque de valeur précise a engendré des fortes limitations dans les
+mesures de diffusion des neutrons.
+0.2.2 Expériences de diffusion des neutrons
+Dans ce travail, les mesures de diffusion des neutrons ont visé les effets de la pression et de la
+température sur la dynamique des protéines. Pour les expériences de diffusion quasi-élastique
+de neutrons (QENS), ces mesures sont normalement réalisées sur des échantillons en
+solution qui sont comprimés dans des porte-échantillons de forme cylindrique. Dans le
+cas de cette étude, la grande variation de température explorée a nécessité l’utilisation de
+matériels qui ne subissent pas de changements structuraux importants à hautes températures
+qui pourraient modifier, par exemple, la résistance mécanique des porte-échantillons. En
+outre, les expériences de QENS nécessitent des solutions à très haute concentration afin de
+pouvoir bien distinguer le signal provenant des protéines de celui donné par le solvant.
+xxiv
+Ce dernier fait pose une limitation importante dans le volume total disponible pour les
+expériences sur des molécules biologiques car ces molécules ne sont normalement disponibles
+qu’en petites quantités. Dans le cas des a/eIF6, cette limitation a constitué un point
+crucial pour la mise en place de l’instrumentation nécessaire aux mesures sous haute pres-
+sion. Une description complète de la cellule pour les hautes pressions est donnée dans la thèse.
+0.2.3 Simulation de dynamique moléculaire
+Toutes les étapes de simulation de dynamique moléculaire décrites dans le texte qui suit
+ont été réalisées avec le programme AMBER9[27]. Le champ de forces utilisé est le AM-
+BER99SB [86], une mise à jour du plus connu champ de forces AMBER94, qui contient des
+paramètres permettant une meilleure différentiation des éléments de structure secondaire des
+protéines.
+Le schéma général pour la réalisation de ces simulations de dynamique moléculaire peut être
+résumé comme suit:
+1. La configuration initiale est créée à partir des données cristallographiques (codes PDB:
+1G61 pour aIF6 et 1G62 pour eIF6). Au système initial nous avons ajouté des molécules
+d’eau représentées par le modèle TIP3P et 14 contre-ions de sodium. Ces derniers ont le
+rôle de rendre nulle la charge totale du système.
+2. Le système entier est porté vers un état stable en appliquant des algorithmes de
+minimisation de l’énergie d’abord sur les seules molécules d’eau et puis sur la totalité
+du système.
+3. Le système est ensuite porté vers les conditions thermodynamiques souhaitées par
+des courtes simulations de dynamique moléculaire d’équilibration. D’abord le système
+est équilibré dans un ensemble NVT (volume et température constants) avec un pas
+d’intégration de 1fs et pour une durée de 150ps; puis il est équilibré à pression et
+température constantes (1bar et 300K) pendant 700ps.
+4. Une fois obtenue l’équilibration du système, plusieurs simulations dans différentes
+conditions de pression et de température ont été réalisées. Les coordonnées atomiques
+sont stockées toutes les 40fs et la longueur des trajectoires générées est de 2ns.
+xxv
+Dans cette démarche la régulation de la température a été réalisée avec un thermostat
+de Langevin [195] (constante de friction $3.5\ \mathrm{ps^{-1}}$) et la pression moyenne a été maintenue
+constante par un barostat de Berendsen [14] (temps de relaxation de 1.5ps).
+configuration initiale du eif6 La configuration initiale du eIF6 issue des données
+cristallographiques du Saccharomyces cerevisiae (code PDB 1G62) ne contient pas les positions
+atomiques des 21 acides aminés qui forment le fragment C-terminal, cette absence étant due
+aux clivages protéolytiques déjà mentionnés dans les paragraphes précédents. La construction
+de la structure complète du eIF6 exige des étapes supplémentaires par rapport au aIF6.
+D’abord la structure du fragment C-terminal (CTAIL, ainsi nommé par la suite) a été modélisée et
+partiellement repliée. Ensuite la structure du CTAIL a été attachée au reste de la structure
+du eIF6 et l’ensemble a été équilibré vers une configuration stable. Toutes ces étapes ont été
+réalisées par des simulations de dynamique moléculaire avec solvant implicite permettant de
+réduire considérablement les temps de calcul. Cette méthode consiste dans la substitution
+des molécules d’eau par des termes additionnels, dans le champ de forces atomique, qui
+devraient reproduire les effets du solvant sur la protéine.
+Le protocole utilisé pour la modélisation du CTAIL et pour son repliement est basé sur le
+schéma suivant:
+1. Une configuration "linéaire" du CTAIL a été d’abord créée avec la séquence des acides
+aminés montrée dans le Tableau 1
+2. Un repliement initial du CTAIL a été obtenu par une suite de simulations courtes dans
+un ensemble NVT (volume et température constants) avec un pas d’intégration entre 0.1
+et 0.5 fs. Le protocole complet de cette étape est affiché dans le tableau ?? de cette thèse.
+3. Le processus de repliement est ensuite obtenu par une simulation de 40ns de longueur.
+La structure du CTAIL partiellement repliée est montrée par la Figure 16 (voir le texte de cette
+thèse). La configuration initiale de la structure complète du eIF6 a été créée par la jonction
+entre CTAIL et le eIF6. Cette dernière opération a été effectuée par la création d’une liaison
+covalente entre l’azote N-terminal du CTAIL et le carbone C-terminal du eIF6. La structure
+ainsi obtenue a été ensuite soumise à une procédure de minimisation et d’équilibration.
+Enfin, pour obtenir une meilleure optimisation locale de la structure, nous avons réalisé
+une simulation moléculaire avec la méthode de recuit simulé. Grâce à une succession de
+simulations à très hautes températures suivies par des autres à 300K, cette méthode permet
+d’explorer l’espace des configurations des grandes molécules mieux qu’une simple procédure
+xxvi
+de minimisation de l’énergie. Dans le cas du eIF6, la structure finale issue de cette méthode (
+voir Figure 17) a une énergie potentielle légèrement inférieure à celle initiale.
+La configuration ainsi trouvée a été utilisée ensuite comme état initial pour la procédure de
+simulation moléculaire décrite au début de cette section.
+Figure 1: Structure du eIF6 issue de la procédure de simulated annealing.
+echantillons supplémentaires Afin de mieux comparer les résultats obtenus à
+partir des simulations moléculaires avec ceux issus des mesures expérimentales, d’autres
+échantillons ont été modélisés et simulés. Les résultats issus de ces simulations ont fourni
+notamment une meilleure compréhension des effets structuraux et dynamiques du CTAIL et
+de la queue de poly-histidines (H-Tag) respectivement sur eIF6 et aIF6. Les deux échantillons
+sont les suivants:
+. eIF6-NoCTAIL: le eIF6 simulé sans le CTAIL attaché. La structure cristallographique a
+été utilisée comme configuration initiale et a été soumise à la procédure de simulation
+moléculaire énoncée au début de cette section.
+. aIF6-HTag: le aIF6 est simulé avec une queue poly-histidine à l’extrémité N-terminale.
+Comme déjà expliqué dans ce texte, la présence de ce fragment additionnel a permis
+une amélioration considérable du rendement des protocoles de production des IF6. Les
+xxvii
+expériences de diffusion des neutrons sous pression ont été réalisées sur des échantillons
+contenant la H-Tag, ce qui a rendu indispensable la réalisation des simulations du même
+échantillon. La création de la structure, composée par le aIF6 et la H-Tag, a été obtenue
+avec un procédé similaire à celui utilisé pour le CTAIL.
+0.3 méthode de caractérisation de la structure secondaire des pro-
+téines
+Dans cette section, nous présentons une nouvelle méthode pour la caractérisation de la
+structure secondaire des protéines. Le développement de cette méthode, appelée ScrewFit, a
+été inspiré par la nécessité d’une analyse fine des effets de l’environnement sur les structures
+des protéines.
+Nous avons ensuite trouvé que ScrewFit est capable aussi de détecter les motifs qui carac-
+térisent la structure secondaire et de donner une évaluation des effets locaux et globaux
+résultants des interactions avec un ligand. La méthode et ses applications sont présentées
+dans cette thèse par le biais de deux articles, déjà parus ou en cours de publication dans des
+revues internationales avec comité d’évaluation :
+- Kneller, G.R. and Calligari, P. Efficient characterization of protein secondary structure in
+terms of screw motions. Acta Crystallographica D, 62(3), 302-311(2006).
+- Calligari, P. and Kneller G.R., ScrewFit: a novel approach for continuum protein secondary
+structure assessments. soumis.
+Une autre application de cette méthode, en dehors du sujet de cette thèse, est exposée ici :
+- Calligari, P. et al., Inhibition of viral group-1 and group-2 neuraminidases by oseltamivir:
+a comparative structural analysis by the ScrewFit algorithm. Biophysical Chemistry,
+accepté pour publication (2008).
+Les résumés des deux articles inclus dans la thèse sont ici traduits et une brève introduction
+de la méthode est donnée avec un exemple d’application.
+0.3.1 Efficient characterisation of protein secondary structure in terms of screw motions
+Nous présentons une méthode simple et efficace pour décrire la structure secondaire
+en termes de distances d’orientation entre plans peptidiques consécutifs et paramètres
+xxviii
+hélicoïdaux locaux. La méthode utilise des fits de superposition de plans peptidiques en
+combinaison avec le théorème de Chasles qui affirme que tout mouvement de corps rigide
+peut être décrit par un mouvement du type "mouvement de vis". Pour la superposition
+de plans peptidiques consécutifs nous avons dérivé les paramètres hélicoïdaux et utilisé
+le fit le plus mauvais pour définir une distance d’orientation. Nous avons aussi montré
+les applications de la méthode aux modèles théoriques des structures secondaires, aux
+protéines appartenant à différentes classes structurales et à la description des changements
+structuraux induits dans le lysozyme par une haute pression hydrostatique. Dans cette
+dernière application, nous avons utilisé des données déjà publiées, issues de la cristallographie
+par rayons-X et des mesures par RMN.
+0.3.2 ScrewFit: a novel approach for continuum protein secondary structure assessments
+Nous présentons ici une nouvelle méthode pour la détection des éléments de la structure
+secondaire des protéines combinant une description de la chaîne principale d’une protéine en
+terme de "mouvement de vis" (Acta Cryst. 62, 302-311 (2006)) et une approche statistique.
+L’application de cette méthode produit des intervalles de confiance qui définissent
+variations naturelles des paramètres hélicoïdaux qui décrivent la chaîne principale. Afin
+d’établir ces intervalles pour chaque motif (pattern) de structure secondaire, nous avons
+analysé plusieurs bases de données contenant des structures de protéines caractérisées par
+un profil structural bien défini. Cette méthode permet une évaluation "continue" de la
+structure secondaire d’une protéine et a été démontrée stable par rapport aux variations
+structurales, trouvées dans les données RMN, et à la résolution expérimentale des données
+cristallographiques. La comparaison avec d’autres méthodes confirme sa précision et fiabilité.
+L’exemple de l’analyse de la structure de l’inhibiteur trypsine pancréatique bovine dans
+ses trois différentes formes cristallines montre la capacité de notre méthode de détecter
+et d’analyser des petites variations structurales dans des données expérimentales très bruitées.
+0.3.3 L’algorithme ScrewFit
+Afin de décrire d’une manière simple la structure secondaire des protéines, nous avons utilisé
+l’algorithme ScrewFit, qui est basé sur la superposition optimale de structures moléculaires
+xxix
+[50, 115, 116] et sur le théorème de Chasles [33, 32].
+Nous pouvons considérer deux plans peptidiques consécutifs A et B, comme deux corps
+rigides définis par les positions des atomes {O,C,N} de chaque plan. Ces corps rigides
+peuvent être superposés en minimisant la fonction suivante:
+$m(q) = \sum_{\alpha=1}^{3} \left( D \cdot x_\alpha - x'_\alpha \right)^2$ , (0.1)
+où $\{x_\alpha\}$ et $\{x'_\alpha\}$ sont respectivement les positions atomiques de la structure de référence (les
+atomes {O,C,N} dans le plan A) et celles de la structure cible (plan B). Le symbole D dénote
+une matrice orthogonale qui décrit une rotation. Les deux ensembles des coordonnées sont
+définis par rapport à un point de référence qui est la position de l’atome de carbone de
+chaque plan {O,C,N}. En utilisant le fait qu’une matrice de rotation peut être exprimée par
+les composantes d’un quaternion normalisé $q \equiv \{q_0, q_1, q_2, q_3\}$, où $q_0^2 + q_1^2 + q_2^2 + q_3^2 = 1$ [4],
+$D(q) = \begin{pmatrix}
+q_0^2 + q_1^2 - q_2^2 - q_3^2 & 2(-q_0 q_3 + q_1 q_2) & 2(q_0 q_2 + q_1 q_3) \\
+2(q_0 q_3 + q_1 q_2) & q_0^2 + q_2^2 - q_1^2 - q_3^2 & 2(-q_0 q_1 + q_2 q_3) \\
+2(-q_0 q_2 + q_1 q_3) & 2(q_0 q_1 + q_2 q_3) & q_0^2 + q_3^2 - q_1^2 - q_2^2
+\end{pmatrix}$ , (0.2)
+la fonction (6.1) peut être minimisée par rapport à ces quatre composantes. Comme il a
+été montré dans d’autres études [50, 115, 116], la minimisation avec contraintes peut être
+transformée dans un problème de valeurs propres d’une matrice M semi-définie positive
+$M \equiv M(\{x_\alpha, x'_\alpha\})$,
+M · q = λq, (0.3)
+où les valeurs propres λj = m(qj) sont les possibles erreurs dans la superposition des
+deux plans peptidiques défini par (6.1). Le quaternion correspondant à la valeur propre la
+plus petite est la solution pour une superposition optimale et ses composantes décrivent
+l’orientation relative de $\{x'_\alpha\}$ par rapport à $\{x_\alpha\}$. La relation:
+$q \equiv \begin{pmatrix} q_0 \\ q_v \end{pmatrix} = \begin{pmatrix} \cos(\phi/2) \\ \sin(\phi/2)\, n \end{pmatrix}$ . (0.4)
+nous montre que le quaternion correspondant à la valeur propre la plus petite définit aussi un
+angle de rotation φ et un axe de rotation n, ce dernier étant aussi la direction du "mouvement
+de vis" décrit dans le théorème de Chasles. La preuve de ce dernier théorème peut être trouvée
+dans la référence [114]. La valeur propre la plus grande λmax décrit la "pire" superposition
+xxx
+possible entre les deux plans peptidiques et donne leur distance euclidienne maximale. Nous
+avons utilisé ce dernier fait pour définir une distance d’orientation unique par
+$\Delta = \sqrt{\dfrac{\sum_{\alpha=1}^{3} (x_\alpha - x'_\alpha)^2}{\lambda_{\max}}}$ . (0.5)
+Par définition $0 \le \Delta \le 1$.
+La caractérisation de la structure secondaire d’une protéine est réalisée dans cette méthode
+avec les paramètres suivants:
+1. La distance d’orientation entre deux plans consécutifs, défini par Eq. (6.5).
+2. Le rayon de la surface cylindrique sur laquelle bouge l’atome de référence (atome C)
+en réalisant le "mouvement de vis" entre deux plans peptidiques comme décrit par le
+théorème de Chasles,
+$\rho = \dfrac{|t_\perp|}{2} \sqrt{1 + \cot^2(\phi/2)}$ . (0.6)
+Ici t⊥ est la composante perpendiculaire à l’axe de rotation n du vecteur t qui relie les
+atomes C.
+3. Le paramètre de "rectitude" σ. Pour chaque résidu i ce dernier est défini comme suit:
+$\sigma_i = \mu_i^T \cdot \mu_{i+1}$ , (0.7)
+où
+$\mu_i = \dfrac{R^\perp_{i+1} - R^\perp_i}{\left| R^\perp_{i+1} - R^\perp_i \right|}$ (0.8)
+et $R^\perp_i$ est le point de l’axe hélicoïdal le plus proche de l’atome C du plan peptidique i.
+La "rectitude" donne des renseignements sur la courbure des éléments de la structure
+secondaire.
+0.3.4 Application de ScrewFit à des structures modèles
+Nous présentons ici un exemple d’application simple de la méthode ScrewFit. Il s’agit de
+structures-modèles différemment configurées et composées de 10 alanines et qui ont été
+obtenues par le Image Library of Biological Macromolecules in Jena 2 (les valeurs obtenues
+sont affichées dans le tableau 2).
+Les résultats remarquables de cette application sont:
+2 Institute-of-Molecular-Biotechnology-Jena:http://www.imb-jena.de/IMAGE.html
+xxxi
+Table 2: Paramètres hélicoïdaux de différentes structures. Ici $\rho_{C_\alpha}$ est la valeur de ρ obtenue en utilisant
+la position des atomes Cα comme référence. Les paramètres τ, pitch et h sont illustrés de
+manière approfondie dans la thèse.
+Motif ρ [nm] $\rho_{C_\alpha}$ [nm] τ pitch h σ ∆
+α-helix (R) 0.171 0.227 3.62 0.556 + 1 0.582
+α-helix (L) 0.171 0.227 3.62 0.556 − 1 0.582
+3-10 helix 0.146 0.203 3.28 0.589 + 1 0.670
+π-helix 0.178 0.258 4.16 0.558 + 1 0.471
+β-strand 0.055 0.093 2.03 0.671 − 1 0.875
+extended 0.037 0.055 2.00 0.725 − 0.754
+1. les hélices-α lévogyre et dextrogyre ont exactement les mêmes valeurs, ce qui montre
+l’efficacité mathématique de la méthode.
+2. Chaque type d’hélice peut être distingué des autres même si, en général, les valeurs des
+paramètres pour les hélices sont très similaires.
+3. La méthode permet une distinction très nette entre hélices et brins-β.
+0.4 résultats
+Nous présentons ici les principaux résultats obtenus dans ce travail de thèse soit par le
+moyen de simulations de dynamique moléculaire (MD) soit par les expériences de diffusion
+quasi-élastique des neutrons (QENS). Ces résultats seront utilisés pour déterminer les effets
+locaux et globaux des conditions environnementales sur les deux homologues du IF6. Le lien
+entre ces deux types d’effets est assuré par la complémentarité des informations obtenues par
+dynamique moléculaire et par diffusion des neutrons.
+Les conditions d’environnement appliquées dans les deux cas sont affichées dans les Tableaux
+4 et 3.
+Le nombre et la variété des mesures expérimentales ont été largement limités par des
+problèmes techniques qui seront discutés plus avant dans le texte. La comparaison entre
+données QENS et MD a été quand même possible dans un nombre restreint de cas. Pour la
+raison énoncée, les données affichées dans cette section sont issues des simulations MD sauf
+xxxii
+Table 3: Ensemble des configurations environnementales appliquées dans les simulations MD
+aIF6 eIF6 eIF6-NoCTAIL
+300K - 1bar 300K - 1bar 300K - 1bar
+300K - 250bar 320K - 1bar 300K - 500bar
+300K - 500bar 350K - 1bar 350K - 1bar
+350K - 1bar 350K - 500bar 350K - 500bar
+350K - 250bar
+350K - 500bar
+Table 4: Ensemble des configurations environnementales appliquées dans les mesures QENS
+aIF6 eIF6 aIF6-HTag
+300K - 1bar 300K - 1bar 300K - 250bar
+350K - 1bar 350K - 1bar 300K - 500bar
+350K - 250bar
+350K - 500bar
+xxxiii
+exceptions signalées.
+0.4.1 Effets de la pression et de la température sur la structure des IF6
+Les principaux effets de la température et de la pression sur les deux homologues du IF6 ont
+été caractérisés autant d’un point de vue global que local.
+Dans le premier cas, nous avons observé les changements du volume moléculaire des
+deux protéines ainsi que les changements de leurs rayons de gyration et de leurs surfaces
+accessibles au solvant. Dans le deuxième cas, une caractérisation fine des changements de la
+structure secondaire a été obtenue par l’étude des fluctuations des atomes de carbone α et
+l’analyse effectuée avec la méthode ScrewFit.
+Les principaux effets globaux trouvés sont ici résumés:
+· Les changements du volume moléculaire et du rayon de gyration montrent que le aIF6
+est moins sensible aux changements environnementaux que son homologue mésophile.
+Figures 2 et 3
+· Le rayon de gyration et la surface accessible au solvant du aIF6 affichent, aux conditions
+naturelles pour Methanococcus Jannaschii (350K -500bar), des valeurs très similaires à
+celles du eIF6 dans des conditions normales. Ce résultat semble suggérer la présence d’
+"états correspondants" entre les conditions naturelles des deux homologues.
+Les fluctuations des chaînes principales et les variations des paramètres ScrewFit montrent
+les résultats suivants:
+aIF6
+· A une haute température les régions autour du résidu 60 et comprises entre les résidus
+120 et 130 subissent des distorsions indiquant des changements d’orientation des plans
+peptidiques de la chaîne principale qui cependant n’entraînent pas de courbures de cette
+dernière. Nous avons observé que ces changements ne se produisent pas aux hautes
+pressions.
+xxxiv
+· La haute pression induit une courbure significative sur la structure principale du aIF6 dans
+la région comprise entre les résidus 90 et 95. Cet effet engendre aussi une augmentation
+des fluctuations atomiques dans la même région.
+· La combinaison de haute température et haute pression modifie les configurations des
+plans peptidiques autour du résidu 50 vers des orientations relatives plutôt hélicoïdales.
+eIF6
+· Des importantes variations dans la région 220-245 sont engendrées par les fluctuations
+du CTAIL. Comme on pouvait l’attendre, ces variations augmentent en fonction de la
+température.
+· Différentes variations dans la région 170-180 se produisent tant à haute température
+qu’à haute pression mais elles disparaissent quand la pression et la température sont
+appliquées de façon simultanée.
+· La combinaison d’une haute pression (500bar) et d’une haute température (350K) produit
+une courbure de la partie C-terminale de la longue hélice-α dans la région 35-45.
+Certains de ces effets locaux sur la structure ont été ensuite reliés aux possibles effets
+sur la fonction du IF6. En particulier, nous avons remarqué que la pression a des effets très
+importants sur la configuration des sérines 174 et 175 dans le eIF6. Ces deux derniers acides
+aminés ont un rôle essentiel dans la localisation du IF6 dans le noyau cellulaire parce que
+leur phosphorylation permet le passage du IF6 entre noyau et cytoplasme.
+La présence des états correspondants entre les deux protéines dans leurs conditions naturelles
+est ultérieurement confirmée par l’étude du facteur de structure élastique incohérent (EISF,
+voir texte de la thèse) qui donne accès aux fluctuations atomiques en fonction de l’échelle
+de longueur explorée par les mouvements internes des protéines. La figure 4 montre les
+fluctuations carrées moyennes en fonction du transfert de quantité de mouvement, q.
+Pour mieux comprendre les effets de la présence du CTAIL dans le eIF6 et celle possible de
+la H-Tag dans le aIF6, nous avons réalisé les mêmes études structurales sur eIF6-NoCTAIL et
+sur aIF6-HTag. Les résultats les plus remarquables de ces études ont été que le eIF6-NoCTAIL
+affiche des changements très similaires à ceux qui ont caractérisé le aIF6 et que l’aIF6-HTag
+montre des propriétés similaires à celles du eIF6. Ces observations suggèrent que la présence
+d’une "queue" additionnelle dans les deux structures des IF6 joue un rôle crucial dans la
+xxxv
+300K 1bar
+45.5
+300K 500bar A)
+350K 1bar
+45 350K 500bar
+44.5
+44
+43.5
+43
+42.5
+0 500 1000 1500 2000
+time [ps]
+300K 1bar
+45.5
+300K 500bar B)
+350K 1bar
+45 350K 500bar
+44.5
+44
+43.5
+43
+42.5
+0 500 1000 1500 2000
+time [ps]
+Figure 2: Variation du volume moléculaire en fonction de la pression et de la température. Panel A:
+aIF6. Panel B: eIF6.
+17 17300K 1bar
+A) 300K 500bar B)
+350K 1bar
+16.9 16.9
+350K 500bar
+16.8 16.8
+16.7 16.7
+16.6 16.6
+16.5 16.5
+300K 1bar
+16.4 16.4 300K 500bar
+350K 1bar
+350K 500bar
+16.3 16.3
+0 500 1000 1500 2000 0 500 1000 1500 2000
+time [ps] time [ps]
+Figure 3: Variation du rayon de gyration en fonction de la pression et de la température. Panel A: aIF6.
+Panel B: eIF6 (Seuls les résidus entre 1 et 224 ont été pris en compte).
+xxxvi
+Radius of gyration [A]
+Volume [Å3] Volume [Å3]
+Radius of gyration [Å]
+eIF6(1-224) 300K 1bar
+eIF6(1-224) 300K 500bar
+0.008 eIF6(1-224) 350K 1bar
+eIF6(1-224) 350K 500bar
+aIF6 300K 1bar
+aIF6 300K 500bar
+0.006 aIF6 350K 1bar
+aIF6 350K 500bar
+0.004
+0.002
+0 20 40 60 80 100
+q [nm-1]
+Figure 4: Comparaison des fluctuations atomiques du eIF6 et du aIF6.
+détermination des propriétés structurales de chaque homologue.
+0.4.2 Effets dynamiques de la pression et de la température
+Afin de caractériser les effets dynamiques d’un environnement extrême sur les IF6, les données
+issues des simulations MD et celles obtenues par mesures QENS ont été comparées. Les
+quantités "naturelles" pour l’analyse des simulations MD sont celles reliées à des fonctions
+dépendant du temps, telles que le déplacement carré moyen, ou bien aux fonctions des
+corrélations comme la fonction intermédiaire de diffusion. Les mesures expérimentales sont
+au contraire étudiées par l’analyse du facteur de structure dynamique qui est une quantité
+reliée au transfert de la quantité de mouvement et aux variations d’énergie. La fonction
+intermédiaire de diffusion et le facteur de structure dynamique d’une protéine peuvent être
+bien représentés par le modèle de dynamique Brownienne fractionnaire (fOU, dans la suite)
+[119, 20]. Ce modèle donne des temps de relaxation qui définissent la dynamique interne des
+protéines en fonction d’une échelle de longueur.
+xxxvii
+<x2>  [Å2]
+Les résultats sur les effets dynamiques de la pression et de la température peuvent être
+résumés comme suit:
+Les temps de relaxation définis par le fOU affichent des valeurs très différentes dans les
+deux protéines. En particulier, dans le cas du aIF6, ils sont systématiquement plus
+rapides que ceux du eIF6 à toutes les échelles de longueur.
+Les mêmes temps caractéristiques des deux protéines changent d’une façon différente en
+fonction de la pression et de la température. En particulier ils augmentent en fonction
+de la pression dans le cas du aIF6 et ils baissent dans le cas du eIF6.
+Ces dernières observations identifient plutôt les caractères dynamiques de chaque homo-
+logue du IF6 et de sa réponse aux changements des conditions environnementales. Cette
+dernière réponse devient par contre évidente si l’on compare les temps de relaxation de
+chaque homologue dans ses conditions "naturelles" avec ceux affichés dans des conditions
+défavorables. Les Figures 5 et 6 montrent que dans les deux homologues les conditions les
+plus défavorables produisent des changements non homogènes dans le temps de relaxation et
+que ces changements deviennent de plus en plus homogènes en se rapprochant des conditions
+"naturelles".
+1.6
+1.5
+1.4
+300K-500bar
+350K-1bar
+1.3
+350K-500bar
+1.2
+4 6 8 10 12 14 16 18
+-1
+q [nm ]
+Figure 5: Valeurs du paramètre τ issu du fit fOU de eIF6.
+Ces résultats principalement issus des simulations MD ont été aussi confirmés par les
+expériences de diffusion de neutrons. Ces dernières ont été toutefois limitées par les difficultés
+techniques suivantes:
+xxxviii
+τ/τ300K-1bar
+300K-1bar
+1.5 300K-500bar
+350K-1bar
+1.4
+1.3
+1.2
+1.1
+1
+0.9
+4 6 8 10 12 14 16 18
+-1
+q [nm ]
+Figure 6: Valeurs du paramètre τ issu du fit fOU de aIF6.
+· Le eIF6 a montré une stabilité précaire dans les configurations expérimentales utilisées dans
+ce travail
+· L’évaluation de la concentration des échantillons en solution a été très difficile à cause de
+l’absorption très limitée dans la gamme des UV-VIS tant du aIF6 que du eIF6.
+Ces deux problèmes n’ont pas rendu possible une analyse plus fine des données expéri-
+mentales. Celles-ci néanmoins ont pu être utilisées pour supporter les résultats obtenus par
+dynamique moléculaire.
+0.5 conclusions
+Dans ce travail nous avons caractérisé la réponse des deux homologues du IF6 à différentes
+conditions extrêmes. Ces réponses ont été caractérisées d’un point de vue autant structural
+que dynamique.
+L’étude structurale a montré que l’aIF6, bien que moins sensible aux changements de
+température et de pression, assume dans ses conditions "naturelles" (350K -500bar) des
+caractéristiques structurales très similaires à celles du eIF6 à température et pression ambiantes.
+Nous avons aussi distingué les effets globaux des effets locaux, qui sont très différents
+dans les deux IF6. En outre, contrairement aux attentes, les effets des deux variables thermo-
+dynamiques ne s’opposent pas les uns aux autres.
+D’un point de vue dynamique, le modèle de dynamique Brownienne fractionnaire
+nous a permis d’associer des temps caractéristiques à chaque protéine. Ces temps, qui
+xxxix
+τ/τ350K-500bar
+dépendent de l’échelle de longueur considérée, affichent des valeurs différentes dans les
+deux protéines dans des conditions environnementales diverses alors qu’ils changent
+d’une façon similaire si les protéines sont dans des conditions défavorables. Ces résul-
+tats nous ont permis d’identifier d’abord la présence des "états correspondants" des
+fluctuations structurales de chaque homologue du IF6 dans ses conditions naturelles.
+Deuxièmement ils ont rendu possible la distinction entre les propriétés dynamiques reliées à
+la structure de chaque protéine et les propriétés caractérisant l’état naturel de chaque protéine.
+xl
+Part II
+THESIS
+
+CONTENTS
+i résumé substantiel xiii
+0.1 Introduction xv
+0.1.1 Organismes adaptés aux environnements extrêmes xv
+0.1.2 L’environnement typique des fonds marins chauds xviii
+0.1.3 Le facteur d’anti-association xx
+0.2 Matériels et Méthodes xxi
+0.2.1 Production des échantillons expérimentaux xxi
+0.2.2 Expériences de diffusion des neutrons xxiv
+0.2.3 Simulation de dynamique moléculaire xxv
+0.3 Méthode de caractérisation de la structure secondaire des protéines xxviii
+0.3.1 Efficient characterisation of protein secondary structure in terms of
+screw motions xxviii
+0.3.2 ScrewFit: a novel approach for continuum protein secondary structure
+assessments xxix
+0.3.3 L’algorithme ScrewFit xxix
+0.3.4 Application de ScrewFit à des structures modèles xxxi
+0.4 Résultats xxxii
+0.4.1 Effets de la pression et de la température sur la structure des IF6 xxxiv
+0.4.2 Effets dynamiques de la pression et de la température xxxvii
+0.5 Conclusions xxxix
+ii thesis 1
+1 General Introduction 7
+1.1 Effects of pressure and temperature on proteins 8
+1.2 Organisms adapted to extreme environments 16
+1.3 The warm deep-sea environment 18
+1.4 The anti-association factor 23
+1.5 The thesis project "at a glance". 27
+2 Material and Methods 29
+2.1 Molecular Dynamics 29
+3
+4 Contents
+2.1.1 The basic principle 29
+2.2 Neutron Scattering 38
+2.2.1 Incoherent Scattering 41
+2.2.2 Spectrometers 44
+3 Experimental and Simulated Systems setup 47
+3.1 Sample production 47
+3.1.1 Protein expression and purification 47
+3.2 Neutron Scattering measurements setup 54
+3.2.1 Data analysis 58
+3.3 Molecular Dynamics setups 59
+3.3.1 System Setup 60
+3.3.2 eIF6 61
+4 Characterization of protein structure 69
+5 Efficient characterisation of protein secondary structure in terms of screw mo-
+tions 71
+5.1 Introduction 72
+5.2 Method 73
+5.2.1 Quaternion superposition fits 73
+5.2.2 Orientational distance 75
+5.2.3 Chasles’ theorem 76
+5.3 Applications 77
+5.3.1 Screw motion description of protein main chains 77
+5.3.2 Model structures 78
+5.3.3 Proteins in different fold classes 80
+5.3.4 Lysozyme under hydrostatic pressure 82
+5.4 Conclusion 87
+5.5 Mathematical Background 89
+5.5.1 Quaternions 89
+5.5.2 Helix parameters in Chasles’ theorem 90
+5.6 Notes 92
+6 ScrewFit: a novel approach for continuum protein secondary structure assess-
+ments 93
+6.1 Introduction 94
+6.2 Methods 96
+contents 5
+6.2.1 The ScrewFit algorithms 96
+6.2.2 Availability 99
+6.2.3 Databases 99
+6.3 Results and Discussion 100
+6.3.1 Evaluation of natural parameters 100
+6.3.2 Reliability and consistency of ScrewFit assignments 103
+6.3.3 Comparison with DSSPcont 107
+6.3.4 Application 109
+6.4 Conclusion 112
+6.5 Notes 113
+7 Results 115
+7.1 Effects of pressure and temperature change on IF6s structure 116
+7.1.1 Local effects 117
+7.1.2 Secondary structure changes 121
+7.1.3 Relation between local structural effects and IF6 function 124
+7.1.4 Comparison between ScrewFit profiles of eIF6 and eIF6-NoCTAIL 126
+7.1.5 Comparison between ScrewFit profiles of aIF6 and aIF6-HTag 127
+7.1.6 Elastic Incoherent Structure Factor 129
+7.2 Effects of pressure and temperature on IF6s dynamics 134
+7.2.1 Dynamical models 134
+7.2.2 Fractional Brownian Dynamics 135
+7.2.3 Analysis of scattering functions obtained from MD simulations 138
+7.3 Comparison with QENS measurements 144
+7.3.1 Ambient pressure measurements 146
+7.3.2 High pressure measurements 150
+7.4 Discussion and Conclusion 151
+8 General conclusions and Perspectives 157
+iii appendix 161
+a Buffers used for protein expression and purification 163
+b Corrections to the Stokes’ law for sphere diffusion. 165
+bibliography 167
+
+1
+GENERAL INTRODUCTION
+The last century owes the majority of its advances in science and technology to the
+investigation of the structure and dynamics of matter at the atomic and subatomic scale
+which led, among others, to a significantly better understanding of the physical and
+chemical properties of solids and liquids.
+Since the beginning of the century, the knowledge acquired about the inanimate matter led
+physicists to question how this insight could also be applied to biological matter. To
+this end, most of the principles of thermodynamics and classical mechanics were applied to
+biological systems to gain new insights into their properties, but only the advent of quantum
+theory and statistical mechanics finally allowed them to be investigated at the atomic scale.
+These new theories, along with important developments in the techniques of atomic and
+molecular spectroscopy led researchers to revise and interpret from a molecular point of
+view several results obtained in biology in the last century. 1
+Living matter presented to researchers a degree of heterogeneity and complexity that they
+had never encountered before in physics and stimulated the birth of a new interdisciplinary
+field of research which brought together physics, chemistry and biology and which revealed
+itself as a source for a large number of key results with further applications in medicine and
+biotechnology.
+The work presented in this thesis is based on the enormous progress made in the field of
+biological physics, in particular with respect to the development of computer simulation
+methods, made possible by the rapid improvements in computers, and the application of
+spectroscopic techniques to biological samples.
+As will be explained more deeply, later in the text, these two techniques can be combined in a
+unified approach in which computer simulations help to better characterize the experimental
+results at the atomic scale.
+1 As an example, it is worth citing the famous prediction by E. Schroedinger who inferred from the basic quantum
+mechanical principles, that the structure of DNA had to be that of an aperiodic lattice. His prediction was then
+confirmed years later by the crystallographic resolution of the DNA structure made by Watson and Crick.
+7
+8 general introduction
+In the following, a general introduction to this thesis work will be given assuming a basic
+knowledge of protein structure elements the explanation of which would be beyond the
+scope of this thesis. This subject is however treated in detail in a number of excellent textbooks
+[42, 187].
+1.1 effects of pressure and temperature on proteins
+In the very first efforts to investigate living matter, physicists focused on the application of
+basic principles of mechanics and thermodynamics to interpret the complexity of biological
+macromolecules [30].
+As this thesis deals essentially with the effects of temperature and pressure on proteins, the
+following sections will concentrate on this subject, giving a short presentation of the known
+effects of these two thermodynamic variables on the structure and dynamics of proteins.
+Pioneering work on the impact of pressure on proteins was performed by Regnard in 1891
+[160] and by Bridgman in 1914 [17]. The former showed that pressure below 1kbar affects
+reversibly the catalytic functions in bacteria, whereas the second proved that pressures
+above 8kbar lead to a coagulation of the protein ovalbumin. Moreover, Bridgman also noted
+that high temperature reduced the effects of high pressure on albumin, i.e. reduced the
+coagulation.
+These studies yielded the important result that two types of pressure effects have to be
+distinguished: irreversible and reversible effects depending on the magnitude of the applied
+pressure [75]. The same observations have been made concerning temperature induced
+changes [42, 189].
+When irreversible effects produced by high pressure (as well as by high temperature) are
+present, a large change in the spatial conformation affects proteins which lose their native
+structure. In these new denaturated states, proteins cannot perform their functions and
+tend to have unusual interactions with other proteins leading to large aggregates. Partially
+denaturated states (also known as molten globules) can be included among the reversible
+effects because when pressure or temperature are brought back to their original values
+proteins fold back in their native configuration [42].
+Several more recent works [143, 219, 169, 99], showed also that : i) proteins do not all have
+the same characteristic threshold for denaturing pressures: it depends on their size and shape;
+ii) denaturing caused by high temperature is often very different from denaturing caused by
+1.1 effects of pressure and temperature on proteins 9
+freezing or by high pressure.
+In summary, these results, which will be discussed in the following, show that high
+temperature and high pressure have similar effects on protein stability but they appear to
+be competitive when applied together. Moreover, the structural changes of proteins due to
+external pressure are much less homogenous than those induced by temperature changes.
+le chatelier’s principle A useful theoretical framework for the comprehension of
+how biomolecules respond to changes in thermodynamic conditions is given by the criteria
+for the stability of thermodynamic systems and by Le Chatelier’s principle[126]. The latter
+states that at equilibrium, a system tends to minimize the effect of any external factor by
+which it is perturbed. As briefly shown in the following, Le Chatelier’s principle gives the
+physical interpretation of the stability criteria for the thermodynamical potentials which
+describe the macroscopic states of the system. Indeed these criteria reflect those demanded
+for the intrinsic stability of the thermodynamic system itself. For an equilibrium process
+connecting two states A and B, the general expression for the variation of Gibbs free energy,
+G(T,P,N) reads as follows:
+$\Delta G = V \Delta P - S \Delta T + \sum_i \mu_i \, \Delta N_i$ (1.1)
+where ∆Ni, ∆P and ∆T are, respectively, the variation in number of particles of type i and
+the change in pressure and temperature. In the case of the Gibbs free energy, the stability
+criteria lead to the condition that the function G(T,P,N) be concave with respect to variables T
+and P and convex with respect to Ni [21]. From a mathematical point of view, this means that
+the second order derivatives of the function G(T,P,N) with respect to T and P must be negative.
+These conditions can be rewritten with respect to the natural thermodynamic variables by
+means of the Maxwell relations:
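+$\left( \dfrac{\partial^2 G}{\partial P^2} \right)_T = \left( \dfrac{\partial V}{\partial P} \right)_T \le 0$ (1.2)
+$\left( \dfrac{\partial^2 G}{\partial T^2} \right)_P = -\left( \dfrac{\partial S}{\partial T} \right)_P \le 0$ (1.3)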
+As a consequence, an increase in pressure on a system favors a reduction of its conjugated
+extensive variable, the volume. Hence, in general, pressure favors all processes that are
+10 general introduction
+accompanied by negative volume changes.
+In the case of proteins, which usually have compact and tightly packed structures, three
+different types of volumes can be distinguished: the volume of atoms, the void volume due to
+imperfect packing of atoms which leave small cavities at the interior of molecular structures
+and the volume variations which result from the degree of solvation of peptide bonds and
+amino acid residues. All these components influence both the atomic fluctuations and the
+weak intramolecular interactions (i.e. those not involving covalent bonds) which govern the
+transition between its various conformations.
+Besides giving a general framework for the understanding of the effects of pressure on
+proteins, the Le Chatelier principle also introduces a first explanation of the antagonistic
+relation between temperature and pressure. The principle states in fact that perturbations
+on a system directly induce processes that attenuate the perturbations themselves but its
+response also induces indirectly other processes that reduce the initial perturbation. A
+phenomenological demonstration of this extension of the principle, which is usually called
+the Le Chatelier-Braun principle, can be found in references [21, 161].
+From a molecular point of view, the antagonism between the two variables can be inter-
+preted by the microscopic ordering principle, which states that an increase in pressure at
+constant temperature leads to a decrease in the entropy of the system, which corresponds to
+an increase in the ordering of molecules in the system itself.
+This is a general property of molecular systems but it has also a strict sense for protein stability
+as proven by Brandts et al. [16] and Hawley [72] who showed that the pressure-temperature
+phase diagram which determines the transition between functional and denaturated states
+of proteins has elliptic boundaries, meaning that there exist several combinations of the P,T
+variables which are compatible with the stability criteria. This peculiar behavior has been
+ascribed to the exposure of hydrophobic groups to the solvent when the protein folds. It is
+worth noting that this behavior is found neither in nucleic acids [73] nor in lipids [47]. The
+elliptic phase boundaries, which are also found in liquid crystals, seem to be produced by a
+fine balance between aromatic and aliphatic parts of molecules.
+effects of pressure on intermolecular interactions The stability of
+biomolecules results from a cooperation of interactions involving its components and the
+external environment [93]. In the case of proteins, once the primary structure is formed
+1.1 effects of pressure and temperature on proteins 11
+by the peptide bonds, the interactions that play a significant role in this cooperation are
+essentially weak [94].
+The electronic structure of atoms and the covalent bonds are directly modified by
+pressure only for values greater than 30kbar [51] and 15kbar [67, 144], respectively, but their
+compression is negligible [62]. Their breaking is responsible for big changes in free volume
+and leads to a totally irreversible protein denaturation. The formation of covalent bonds has a
+$\Delta V = -10\ \mathrm{ml \cdot mol^{-1}}$, whereas ∆V values for the changes in bonds or bond angle changes are
+nearly zero [200]. Besides the peptide bonds that form the primary structure of proteins, the
+only type of covalent bond which plays a significant role in protein stability is the interchain
+disulphide bonds formed by non-contiguous cysteine residues [43].
+In contrast to covalent bonds, weak non-bonding interactions give a large contribution to
+the observed ∆V due to pressure changes.
+Ionic interactions Ion pairs in proteins cause attractive, short-range interactions that occur
+between negatively and positively-charged amino-acid side chains over a distance of 4 Å[42].
+The role of ion pairs in proteins is to stabilize the tertiary [76] and quaternary structure.
+For example, interprotein salt bridges provide a mechanism for solvent exclusion from the
+interfacial domain of the cytochrome b5-cytochrome c complex, in addition to maintaining
+the stability and specificity of the complex formed [165].
+When an ion is formed in solution, the nearby water dipoles are compressed by the
+Coulombic field of the ion; this phenomenon, which is accompanied by a volume decrease, is
+usually called electrostriction. Because of this volume contraction, pressure is expected to favor
+the disruption of ion pairs but Michels et al. [139] have shown that this should be eliminated
+by high temperature due to the disruption of the highly ordered structure of electrostricted
+water.
+The solvation of ions in water produces a $\Delta V = -10\ \mathrm{ml \cdot mol^{-1}}$ whereas the dissociation of
+a neutral molecule into ions induces a volume contraction of about $-20\ \mathrm{ml \cdot mol^{-1}}$. These
+facts confirm that electrostriction is favored by pressure but does not give insights into the
+effect on protein stability. Indeed, this phenomenon can have opposite results depending
+on the structural effects it produces locally: it can induce denaturation like in the case of
+chymotrypsin where pressure produces the dissociation of a salt-bridge in the active site
+region bringing the protein reversibly to an inactive state[77]; on the other hand, it can also
+engender an increase in protein stability if there are weak intersubunit ion-pair interactions
+12 general introduction
+not exposed to solvent, which may be strengthened by pressure.
+Hydrogen bonds Studies on simple model molecules showed that hydrogen bonds are
+stabilized by high pressures up to 4kbar [105, 200]. This results from the smaller inter-atomic
+distances in the hydrogen-bonded atoms. The stabilizing effect of pressure on hydrogen
+bonding in proteins was first detected by the pressure dependence of the infrared spectra of
+the α-helix in myoglobin[127] and from a comparison of the effect on the intermolecular
+interactions in hydrogen-bonded versus non-hydrogen-bonded amides[65]. In particular
+hydrogen bonds play a fundamental role in the formation of the secondary structure due to
+their role in creating the α-helix and β-strand motifs.
+It is also worth noting that pressure may promote intermolecular hydrogen bonds at the
+expense of intramolecular hydrogen bonds, causing increased conformational fluctuations
+[38]. However, a very small if not negligible ∆V value is observed for processes in which
+there is an exchange between the existing hydrogen bonds [200, 24].
+Hydrophobic interactions In general hydrophobic interactions describe the tendencies
+of hydrocarbons to form aggregates in the presence of aqueous media. In proteins, they
+direct non-polar side chains to the interior of proteins and are a major driving force for
+proper folding [110]. In 1959, Kauzmann [109] suggested that the volume changes for the
+association of hydrophobic molecules in water should be positive. His hypothesis was based
+on the observations made on the large entropic effects of the transfer of hydrocarbons from a
+nonpolar solvent to water. Weber et al [207], on the other hand, showed that the association
+of aromatic molecules is enhanced by pressure and later Van Eldik et al.[200] confirmed
+that interactions that pack aromatic rings parallel to each other engender negative volume
+changes. These results give account of two different hydrophobic effects, one related to the
+solubility of apolar molecules into water and another one which concerns the solvent-induced
+interaction between apolar species.
+The former class of hydrophobic effects was initially considered as a good model (called
+oil-drop model)[7] for protein folding as it was confirmed by works on thermal denaturation
+but could not be confirmed by the pressure effects on protein unfolding because the volume
+change upon unfolding is positive at low pressures but negative at pressures of about 1-2
+kbar. The transfer of hydrocarbons into water shows exactly the opposite behavior, with ∆V
+being negative at low pressures and positive at high pressures[110].
+1.1 effects of pressure and temperature on proteins 13
+The major role in pressure effects in protein denaturation is commonly attributed to the
+hydration of hydrophobic cores. Indeed, the presence of solvent around the proteins gives a
+significant importance to the cavities created by the imperfect packing of protein structure.
+Solvents, and in particular water, can often enter these void volume areas and come into
+contact with inner regions, destabilizing the hydrophilic/hydrophobic equilibrium which
+maintained the protein’s stability. Due to its higher compressibility compared to proteins,
+water under pressure can also assume local ordering that can easily cause an important
+increase in the density of hydrogen bond acceptors/donors, which in turn enhance the
+hydrophilic properties of those amino acids that are able to produce hydrogen bonds [213].
+Although several works confirmed this essential role of hydrophobic interactions, discrepan-
+cies in experimental [74, 139, 138] and theoretical [87] results on how their role in protein
+folding/unfolding is accomplished, have not yet allowed the acceptance of the ’oil-drop’
+model as a common framework for the interpretation of the different physico-chemical
+contributions to the related volume variations [168].
+It is worth noting here the work by Hummer et al. [87] which proposed a different role of
+hydrophobic interactions in temperature and pressure-induced denaturations. They suggested
+that pressure denaturation corresponds to the infiltration of water into the protein, whereas
+heat denaturation corresponds to the transfer of nonpolar side-chain groups into water. As a
+consequence, pressure denaturation processes lead to (partially or totally) unfolded protein
+structures with reduced compactness which are, however, considerably more ordered than
+those in heat-denatured proteins, as probed by NMR experiments of hydrogen exchange
+[218].
+In the context of hydrophobic interactions, it is well established that a significant contribution
+is made by the van der Waals (VDW) forces [153, 187, 42]. The effects of pressure on VDW
+forces present the same contradictory results as hydrophobic interactions in general, which
+does not permit a simple framework to be defined for their physical interpretation. From a
+general point of view, VDW forces are likely to be enhanced by pressure since they tend to
+maximize the packing density of proteins and thus reduce the volume. Indeed, packing density
+is maximized by VDW interactions because the dipole moment attractions they produce
+improve the packing of the hydrophobic core [67, 95]. On the other hand, VDW forces can
+also contribute to protein destabilization under pressure. In particular for oligomeric proteins,
+pressure below 3 kbar promotes the replacement of some weak non-covalent interactions
+between amino acid residues with amino acid-water interactions causing changes in peptide
+14 general introduction
+chain conformations and resulting in dissociation [180]. These protein-water interactions are
+promoted by pressure because they produce stronger and shorter bonds that decrease the
+overall volume [144, 180].
+Compressibility The atomic density in proteins is similar to that in solids and can
+even exceed the latter locally [87] which makes proteins very insensitive to compression.
+Most of the data available on protein compressibility are obtained by sound velocimetry
+measurements and the volume change usually observed is around 1% of the protein’s total
+volume[60]. Such a small volumetric variation is induced only by the weak interactions we
+presented earlier in this section and does not receive any contribution from covalent bonds
+in the protein backbone [206]. The major effect is due to the hydrophobic interactions: the
+higher the hydrophobic content is in a protein, the more the latter is compressible [180].
+A significant role in compressibility is played by the effects of pressure on the hydration. In
+particular, as stated in the previous paragraph, the infiltration of water molecules into void
+cavities produces a significant change in the local atomic fluctuations which results in the
+destabilization of the hydrophilic/hydrophobic equilibrium of the protein. In general the
+cavities filled by the solvent can act as two-ways-valves or one-way-valves, depending on the
+local molecular environment in the protein [133], i.e. they can form volumes that solvent
+molecules can continuously enter or leave or they can instead incorporate water molecules,
+separating them from the bulk solvent. These two types of behavior engender differences in
+compressibility of cavities and in the whole protein structure [39].
+In contrast to temperature, pressure does not seem to have a uniform effect all over the
+protein [61]. A molecular simulation study by Paci and Marchi [148] proved that short
+distances are rather less compressed than longer ones. This was also confirmed by x-ray
+experiments performed by Kundrot et al. [121] which showed that side-chains in lysozyme
+have a larger response to pressure than backbone.
+The physical origin of this heterogeneity in structural response to pressure has been explained
+by a phenomenological model of non-covalent interactions where each pairwise interaction
+in the protein’s native structure was replaced by an effective harmonic force with a distance
+dependent force constant. Interestingly the short-ranged interactions were characterized by
+effective force constants larger than long-ranged ones [82, 80], meaning that the former are
+stronger and less compressible than the latter.
+1.1 effects of pressure and temperature on proteins 15
+pressure impact on protein structure levels To summarize, we can conclude
+from the previous section that a protein’s reaction to pressure increase is often due to
+a complex balancing of opposite effects which tend to combine differently at different
+pressures. The effects on the interactions that determine the internal protein structure, have
+consequences on all the levels of structural organization (i.e. on secondary, tertiary and
+quaternary structures). In the following, we report schematically these repercussions on each
+level with reference to the experimental techniques which were used to detect them.
+Quaternary structure is mainly maintained by hydrophobic interactions and for this rea-
+son it is the most sensitive to pressure. As mentioned in the previous section, moderate
+pressure below 1.5kbar favours dissociation of oligomeric proteins [180] which results in
+very large and negative volume changes. Sometimes pressure-induced dissociation leads
+to formation of individual non-denatured subunits, as in the case of tryptophan syn-
+thase at 1.5kbar[149], but more frequently it is followed by subsequent conformational
+changes in individual subunits[150]. When quaternary structure is maintained by either
+pressure-insensitive interactions like hydrogen-bonds or by pressure-enhanced interactions
+like aromatic clustering (due to hydrophobic interaction), dissociation can appear also at
+pressures higher than 3kbar [132].
+Pressure effects on quaternary structure are usually investigated by electrophoresis, ultracen-
+trifugation [152], fluorescence spectroscopy[180] and NMR spectroscopy[100].
+Tertiary structure can be irreversibly changed by pressures above 2kbar. However, some-
+times reversible denaturation can be found also at pressure between 4 and 8kbar[171]. This
+shows that the volume changes are not completely dominated by hydrophobic interactions
+but that other types of weak interactions can also play an important role. An important feature
+of pressure denaturation is the formation of a molten globule in which proteins, even though
+retaining their intact secondary structure, change their tertiary structure adopting conforma-
+tions with hydrodynamic radii 10-20% higher than that of the native state[154]. For the studies
+of the tertiary structure changes induced by pressure, the more frequently used methods are
+NMR spectroscopy, X-ray, UV-visible and fluorescence spectroscopy[121, 180, 100].
+Secondary structure undergoes significant changes at very high pressure, above 3-7kbar.
+These changes, in contrast to those that affect tertiary structure, always result in non-reversible
+protein denaturation. Indeed, such pressures induce a high compression of protein
+structure resulting in the rupture of hydrogen bonds, which play a major role in the
+16 general introduction
+formation of secondary elements like α-helices and β-sheets [211]. As regards the secondary
+structure, one of the most suitable methods to detect changes is Fourier transform infrared
+(FTIR) spectroscopy which gives insights into the protein vibrational spectra where the band
+corresponding to the vibration of C=O bond of the amide group is easily detectable. The latter
+is very sensitive to the conformation of the polypeptide. Another technique frequently used
+to detect changes in secondary structure is circular dichroism (CD) spectroscopy which can
+rapidly give the percentage of α-helices, β-strands and random-coil in a protein solution [196].
+The fact that every pressure range affects roughly only one structure level makes this
+physical variable a rather better tool to investigate protein structure stability than any other
+perturbation like temperature or pH changes.
+1.2 organisms adapted to extreme environments
+Organisms are integrated entities, not collections of discrete objects 2
+While in the previous section the general effects of pressure and temperature on
+proteins were presented, here I want to focus on the particular aspect of the chemical and
+physical properties of proteins from organisms which live under extreme conditions. More
+precisely, a special case of extreme environment, the warm deep-sea, in which both high
+pressure and high temperature can be found, will be presented. Furthermore, inspired
+by the phrase that opens this section, I want to point out the fact that the study of
+protein molecular adaptation to extreme environments could be highly improved by
+the knowledge of the framework of the whole-cell adaptation. Although this section is
+intended to be an introduction to the subject of the biology of extreme environments, it is
+inevitably incomplete and mainly reflects the personal view and interests of the author. Many
+more aspects are described in a number of excellent reviews [85, 93, 182, 158, 107, 151, 191, 58].
+The biosphere, i.e. the surface of the earth known to host life, ranges from the abyssal
+region of the deep sea to the heights of the Himalaya and shows a wide range of examples of
+adaptation to ’extreme’ environments. From a quantitative point of view, the physical limits to
+life known today are the following3[92]:
+2 From The spandrels of San Marco and the Panglossian paradigm: a critique of the adaptationist programme, S.J. Gould and
+R.C. Lewontin, Proc. Royal Soc. London B, 205, 581-598, (1979).
+3 As a reference: the critical point of water is at 374◦C and 2.2kbar
+1.2 organisms adapted to extreme environments 17
+• −40◦C < T < 115◦C
+• P < 1.2kbar
+• ∼ 1 < pH < 11
+In the previous section we have discussed the effects of pressure on protein structure;
+here we want to recall some critical effects of temperature on biological chemistry: i) at 100
+◦C thermal degradation outruns biosynthesis[92, 95]; ii) at 110-140 ◦C hydrophobic hydration
+effects in protein vanish [92]; iii) and at 150 ◦C amino acids start to fall apart [141, 140].
+These are obviously the extreme boundaries that do not permit life to develop but their
+knowledge is useful to understand the increasing effects that organisms have to face when
+approaching these limits. From an evolutionary point of view, this means that organisms
+should have to find a way to compensate for these effects. Hence, organisms which became
+extremophiles [167] found some mechanisms to protect themselves against the chemical and
+physical damages induced by the environment.
+Little is known on how this is accomplished[90, 49] but presumably two parallel strategies
+are followed: the first one is the compensation of degrading processes made through a tuning
+of the synthesis rate of biomolecules that would be compatible with the average lifetime
+of the molecules [92]; the second one is the incorporation of point mutations in protein
+sequences in order to increase their structural stability, resulting in a longer lifetime and thus
+a longer time of functioning[93].
+Nevertheless, this strategy adopted in molecular adaptation does not seem to engender
+significant differences between the global distribution of amino acids in mesophile proteins,
+i.e. obtained from ’normal’ organisms, as compared to the extremophile ones. Deckert et
+al. showed, for example, that the distribution of amino acids contents in mesophilic and
+thermophilic proteomes, even though not identical, do not present any significant differences
+that could lead to a simple method to distinguish them [48].
+As a consequence, adaptation of biomolecules seems to be related exclusively to dif-
+ferent local patterns in amino acids sequences resulting in a reorganization of the weak
+non-covalent interactions that govern protein stability and flexibility[147, 94]. The new deal
+for the stability of extremophile proteins is thus played by the re-organization of mechanisms
+that are, as we have seen in the previous paragraphs, sensitive to environmental changes;
+they are for example: increased number of hydrogen bonds, salt bridges, improved core
+18 general introduction
+packing, shorter and/or tighter surface loops, enhanced secondary structure propensities, or
+oligomerization[134, 135, 136].
+From a physical point of view, a first quantitative experimental measure of protein stability
+can be made by means of differences in the Gibbs free energy, $\Delta G(T,P,N)$, between the more
+stable global minimum and its nearest minima. Jaenicke and Böhm [96] showed that mesophile
+and extremophile proteins share $\Delta G$ values of the same order of magnitude ($\sim 50\,\mathrm{kJ\,mol^{-1}}$) even
+though extremophiles may show a variability in the range $10$–$100\,\mathrm{kJ\,mol^{-1}}$. The difference
+between the typical values for mesophilic proteins and the variation found in extremophilic
+ones corresponds to the energy of a few non-covalent interactions and confirms the significant
+role the latter play in molecular adaptation[157, 147, 151, 158].
+The central issue in the adaptation of biomolecules remains, however, the conservation
+of biological functionality which means a well-balanced compromise between stability
+and flexibility[197, 92]. Hence, the process of adaptation has to translate the properties
+of mesophilic proteins toward the relative extreme conditions which means towards physio-
+logical conditions that make molecular properties of extremophilic counterparts very similar
+[93]. This translation is performed by a re-organization of non-covalent interactions. Several
+experiments have provided evidence for this process [217] and showed that dynamical prop-
+erties of some mesophilic enzymes at temperature of 25◦C are very similar to those of their
+extremophilic homologues at 70◦C. Analogous results were obtained on rubredoxin by a
+molecular dynamics study [69].
+In this context Jaenicke [93] proposed that molecular adaptation to extreme environments
+should tend to maintain corresponding states between respective native environments, which
+take into account overall topology, flexibility and hydration of proteins. Even though this idea
+found confirmation by experiments in the past, recent works seem to not entirely confirm it
+[158].
+1.3 the warm deep-sea environment
+In contrast to common opinion, terrestrial environments, where the ambient pressure is 1bar,
+occupy only 1% of the total volume of the biosphere. A large fraction of the earth’s surface
+(70%) is covered by oceans which have an average depth of 3800 meters and thus an average
+ambient pressure of 380 bar4. More than 60% of the marine component of the biosphere is
+4 Hydrostatic pressure increases at a rate of 10.5kPa per meter depth, compared with 22.6kPa per meter for
+lithostatic pressure.
+1.3 the warm deep-sea environment 19
+below 1000m 5. Life below this depth, which is usually defined as the upper boundary of
+the "deep sea", has to face several unfavourable conditions such as high pressure (from 1 to
+1.1kbar) or temperature (from 1 to 110◦C) 6 which have a strong impact on life mechanisms.
+After the pioneering studies of Certes in 1884 [30, 29] which helped to establish the
+existence of microorganisms in deep sea sediments, the first systematic studies of ZoBell and
+Johnson[220], gave birth in 1949 to a new research line which helped, during the last
+century, to better understand the survival strategies employed by organisms to face extreme
+conditions.
+It allowed for example to elucidate the different adaptation to pressure in several groups
+of microorganisms which can be divided into two distinct groups: barophiles (or piezophiles)
+which are micro-organisms that possess optimal growth rates at pressures above atmospheric
+pressure, whereas barotolerant (or piezotolerant) microorganisms are capable of growth at
+high pressure, as well as at atmospheric pressure, but can be distinguished from piezophiles
+because they do not have optimal growth rates at pressures above one atmosphere.
+Both groups of microorganisms can also be distinguished from piezosensitive ones, whose
+growth is sensitive to elevated pressure, because they can grow at 50 MPa at a rate that
+is above 30% of their growth rate at atmospheric pressure [107, 108]. Moreover, from a
+molecular point of view, barotolerant organisms differentiate themselves from normal
+piezosensitive ones by the production of some "pressure-shock" proteins induced as a response to
+high pressure environment [97]. These proteins have some equivalents in the "heat-shock"
+proteins found in organisms which undergo thermal stress [67, 174] but their mechanism is
+far from being completely understood.
+In the late 1970s, the first colonies of "deep-sea" organisms were found also near the hydrothermal
+vents[8]. The latter are warm currents which form where freshly extruded lava contracts
+upon cooling and allows seawater to penetrate in the newly formed crust of basaltic rocks.
+Seawater is then expulsed, highly enriched in heavy metals, creating hot vents which
+significantly change the temperature in the nearby area [98].
+Obviously the life of organisms near hydrothermal vents became very rapidly the most
+intriguing subject in the deep-sea biology and de facto most of the barophilic organisms
+known today are also thermophilic which means that they have been proven to also have
+greater growth rates at high temperatures (typically from 50 to 90◦C) than at usual deep-sea
+5 The greatest depth in oceans, in the Mariana Trench is near 11000 meters whereas the deepest floor found in
+freshwaters is at 1632 meters in the Lake Baikal
+6 From a biochemical point of view it is worth noting, for example, that both light and photosynthesis are available
+only until 300 meters of depth
+20 general introduction
+temperatures ( around 2◦C) [1].
+This environment, usually called the warm deep-sea, introduced several interesting ques-
+tions from a biological and evolutionary point of view which demanded also new explanation
+from biochemistry and physics.
+pathways of adaptation to warm deep-sea environments Before focusing on
+some aspects of the molecular adaptation of proteins to this environment, here some well
+known facts about the whole-cell adaptation are reported schematically, for they play a
+fundamental role in defining the general framework in which all molecular results should be
+interpreted. The main features of biological adaptation to high hydrostatic pressure are[182]:
+Adaptation to pressure allows deep-living species to thrive under high pressure but it
+can also reduce their ability to live at moderate depths. This means that deep-living
+species are usually barophilic and not barotolerants[179].
+Common patterns of adaptation appear in widely different types of deep-sea
+organisms[179].
+Most of the physiological and biochemical processes which are in general found to
+be pressure-sensitive in normal organisms, are rather stable under high pressure in
+deep-living ones and exhibit, at in situ temperatures and pressures, values similar to
+those found in terrestrial or shallow-living organisms at 1bar pressure[41, 44].
+Species living in deep sea hydrothermal vents show that adaptation to both temperature
+and pressure are essential for cellular growth and physiological function. This means
+that adaptation to high pressure does not pre-adapt organisms from cold deep sea to the
+environment typical of the hydrothermal vents[182, 45].
+While the first three points seem to confirm the idea of the existence of corresponding states
+between mesophilic and extremophilic organisms, the last point reveals the fundamental
+interplay of pressure and temperature in warm deep-sea environments. This means, however,
+that evolution has to cope with complex superpositions of parameters which are difficult to
+separate and renders impossible the definition of strategies of molecular adaptation.
+1.3 the warm deep-sea environment 21
+In an extremely simplified view, the complex mechanism which governs the life of a cell
+can be schematically divided in two parts: protein synthesis, which furnishes all the "tools"
+(the proteins) necessary for the cell machinery to work; and cellular metabolism, which
+includes all the processes that constitute the cellular life itself.
+Following this scheme, we present the principal properties of protein adaptation to a warm
+deep-sea environment, focusing on proteins that participate in the cellular metabolism and
+those which have a role in other protein synthesis.
+Enzymes, by their role as catalysts and regulators of metabolism, are the mediators by
+which living systems function and reproduce. Somero et al [183] proposed that the successful
+adaptation of an organism entering the deep sea would require the maintenance of the
+same balance of enzyme synthesis, catalytic activity, and regulation as its surface-living
+counterparts. Indeed, from several studies of enzymatic functions of deep-living organisms, a
+few convergent common properties were found [130, 98]: i) the preservation of an enzyme’s
+capacity to bind substrates under deep-sea conditions is essential in adapting metabolism
+to that environment; ii) structural changes induced at pressures as low as 50-100 bar may
+modify enzyme function sufficiently to induce evolutional selection for pressure insensitivity;
+and finally iii) the capacity of an enzyme to function independently of pressure is acquired at
+the cost of a reduction in catalytic efficiency.
+Furthermore, in the context of the combined adaptation to temperature and pressure, it is
+worth noting that for several hydrogenase enzymes from widely different warm deep-sea
+organisms, pressure was found to significantly increase their thermal stability [45, 188]. This
+type of enzyme undergoes large conformational change and hydration during its activity and
+this makes them particularly well suited for investigating the effects of pressure.
+In general for deep-sea organisms from the hydrothermal vents, the stabilization of catalytic
+proteins was often found as the result of some point mutations in primary sequences
+whose outcome could either be the increase of the size of the hydrophobic core and
+its compactness (essentially substitutions with hydrophobic amino acids with larger
+side-chains), the augmentation of hydrogen bonds (substituting lysines with arginines) or
+the reduction/deletion of amino acids with side-chains sensitive to high temperatures
+(asparagines, glutamines, cysteines and tryptophans) [142].
+Protein synthesis is ideally divided into two steps: transcription, in which the genetic code
+is copied from DNA to a RNA messenger (mRNA); and translation where peptides are bound
+22 general introduction
+together with the help of ribosomes and where genetic code in mRNA is decoded into amino
+acid sequences. Both processes are found to be highly sensitive to pressure [124].
+Early studies investigating the effects of pressure on E. coli revealed that an essentially
+complete cessation of protein synthesis occurred at growth-inhibiting pressures of 680 atm
+[67]. Subsequent comparison of protein synthesis of E. coli and known barotolerant organisms
+permitted the barotolerance properties to be associated to the activity of ribosome [124] and
+in particular to its 30S subunit [125].
+Indeed, ribosomes are made of two subunits (a smaller and a larger one) which are capable
+of associating and dissociating. As we will discuss later in the text, this phenomenon is
+important because the initiation of protein synthesis requires free ribosomal subunits in order
+to allow the formation of a complex containing the mRNA anchored to the small subunit
+before the joining of the large subunit. The ribosome’s subunit association is known to be a
+rate-limiting process in the protein synthesis [162] and was found to be inhibited at elevated
+hydrostatic pressures in mesophilic organisms [185].
+This effect was previously discussed as a possible reason for the inhibition of protein synthesis
+and, hence, of cell growth by hydrostatic pressure [91] but later more sophisticated in vitro
+studies showed that ribosomal complexes retain their "associated" state over the whole range
+of biologically relevant pressures [68]. Other studies on ribosomes from mesophilic organisms
+showed that association can be regulated also by temperature which usually enhances the
+association equilibrium towards the associated species[83, 184]. Interestingly, these results
+show that under estimated physiological conditions in several eukaryotes, ribosomes are
+present almost exclusively in their associated form. The cell must therefore possess some
+mechanisms for maintaining a pool of free ribosomal subunits. These mechanisms have to
+account for protein synthesis inhibition under extreme conditions. Unfortunately, very little
+is known about the differences between the protein synthesis machinery of extremophiles
+and mesophiles.
+methanococcus jannaschii This thesis will focus on a protein produced by an
+archaeon7 microbe living near the hydrothermal vents, Methanococcus jannaschii. This
+organism, discovered in 1963 as a "methane-producer" [102], usually lives at temperatures
+ranging from 48 to 94 ◦C with an optimum temperature at 85◦C and at pressures of more
+than 200 bar (in situ depth 2600 meters).
+7 The archaea are known as a primitive form of life significantly different from both prokaryotes and eukaryotes.
+For this reason they are often referred to as the third domain of life.
+1.4 the anti-association factor 23
+M. jannaschii’s genome was the first archaeon genome to be completely sequenced [18]
+and revealed the complex evolutionary relationships between archaea and eukaryotes and
+bacteria: less than half of the genes found in its genome could be matched to those
+of other organisms. In the context of this thesis work, from a molecular biology point of
+view, the most interesting feature of this organism is that while sharing the same protein
+biosynthesis machinery (both transcription and translation) as eukaryotes, it does also have
+genes homologous to both eukaryotes and bacteria for the initiation part of the translation
+process. The latter is a fundamental and rate-limiting part of the translation and will be
+discussed more deeply in the next section.
+It has been shown that M. jannaschii’s metabolism and growth at high temperatures are
+enhanced by pressure up to 750 bar whereas the upper limit for growth is 90◦C either
+under low or high pressure [102]. These results suggested that M. jannaschii is effectively a
+barophilic organism and not just barotolerant. The finding seemed to be confirmed by studies
+on enzymatic reaction: it was shown that application of 500 bar increased the thermal half-life
+of hydrogenase from M. jannaschii 4.8-fold at 90 ◦C [74] and increased the half-life of a
+protease from the same organism 2.7-fold at 125 ◦C [138]. Nevertheless, recent works showed
+that pressure inhibits the 20S proteasome function from M. jannaschii [55], suggesting that in
+some cases lower protein activity at the in situ pressure could be a regulatory mechanism
+that confers some advantage to the whole cell. Hence, a more complex behaviour of the cell
+response to high pressure and high temperature should be envisaged.
+1.4 the anti-association factor
+In the following we want to give a short introduction to the protein studied in this thesis,
+which is called the Anti-Association Factor[170, 199]. A complete description of the molecular
+biology background which is necessary to introduce the function of this protein, would
+be largely out of the scope of this thesis and we limit our discussion to the essential key points.
+The anti-association factor belongs to the family of initiation factors and is usually also
+called initiation factor 6. In the following, in order to maintain a coherence with the cited most
+recent bibliographic references, I will call it by the short name IF6 sometimes preceded by a
+prefix indicating the domain of life from which it comes: eIF6, for eukaryotic initiation factor
+24 general introduction
+6, pIF6 for its prokaryotic counterpart and aIF6 for the archaeon one.
+IF6, like the other initiation factors, takes part in the first steps of the translation process.
+Translation initiation can be subdivided into three steps: first, binding of the specific initiator
+Met-tRNA to the small ribosomal subunit; second, binding of the resulting complex to a
+mRNA and locating the initiation codon; and third, joining of the large ribosomal subunit
+to generate a translation competent ribosome. All these steps are facilitated by soluble
+proteins termed translation initiation factors, and the structures of many of them have been
+characterized at the atomic level. It is worth noting that while the essential part of this process
+is shared by both prokaryotes and eukaryotes, the process itself is decidedly more complex
+in eukaryotes than in prokaryotes and in part reflects the fact that much of the regulation in
+prokaryotes is via the coupling of transcription and translation. Such coupling is not possible
+in eukaryotes as transcription occurs in the nucleus while translation occurs in the cytoplasm.
+The eukaryotic initiation factors can be divided into two groups: those that bind and
+operate on ribosomal particles promoting subunit dissociation and association, initiator
+Met-tRNA binding, and mRNA binding; and those that are aimed at mRNA and engaged in
+preparing its upstream region for initiation. The first group contains the factors analogous to
+prokaryotic pIF1, pIF2 and pIF3, namely eIF1 ( and eIF1A), eIF2 and eIF3 respectively, as
+well as several additional factors, such as eIF2B, eIF5 and eIF6. The second group seems to
+have no analogs in prokaryotes and includes special mRNA-binding and mRNA-unwinding
+proteins facilitating initiation of translation; these are the factors of eIF4 group, namely eIF4A,
+eIF4B, eIF4F and eIF4E [186].
+The role of IF6 in translation initiation is more complex than those of the other initiation
+factors because it performs different functions about which very little is known. First of all,
+IF6 does not act as a true initiation factor because it does not form any initiation complex8
+with either RNAs or ribosome subunits, as proved by the fact that yeast cells depleted of
+eIF6 remained active in translation of mRNAs in vitro [178]. Its principal functions can be
+summarized as follows:
+- it is required for biogenesis of the 60S ribosomal subunit both in archaebacteria and
+eukaryotes [173, 178, 177, 212]
+8 Initiation complexes are macromolecular complexes formed by mRNA, tRNA and ribosome subunits which
+come together to form the machinery that performs the first two steps of the translation. IF6 does not take part
+directly in this mechanism.
+1.4 the anti-association factor 25
+- it acts as de facto anti-association factor of the 60S and 40S subunit in the cytoplasm
+[178, 28]
+Moreover, a very recent work also uncovered another evolutionary conserved function
+of IF6 in the microRNA-mediated post-transcriptional silencing[34] which could extend
+significantly the peculiarities of IF6.
+Si and Maitra showed that depletion of eIF6 in yeast cells resulted first in a decrease in
+the rate of protein synthesis and then in cessation of cell growth [178] and Basu et al. [10]
+showed also that the protein depletion caused in cells a selective reduction of 60S ribosomal
+subunits. These two results and the previous one confirmed the evolutionarily conserved
+main role of IF6 in biogenesis and assembly of ribosomal units and also the absence of its
+direct participation in the translation process.
+The suggestion of these two functions of IF6 is also strengthened by the localization of
+the protein in both nucleus and cytoplasm[6] where ribosome subunit biogenesis and
+ribosome assembly take place respectively. Furthermore, Basu and coworkers [10] showed
+that phosphorylation of eIF6 regulates its distribution in nucleus and cytoplasm [11].
+As a whole, the multiple functions of IF6 make this protein an essential factor for cellular
+growth and protein synthesis. Very little is known about its participation in the 60S biogenesis
+whereas several works in the past decades better elucidated its role as anti-association factor
+at a molecular level [28]. This function has been identified in eukaryotes as part of a process
+which involves a protein promoter of ribosome translation, RACK1, and a protein kinase, PKC.
+In the context of this work, it is worth noting that eIF6 has been proven to be very sensitive
+to heat: in homologues from wheat germ [170] and calf liver [199], eIF6 activity had an
+optimum at around 37 °C but was completely absent between 50 and 60 °C. Whether the
+cessation of activity is due to a partial or complete protein denaturation is not known.
+From a molecular point of view, IF6s are 26kDa proteins which share a phylogenetically
+conserved sequence of 224 residues with 30% similarity. All known eukaryotic IF6 contain
+an additional carboxyl terminal extension of 21 amino acids. Even though this tail does
+not seem to be directly involved in the anti-association function of IF6 [66], as proved in
+in vitro reactions, it has been proven to be somehow related to this process through the
+26 general introduction
+phosphorylation of a serine residue (Ser235) by the protein kinase PKC [28].
+In 2000, the first molecular structure of an IF6 homologue was solved by x-ray
+crystallography by Groft and coworkers [66] who obtained the structures of two homologous
+IF6s from M. jannaschii and from Saccharomyces cerevisiae. Both structures revealed a
+very unusual internal pseudo-symmetry made by the disposition around a common axis of
+five copies of a repeating α/β subdomain of about 45 residues. Each subdomain contains: one
+long α helix, a shorter α-helix or a 310-helix and three β-strands. While the global structure
+of the first 224 residues is well known and has been proven to be evolutionarily conserved by
+homology modelling [66], nothing is known about the structure of the C-terminal extension
+of 21 amino acids.
+Figure 7: Cartoon representation of IF6 backbone. The color scheme highlights different type of protein
+secondary structure. One of the pseudo-subdomain is shown on the left-hand side as
+reference.
+1.5 the thesis project "at a glance". 27
+From a structural point of view it is also worth noting that the five subdomains do
+not make a unified hydrophobic center of the protein. Instead, they produce a hydrophobic
+"torus" by their association which in turn creates a cave-like hollow in the center of the
+structure. The cavity is large enough to let water molecules enter and in the crystallographic
+data sixteen of them were found in a well-ordered conformation of pentagonal layers and are
+hydrogen bonded to the carbonyl oxygen atoms of two residues in the neighboring β-strands.
+In the yeast (Saccharomyces cerevisiae) eIF6 this cavity is closed by an arginine (residue 61)
+whose guanidinium group makes several hydrogen bonds with glycines in the short α-helix
+of subdomains.
+1.5 the thesis project "at a glance".
+As stated earlier in this introduction, the key point for molecular evolution is the maintenance of
+biological function. This is accomplished in proteins either by point mutations or by simple
+structure re-arrangements. Nonetheless, evolution does not have a unique pathway to follow
+this procedure.
+This thesis focused on the way proteins evolutionarily "react" to large environmental
+changes, i.e. how they adapt to function even in organisms which live in extreme conditions.
+Following this idea, this work concentrated on the study of the adaptation of the IF6 from
+Methanococcus jannaschii to extreme environments. In this context the comparison with
+proteins in normal (mesophilic) conditions is essential to finely characterize
+the ability to adapt to extreme conditions.
+IF6 from Saccharomyces cerevisiae was chosen as the mesophilic counterpart of that from Methanococcus
+jannaschii. They share only 33% of identity in sequence but their structures are significantly
+similar to each other and to most of the other IF6s homologues [66]. As a whole, this means
+that IF6’s function was highly conserved during evolution but it does not explain how
+function and, apparently, structure have been maintained in the adaptation to a wide variety
+of environmental conditions.
+In this context, the work presented here will try to give a first answer to the following
+questions:
+Where does the extremophilic signature come from?
+If structure cannot be the origin for this, can it be the dynamics?
+28 general introduction
+Of course all answers given here will be limited to the particular case of adaptation to the
+warm deep-seas and will be neither exhaustive nor general but could introduce a new
+approach in the study of protein evolution.
+The main tools used in this work are molecular dynamics simulation and neutron
+scattering experiments. After a brief introduction to the main concepts of the theoretical
+frameworks that guided this work, the experimental setups will be presented.
+In the following chapter a wide and detailed presentation of a novel method for the
+characterization of the protein secondary structure is given. The method, called ScrewFit, was
+developed in the context of this thesis but it has rapidly found various applications
+in the analysis of protein structures. Some examples already published as scientific articles in
+international peer-reviewed journals will be given.
+Finally the results of this work on IF6 homologues will be presented and discussed. Some
+general outcomes will then be used in an attempt to answer the questions about
+protein evolution proposed above.
+2
+MATERIAL AND METHODS
+2.1 molecular dynamics
+2.1.1 The basic principle
+Molecular simulations used in combination with experimental methods, are a very
+useful tool to give new insights into the dynamics and structure of complex molecular
+systems. Simulation methods are used within different approximations, depending on the
+experimental results with which they are confronted.
+In this sense, neutron scattering techniques are well matched to the molecular dynamics
+(MD) simulation method, which combines the classical equations of motion with empirical
+force fields obtained from a priori quantum-dynamical calculations of atomic interactions
+in the building blocks of the systems of interest. The basic approximation made in MD
+is the Born-Oppenheimer approximation which states that due to the large difference in
+masses between electrons and atomic nuclei, the electron dynamics is orders of magnitude
+faster than that of the nuclei and, therefore, it can be assumed that electronic shells adapt
+instantaneously to the positions of the nuclei. Moreover the dynamics of the nuclei is treated
+by classical mechanics.
+De facto, the MD gives information about the dynamics of the same objects that are directly
+seen by neutrons: the atomic nuclei. As a consequence, MD and neutron scattering give
+access to the same length and time scales (ranging from 1 Å to 100 Å and from 0.1 ps to 10 ns,
+respectively).
+In an MD simulation each atom is represented by a point mass whose dynamics is described
+by the classical Newton’s equations of motion:
+$$m_i \ddot{\mathbf{r}}_i = \mathbf{F}_i, \qquad i = 1, \ldots, N \qquad (2.1)$$
+29
+30 material and methods
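+where $m_i$ is the mass of atom $i$ and $\mathbf{F}_i$ is the total force acting on it. The force $\mathbf{F}_i$ is derived
+from the potential energy $U(\mathbf{r}_1, \ldots, \mathbf{r}_N)$ through:
+$$\mathbf{F}_i = -\frac{\partial U(\mathbf{r}_1, \ldots, \mathbf{r}_N)}{\partial \mathbf{r}_i} \qquad (2.2)$$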
+As already mentioned, the energy U(r1 . . . rN) is an effective energy which describes all
+types of atomic interactions. The generic form of the potential energy is :
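+$$\begin{aligned}
+U_{\mathrm{total}} ={} & \sum_{\mathrm{bonds}} K_r (r - r_{eq})^2 + \sum_{\mathrm{angles}} K_\theta (\theta - \theta_{eq})^2 \\
+& + \sum_{\mathrm{dihedrals}} \frac{V_n}{2} \left[ 1 + \cos(n\phi - \gamma) \right] \\
+& + \sum_{i<j} \left[ \frac{A_{ij}}{R_{ij}^{12}} - \frac{B_{ij}}{R_{ij}^{6}} \right] + \sum_{i<j} \frac{q_i q_j}{\epsilon R_{ij}} \qquad (2.3)
+\end{aligned}$$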
+The terms of this potential can be divided into two groups: bonded interactions, which are
+related to the covalent bond structure taking into account the stretching of bond lengths, the
+bending of bond angles and dihedral angles described by three consecutive bonds; non-bonded
+interactions describe the repulsion between neighboring atoms, the dispersive forces due to
+mutually induced atomic dipoles (both contained in a Lennard-Jones 12-6 function) and
+electrostatic interactions.
+Throughout this thesis all molecular dynamics simulations have been performed using the
+AMBER9 simulation program [26]. The whole set of simulations used the AMBER99SB force
+field which is a recent upgraded version of the AMBER94 force field, usually used for protein
+molecular dynamics, and which contains a reparametrization of the backbone torsion terms
+and achieves a better balance of the different secondary structure elements [86].
+MD simulations of biological molecules are mostly performed in solution, typically
+water, as in real biological environments. In order to obtain a realistic solvation of the
+sample molecule, the amount of solvent molecules is usually very large and counts for a
+2.1 molecular dynamics 31
+substantial part of the computational effort. Several simple models for water molecules
+have been developed in the past which allow simulations to be performed with a moderate
+computational cost. A simple and widely used model is the TIP3P model [103, 104]. Here
+the molecule has a rigid geometry with fixed bond lengths and angles; the intermolecular
+interactions are modeled by Coulombic and Lennard-Jones terms. Moreover, the model
+contains three sites for the electrostatic interactions: the partial positive charge of hydrogens
+is balanced by a negative charge placed at the oxygen atom position; the van der Waals
+interactions are computed with only one point of interaction per molecule, centered on the
+oxygen atoms.
+The set of ordinary differential equations (2.1) is solved numerically using a discretization
+method. The general procedure can be summarized as follows. Given the initial dynamic state
+(position and velocities) at time t, the positions and velocities at time t+∆t are calculated.
+The finite time-step ∆t depends on the integration method as well as on the system itself. The
+basic criteria for a good integrator are: it should be fast, require little computer memory and
+be time-reversible; it should permit the use of a relatively long time step and guarantee the
+conservation of the total energy within a reasonable error which is related to the definition of
+the time step ∆t. For later analysis one assumes also the ergodicity of the simulated trajectory,
+i.e. if A is a function of time then
+$$\lim_{T \to \infty} \frac{1}{T} \int_0^T A(\tau)\, d\tau = \langle A \rangle$$
+where T is the simulation length and 〈·〉 a phase space ensemble average. This condition
+allows the calculation of the ensemble averages by means of time averages.
+periodic boundary conditions and summation of non-bonded terms A
+real experiment relates to macroscopic samples consisting of $\approx 10^{23}$ atoms whereas the
+simulated systems usually contain between $10^3$ and $10^6$ atoms. This discrepancy leads to
+significant differences in physical quantities of the bulk, due to a larger influence of boundary
+effects in the simulated systems. For this reason, periodic boundary conditions are applied:
+the initial unit cell is replicated infinitely in all directions, meaning that each atom i having
+position ri = (xi,yi, zi) in the central box has an infinite number of image atoms with
+32 material and methods
+Figure 8: Bidimensional representation of the periodic boundary condition
+positions $\mathbf{r}_i + \mathbf{n}L = (x_i + n_1 L, y_i + n_2 L, z_i + n_3 L)$ where L is the linear dimension of the
+simulation box (assuming a cubic shape) and the integer triples $\mathbf{n} = (n_1, n_2, n_3)$ define the
+direction in space. From a practical point of view, this means that during the simulation,
+whenever an atom leaves the principal simulation box, it enters again from the opposite side
+thus keeping the average density of the system constant.
+When calculating the force acting on an atom of the system, one should consider both the
+interactions with the other N− 1 atoms and those with all images lying in the surrounding
+box. This would lead to a sum of infinite terms which is clearly not possible in practice. For
+this reason, it is assumed that each atom interacts only with the nearest images of all other
+atoms. In this approach, called the minimum image convention, the distance between the pair
+of atoms i, j is defined by $d_{ij} = \min_{\mathbf{n}} \{ \| \mathbf{r}_j + \mathbf{n}L - \mathbf{r}_i \| \}$, i.e. the distance between atom i and the
+closest image of atom j. The outcome of this convention is that the calculation of potential
+energy and forces would involve only $\frac{1}{2} N(N-1)$ terms.
+For short-ranged interactions, such as Lennard-Jones ones, the list of atoms interacting with
+atom i can be restricted to its neighboring pairs taking a cut-off distance which is usually
+set lower than L/2, where L is the linear dimension of the box, in order to ensure that each
+atom is counted only once. Nevertheless, this truncation of potential energy calculation can be
+safely applied only to the short-ranged forces. The long-ranged forces, i.e. the electrostatic
+ones, cannot be calculated within this approach because they contribute significantly to the
+overall potential also at distances larger than the box dimensions.
+2.1 molecular dynamics 33
+The periodic boundary conditions can be used also to calculate the electrostatic interactions
+between all atoms of the system by means of the Ewald summation method. The term due to
+these interactions, when written for periodic systems, must take into account the interactions
+between atoms belonging to different periodic images of the original box:
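+$$U_{\mathrm{elect}} = \sum_{\mathbf{n}}{}^{\prime} \sum_{i \le j} \frac{q_i q_j}{\epsilon \, \| \mathbf{r}_{ij} + \mathbf{n}L \|} \qquad (2.4)$$
+where the prime indicates that the terms with i = j are omitted for n = 0, and the vectors $\mathbf{n} = (n_1, n_2, n_3)$ with $n_1, n_2, n_3 = 0, \pm 1, \pm 2, \ldots$ are the lattice vectors which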
+define the periodic images of the original box. This sum is conditionally convergent, i.e. the
+results depend on the order in which the terms are summed up. A suitable choice is to sum
+boxes in order of their distance from the original one, thus approaching the sum of terms
+over spherical layers for which the value of Uelect in equation (2.4) is known. A rapidly
+convergent form to this value, can be obtained by the substitution of (2.4) by the sum of two
+rapidly convergent series, as originally proposed by Ewald [53, 131].
+In the general approach, each point charge in the system is surrounded by a charge
+distribution of equal magnitude and opposite sign. The form of this distribution is usually a
+Gaussian:
+$$\rho(\mathbf{r}) = \frac{q_i \beta^3}{\pi^{3/2}} \exp(-\beta^2 r^2) \qquad (2.5)$$
+This distribution screens the interactions between neighboring charges and summed, over
+the periodic system, together with the original point charges, leads to a rapidly convergent
+potential which has the form [46, 78]:
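+$$\phi(\mathbf{r}; \beta) = \sum_{\mathbf{n}} \frac{\mathrm{erfc}(\beta |\mathbf{r} + \mathbf{n}|)}{|\mathbf{r} + \mathbf{n}|} \qquad (2.6)$$
+where erfc is the complementary error function and β is a parameter which affects the rate of convergence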
+of the series in the direct space of the periodic lattice. Another charge distribution of the
+same sign of the original charges and with the same shape of ρ(r) is added to reduce the
+overall potential to the one due to the original set of charges. This cancelling distribution is
+summed in the reciprocal space of the periodic lattice by means of Fourier transforms. To
+correct the fact that the latter series contains also the interaction of each distribution with
+itself, a self-term is also added. Finally, another additional term, J(D) is usually added to take
+into account the effects due to the dipole moment D of the original box as well as the external
+dielectric constant.
+34 material and methods
+The final rapidly convergent potential reads:
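+$$\begin{aligned}
+U_{\mathrm{elect}} ={} & \frac{1}{2} \sum_{i=1}^{N} \sum_{j=i+1}^{N} \Bigg( \sum_{|\mathbf{n}|=0}^{\infty} q_i q_j \frac{\mathrm{erfc}(\beta |\mathbf{r}_{ij} + \mathbf{n}|)}{|\mathbf{r}_{ij} + \mathbf{n}|} \\
+& + \frac{1}{\pi L^3} \sum_{\mathbf{k} \neq 0} q_i q_j \frac{4\pi^2}{k^2} \exp(-k^2 / 4\beta^2) \cos(\mathbf{k} \cdot \mathbf{r}_{ij}) \Bigg) \\
+& - \frac{\beta}{\sqrt{\pi}} \sum_{i=1}^{N} q_i^2 + J(D) \qquad (2.7)
+\end{aligned}$$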
+where k defines the reciprocal lattice vectors. The rate of convergence of the series in (2.7) is
+determined by the value of β. Adjusting it can significantly reduce the computational effort
+and transform an initial $O(N^2)$ algorithm to an $O(N^{3/2})$ one (if the system is homogeneous).
+Further improvements in the efficiency of the algorithm can be achieved by choosing β
+sufficiently large that atom pairs for which rij exceeds a specific cut-off distance roff are
+negligible in the first series in (2.7), which reduces this term to an O(N) calculation. The sum
+in the reciprocal space in the second series of (2.7) can then be approximated by means of
+the Fast Fourier Transform algorithm. The latter algorithm requires a regular discrete grid of
+points and for this reason the point charges are mapped onto the neighboring grid points
+by means of interpolation. The spacing of the grid significantly affects the accuracy of this
+approximation. This improvement of the original Ewald summation is referred to as the
+particle-mesh method and has global complexity of order O(N lnN), N being the number of
+particles.
+Throughout this thesis, periodic boundary conditions were applied for all production
+simulations and the electrostatic interactions were computed using the particle-mesh Ewald
+method for which the cut-off distance $r_{\mathrm{off}}$ in the direct sum was set to 8 Å and the grid for
+the term in the reciprocal space had a spacing of 0.75 Å with a B-spline interpolation up to
+the 4th order.
+extended ensemble molecular dynamics The MD simulations presented in this
+work have been performed to reproduce the environment of experimental setups. For this
+purpose, they emulated the condition of constant average temperature and pressure which
+2.1 molecular dynamics 35
+corresponds to the isothermal-isobaric ensemble, NPT in statistical mechanics. In the case of
+MD simulations, this means that the number of particles N in the system is constant and the
+value of the temperature T and of the pressure P are instantaneously readjusted toward the
+average requested value by the control of some supplementary variables. The latter modify
+both the velocities (to adjust the temperature) and the interatomic distances (for pressure
+adjustment), introducing additional degrees of freedom in the original equation of motion
+(2.1). The following paragraphs give a brief explanation of how these re-adjustments are
+performed.
+Langevin thermostat The macroscopic average temperature is maintained constant by
+means of a coupling of the system with a thermal bath at constant temperature which should
+work like a real thermostat. In the present work this coupling is achieved by inserting in
+Newton's equation of motion a friction and a stochastic term. This leads to the equation known
+as the Langevin equation, which for each atom i reads:
+$$m_i \dot{\mathbf{v}}_i(t) = \mathbf{F}_i - \gamma_i \mathbf{v}_i(t) + \mathbf{R}_i(t). \qquad (2.8)$$
+where Fi is total force applied on atom i, Ri(t) is a stochastic force and γi represents the
+intensity of coupling with the thermal bath.
+The stochastic term is defined as a white-noise, i.e. its ensemble average must be zero and it is
+completely uncorrelated at all times:
+$$\langle \mathbf{R}_i(t) \rangle = 0$$
+$$\langle \mathbf{R}_i(t) \cdot \mathbf{R}_i(t') \rangle = 6 k_B T \gamma_i \, \delta(t - t') \qquad (2.9)$$
+where $\delta(t - t')$ is the Dirac distribution centered at $t = t'$.
+The friction term −γivi(t) opposes the motion of atom i affecting its velocity: it is proportional
+to the atom velocity and with opposite sign. This term is strictly related to the stochastic force
+by the fluctuation-dissipation theorem which leads to:
+$$\int dt \, \langle \mathbf{R}_i(t) \cdot \mathbf{R}_i(0) \rangle = 6 k_B T \gamma_i. \qquad (2.10)$$
+These assumptions have to be made to avoid any memory effect in the values of Ri(t)
+which could lead to unphysical drift phenomena in velocity values. This method allows the
+36 material and methods
+control of the temperature through the mutual balance between the friction and stochastic
+terms in adjusting the velocity of each atom. It is worth noting here that Langevin thermostat
+allows a correct sampling of the canonical ensemble but a priori the addition of a friction
+term in the equation of motion could result in some artifacts in the dynamical properties of
+the simulated system. Nevertheless, this problem can be circumvented by using friction coefficients
+much smaller than the actual friction coefficient of the solvent. In the case of water, which
+has γ = 50 ps⁻¹, it was shown that a value of 2 ps⁻¹ does not significantly change protein
+dynamics [195]. Details on the parameter values used in this work are given in the next
+chapter.
+Berendsen barostat The adjustment of instantaneous pressure values can be approached exactly
+in the same way as for temperature, by coupling the system to a pressure bath.
+The value of the system pressure is related microscopically to the internal kinetic energy and
+the virial:
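+$$P = \frac{2}{3V} \left[ E_{\mathrm{kinetic}} - \Xi \right], \qquad (2.11)$$
+where
+$$\Xi = -\frac{1}{2} \Big\langle \sum_{i>j}^{N} \mathbf{r}_{ij} \cdot \mathbf{F}_{ij} \Big\rangle. \qquad (2.12)$$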
+From these equations it is evident that a change in pressure can be obtained by changing
+the virial through the rescaling of the interatomic distances rij. The latter leads to a rescaling
+of the total volume of the simulated system and of its atomic coordinates. The method
+originally proposed by Berendsen and coworkers [14] uses the rescaling of distances to
+regulate the macroscopic pressure of the system. For this purpose the equation that relates
+the time derivative of atomic coordinates with velocities, $\dot{\mathbf{x}} = \mathbf{v}$, should be modified with the
+introduction of an extra term: $\dot{\mathbf{x}} = \mathbf{v} + \alpha \mathbf{x}$. The volume of the system should also change
+accordingly: $\dot{V} = 3\alpha V$.
+The pressure variation in the pressure bath is defined by:
+$$\left( \frac{dP}{dt} \right)_{\mathrm{bath}} = \frac{P_0 - P}{\tau_p} \qquad (2.13)$$
+2.1 molecular dynamics 37
+where P0 is the target pressure value. Additionally, the pressure change is generally also
+related to the isothermal compressibility β by:
+$$\left( \frac{dP}{dt} \right)_T = -\frac{1}{\beta V} \frac{dV}{dt} = -\frac{3\alpha}{\beta}, \qquad (2.14)$$
+where the last equality is obtained by applying the requested volume re-scaling.
+Equations (2.13) and (2.14) lead to:
+$$\alpha = -\beta \frac{P_0 - P}{3\tau_p} \qquad (2.15)$$
+Hence, the equation of motion now reads:
+$$\dot{\mathbf{x}} = \mathbf{v} - \beta \frac{P_0 - P}{3\tau_p} \mathbf{x} \qquad (2.16)$$
+The solution of this equation, as obtained by the finite difference methods used in MD
+simulations gives a rescaling factor for the atom coordinates and the linear dimension of the
+simulation box which is equal to (at the first order in the time step ∆t)1:
+$$\mu = 1 - \frac{\beta \Delta t}{3\tau_p} (P_0 - P). \qquad (2.17)$$
+leapfrog integrator In the program suite AMBER9, the integration of the equations
+of motion for the extended system corresponding to the NPT ensemble used in this work, is
+implemented through the use of the Leapfrog integrator [56, 3]. The latter is a symplectic and
+time-reversible integrator whose general form is derived by the Taylor series expansion of
+Newton equations for the atom position r, at timestep t and for its velocity at an intermediate
+time step t+∆t/2 [56]:
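+$$\mathbf{v}_i(t + \Delta t/2) = \mathbf{v}_i(t - \Delta t/2) + \frac{1}{m_i} \mathbf{F}_i \Delta t \qquad (2.18)$$
+$$\mathbf{r}_i(t + \Delta t) = \mathbf{r}_i(t) + \mathbf{v}_i(t + \Delta t/2) \Delta t \qquad (2.19)$$
+The velocity $\mathbf{v}_i(t)$ can be computed a posteriori with the relation:
+$$\mathbf{v}_i(t) = \frac{1}{2} \left[ \mathbf{v}_i(t + \Delta t/2) + \mathbf{v}_i(t - \Delta t/2) \right] \qquad (2.20)$$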
+1 The isothermal compressibility β does not need to be known exactly because its value influences only the
+accuracy of τp without any consequence for the dynamics.
+38 material and methods
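+When applied to an extended system resulting from the use of the Langevin thermal bath and
+Berendsen barostat, equations (2.18) and (2.19) read:
+$$\mathbf{v}_i(t + \Delta t/2) = \mathbf{v}_i(t - \Delta t/2) + \frac{\Delta t}{m_i} \left[ \mathbf{F}_i - \gamma_i \mathbf{v}_i(t) + \mathbf{R}_i(t) \right] \qquad (2.21)$$
+$$\mathbf{r}_i(t + \Delta t) = \mathbf{r}_i(t) + \left[ \mathbf{v}_i(t + \Delta t/2) - \beta \frac{P_0 - P}{3\tau_p} \mathbf{r}_i(t) \right] \Delta t \qquad (2.22)$$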
+2.2 neutron scattering
+Neutrons are one of the most useful probes to study the structural and dynamical properties
+in condensed matter. Neutrons for scattering experiments are usually moderated to be at
+thermal equilibrium at room temperature with typical energies of ∼ 25 meV and wavelength
+around 1.78Å, which corresponds to the same time and length scale of the thermally excited
+atomic motions. These facts make neutrons very sensitive to both amplitude and frequencies
+of atomic motions. For macromolecules, cold neutrons which have typical energies around
+2.3meV and wavelength ∼ 5Å, are however better adapted to explore longer length scale and
+slower dynamics.
+Figure 9: Scheme of neutron scattering
+Neutrons interact directly with atomic nuclei via a very short range potential which can
+be considered as a direct collision between the neutron and a nucleus (see Figure 9). An
+incident monochromatic neutron beam can interact with matter through both absorption
+and scattering. When scattered, neutrons can be characterized by their wave vector kout and
+energy Eout [129, 13].
+2.2 neutron scattering 39
+The number of incident neutrons with wave vector $\mathbf{k}_{in}$ which are scattered with a wave
+vector $\mathbf{k}_{out}$ in the elementary solid angle dΩ around the direction of $\mathbf{k}_{out}$ and with an
+energy exchange dω is called the differential cross section and it is defined as:
+$$\frac{d^2\sigma}{d\Omega \, d\omega} = N \cdot \frac{|\mathbf{k}_{out}|}{|\mathbf{k}_{in}|} S(\mathbf{q}, \omega), \qquad (2.23)$$
+where N is the number of scatterers in the sample.
+The function S(q,ω) is called the dynamic structure factor and it gives access to sample
+dynamics as a function of q and ω which represent the momentum and the energy transfer
+respectively:
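+$$\Delta \mathbf{p} = \hbar (\mathbf{k}_{in} - \mathbf{k}_{out}) = \hbar \mathbf{q} \qquad (2.24)$$
+$$\Delta E = E_{in} - E_{out} = \hbar\omega = \frac{\hbar^2}{2 m_n} (k_{in}^2 - k_{out}^2) \qquad (2.25)$$
+The value of $|\mathbf{q}|$ is related to the energy transfer $\hbar\omega$ by the relation:
+$$|\mathbf{q}| = k_{in} \sqrt{2 - \frac{\hbar\omega}{E_{in}} - 2 \sqrt{1 - \frac{\hbar\omega}{E_{in}}} \cos\theta} \qquad (2.26)$$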
+This formulation of the problem takes into account the fact that in scattering phenomena
+neutrons more easily lose energy in interacting with matter. Equation (2.26) is of crucial
+importance for the determination of the accessible range in the experimental settings of
+quasielastic neutron scattering measurements.
+Linear response theory allows the dynamic structure factor to be written in terms of
+equilibrium fluctuations of the sample and thus, using the fluctuation-dissipation theorem
+[201], S(q,ω) can be written as the Fourier transform of the intermediate scattering function
+F(q, t):
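+$$S(\mathbf{q}, \omega) = \frac{1}{2\pi} \int_{-\infty}^{+\infty} dt \, F(\mathbf{q}, t) e^{-i\omega t}, \qquad (2.27)$$
+$$F(\mathbf{q}, t) = \frac{1}{N} \sum_{\alpha,\beta} \Gamma_{\alpha\beta} \int_{-\infty}^{+\infty} G_{\alpha\beta}(\mathbf{r}, t) e^{-i\mathbf{q} \cdot \mathbf{r}} \, d\mathbf{r} = \frac{1}{N} \sum_{\alpha,\beta} \Gamma_{\alpha\beta} \left\langle e^{i\mathbf{q}^T \cdot \mathbf{r}_\alpha(t)} e^{-i\mathbf{q}^T \cdot \mathbf{r}_\beta(0)} \right\rangle \qquad (2.28)$$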
+40 material and methods
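+$$\Gamma_{\alpha\beta} = \overline{b_\alpha} \, \overline{b_\beta} + \delta_{\alpha\beta} \left( \overline{b_\alpha^2} - \overline{b_\alpha}^2 \right) \qquad (2.29)$$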
+where "〈· · ·〉" denotes an ensemble average and if A(t) and B(t) are two time-dependent
+functions, "〈A(t1)B(t2)〉" is usually referred to as a correlation function. The parameter $b_{\alpha/\beta}$,
+called the scattering length, is an effective linear dimension of the nucleus α/β with respect to
+its interaction with neutrons. The function $G_{\alpha\beta}(\mathbf{r}, t)$ in (2.28) is referred to as the Van Hove
+pair correlation function and represents the probability that, given a particle at the origin at
+time t = 0, any particle (including the same one) is at r at time t.
+The intensities of the neutron-nucleus interactions are defined by the scattering lengths b of
+each nucleus in the sample which depend on the isotope and the relative orientation between
+the spin of the two interacting particles. If the spins of the nuclei and the neutron are not
+maintained in a special orientation one can assume a random relative orientation and that
+spin and position of the nuclei are uncorrelated.
+For this, F(q, t) in (2.28) takes into account the random distribution of nuclear spins in the
+sample through the parameter Γαβ defined in (2.29) where the average over isotopes and
+relative spin orientations of neutron and nucleus is expressed by an overbar, $\overline{\cdots}$.
+The parameter Γαβ can be divided into two terms:
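+\[ \Gamma_{\alpha\beta} = b_{\alpha,coh}\, b_{\beta,coh} + \delta_{\alpha\beta}\left(b_{\alpha,inc}\, b_{\alpha,inc}\right) \tag{2.30} \]
+where,
+\[ b_{\alpha,coh} = \overline{b_\alpha} \tag{2.31} \]
+\[ b_{\alpha,inc} = \sqrt{\overline{b_\alpha^2} - \overline{b_\alpha}^2} \tag{2.32} \]
+are linked to the total scattering cross section by the relation:
+$\sigma_\alpha = 4\pi\left(b_{\alpha,coh}^2 + b_{\alpha,inc}^2\right)$.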
+The outcome of equation (2.30) is also that F(q, t) can now be recast as a sum of two parts:
+the coherent part Fcoh(q, t) which results from the correlations in time between the positions
+of the atom α (autocorrelation term) and those of different atoms β (cross-correlation term);
+the incoherent part Finc(q, t) which results only from the time auto-correlation of the positions
+of the same atom α:
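+\[ F_{coh}(\mathbf{q},t) = \frac{1}{N}\sum_{\alpha,\beta} b_{\alpha,coh}\, b_{\beta,coh}
+   \left\langle e^{i\mathbf{q}^T\cdot\mathbf{r}_\alpha(t)}\,
+   e^{-i\mathbf{q}^T\cdot\mathbf{r}_\beta(0)} \right\rangle
+   \tag{2.33} \]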
+2.2 neutron scattering 41
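+\[ F_{inc}(\mathbf{q},t) = \frac{1}{N}\sum_{\alpha} b_{\alpha,inc}^2
+   \left\langle e^{i\mathbf{q}^T\cdot\mathbf{r}_\alpha(t)}\,
+   e^{-i\mathbf{q}^T\cdot\mathbf{r}_\alpha(0)} \right\rangle \tag{2.34} \]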
+2.2.1 Incoherent Scattering
+Neutron scattering from biological samples is mainly dominated by the incoherent part
+of the scattering of the hydrogen nucleus. This fact is due to the large difference between
+the incoherent term from hydrogens and the incoherent and coherent terms from the other
+isotopes that are usually present in biological samples. This fact is clearly shown in Table
+5.
+Isotope bcoh(fm) binc(fm) σcoh(barn) σinc(barn)
+1H -3.74 25.27 1.76 80.27
+2H 6.67 4.04 5.59 2.05
+12C 6.65 0 5.56 0
+14N 9.37 1.98 11.03 0.49
+16O 5.80 0 4.23 0
+32S 2.80 0 0.99 0
+Table 5: Incoherent and coherent scattering lengths of the most common isotopes found in biological
+samples. Data reported from [175].
+The characteristic cross section of hydrogens is mainly due to a large incoherent
+contribution of the most favorable state of the interacting system composed by the incident
+neutron and the hydrogen nucleus. From a practical point of view, this fact constitutes a
+significant advantage in studying biological samples because they present large amounts of
+hydrogens uniformly spread over their chemical components. Therefore, the scattering from
+samples will represent the dynamics of the whole molecule even though they are mainly
+due to only one type of atom. Moreover, the great difference between the cross section of
+hydrogen (1H) and the one of deuterium (2H) allows some contrast to be created between
+different parts of the same molecule or between the molecule and the aqueous content of the
+surrounding solvent yielding a better characterization of the structure and dynamics of the
+42 material and methods
+sample itself.
+Elastic and Quasielastic Incoherent Scattering
+A typical spectrum from neutron scattering measurements is shown in Figure 10 where
+one can easily distinguish three different regions: the elastic peak which results from scattering
+without exchange of energy between the interacting particles and gives insights into the
+structural configuration of the sample; the quasi-elastic part which results from small energy
+changes and describes all the stochastic dynamics of atoms in the sample, such as rotational
+and translation diffusion; the inelastic part which is present only if the energy change is
+sufficient to modify the equilibrium state of the sample and gives access to vibrational
+motions.
+As mentioned in the previous paragraph, the large quantity of hydrogens in proteins or
+DNA lets us perform the following approximation:
+\[ F(\mathbf{q},t) \approx N\, b_{H,inc}^2\, F_H(\mathbf{q},t) \tag{2.35} \]
+where
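+\[ F_H(\mathbf{q},t) = \frac{1}{N}\sum_{\alpha\in\{H\}}
+   \left\langle e^{i\mathbf{q}^T\cdot\mathbf{r}_\alpha(t)}\,
+   e^{-i\mathbf{q}^T\cdot\mathbf{r}_\alpha(0)} \right\rangle
+   \tag{2.36} \]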
+The relative dynamic structure factor can be written using the relation (2.27)
+\[ S_H(\mathbf{q},\omega) = \frac{1}{2\pi}
+   \int_{-\infty}^{+\infty} dt\, F_H(\mathbf{q},t)\, e^{-i\omega t},
+   \tag{2.37} \]
+and it is the main part of the dynamic structure factor that can be directly measured by
+neutron scattering experiments.
+In the case of samples with confined internal motions, such as biological macromolecules,
+the intermediate scattering function defined in (2.36) can be decomposed into a time-
+dependent part and a time-independent one:
+\[ F_H(\mathbf{q},t) = F'_H(\mathbf{q},t) + F_H(\mathbf{q},\infty) \tag{2.38} \]
+2.2 neutron scattering 43
+Figure 10: A typical spectrum from neutron scattering measurements.
+This is due to the fact that the atom positions at different instants become independent of
+time as the latter goes to infinity.
+In simple liquids, where no confined motion is present, the time-independent term is strictly
+zero because of the atomic Brownian motion which contributes to totally de-correlating
+atom positions, whereas in proteins, where the atomic internal motions are confined, the
+time-independent part is a non-zero constant.
+The time-independent part of (2.38) is usually called Elastic Incoherent Structure Factor (EISF)
+and can also be used to redefine the dynamic structure factor in the following manner:
+\[ S_H(\mathbf{q},\omega) = \mathrm{EISF}(\mathbf{q})\,\delta(\omega) + S'_H(\mathbf{q},\omega) \tag{2.39} \]
+44 material and methods
+In this form, SH(q,ω) presents an elastic and δ(ω)-shaped component related to the EISF
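+along with another part, $S'_H(\mathbf{q},\omega)$, issued from the quasi-elastic and inelastic spectra of the
+sample. Moreover the two parts on the right-hand side of (2.39) are restrained by the relation
+$\int_{-\infty}^{+\infty} S_H(\mathbf{q},\omega)\,d\omega = F(\mathbf{q},0) = 1$ (with appropriate normalization) which leads to:
+\[ \int_{-\infty}^{+\infty} d\omega \left[ S'_H(\mathbf{q},\omega) + \mathrm{EISF}(\mathbf{q})\,\delta(\omega) \right] = 1
+   \tag{2.40} \]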
+By definition, the EISF relates to the ensemble of positions that the scattering nuclei
+(hydrogens) can attain during an infinite time and it gives insights into the configurational
+space volume the latter can explore.
+In practice, the definition of EISF given above suffers from two main biases: from the
+experimental point of view δ(ω) cannot be obtained exactly because of the finite resolution
+of the instrument used for the measurements and it typically assumes a larger-width shape
+(usually fitted as a triangular, gaussian or a lorentzian distribution); from a numerical point
+of view, the calculation of the EISF as the limit to infinity of the intermediate scattering
+function is very difficult due to the very low statistics attainable for time scales close to the
+total time-window used to observe the sample dynamics.
+Nevertheless, one can easily overcome these problems by redefining the EISF in both cases: the
+measured EISF can be rewritten as the ratio of the elastically scattered intensity integrated over
+the frequencies ω to the total integrated intensity (the sum of the elastic and the quasi-elastic
+part):
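+\[ \mathrm{EISF}_{mes}(\mathbf{q}) = \frac{\int_{-\infty}^{+\infty} d\omega\, S^{elastic}_{mes}(\mathbf{q},\omega)}
+   {\int_{-\infty}^{+\infty} d\omega\, S_{mes}(\mathbf{q},\omega)} \tag{2.41} \]
+where $S_{mes}(\mathbf{q},\omega) = \int_{-\infty}^{+\infty} S_H(\mathbf{q},\omega')\,R(\omega-\omega')\,d\omega'$ takes into account the effects of
+the finite experimental resolution represented by the function R(ω) of half-width-at-half-
+maximum (HWHM) equal to Γ; the numerical EISF can be written instead as: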
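+\[ \mathrm{EISF}_{num}(\mathbf{q}) = \frac{1}{N}
+   \sum_{\alpha}
+   b_{\alpha,inc}^2\,
+   \left| \left\langle \exp(i\mathbf{q}\cdot\mathbf{r}_\alpha) \right\rangle \right|^2
+   \tag{2.42} \]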
+2.2.2 Spectrometers
+The choice of the type of spectrometer to be used to perform the measurements and its
+resolution is highly related to the time and length scales of interest. In case one wants to
+2.2 neutron scattering 45
+investigate the effects of pressure or temperature on the internal dynamics of biological
+samples such as proteins, which requires the use of samples in liquid solutions, the
+spectrometer resolution should be attentively set to reduce the contribution of the global
+diffusion of the sample to the measured signal.
+Time-of-flight spectrometers are typically used for measurements of quasielastic scattering
+spectra in solids, liquids and molecular crystals.
+Time-of-flight spectrometers
+In time-of-flight spectrometers, such as the one illustrated in Figure 11, neutrons from the reactor
+strike a sequence of choppers: passing through them the beam is first pulsed and then
+selected with respect to its energy E0 and wave vector k0. Therefore the neutrons leave the
+last chopper, placed at a known distance dCS from the sample, as a pulsed monochromatic
+beam. An array of 3He detectors is arranged at a known fixed distance dSD from the sample,
+and scattered neutrons arrive at the detectors at times determined by their scattering energies.
+The time-of-flight of a neutron from the last chopper to one of the detectors, the incident
+Figure 11: Example of time-of-flight spectrometer.
+neutron energy and the distances dCS and dSD are directly obtainable from measurements
+and allow the calculation of the final energy of scattered neutrons. Moreover, the knowledge
+of the angles of scattering allows spectra to be resolved as a function of momentum and energy
+transfer q and ħω.
+46 material and methods
+The time-of-flight spectrometers typically measure energy transfers in the range $10$–$10^{-2}$ meV,
+hence they are used to investigate dynamics that occur in the time range $10^{-10}$–$10^{-13}$ s.
+All time-of-flight measurements for this work have been performed with the following
+spectrometers:
+- FOCUS (Paul Scherrer Institut, Zurich, Switzerland ) which is a time-of-flight spectrom-
+eter with a variable incident wavelength from 2 to 15 Å. Its energy resolution varies
+from 50µeV to 300µeV in the setup with higher incident neutron flux and a maximum
+momentum transfer of 8 Å$^{-1}$.
+- IN6 (Institut Laue Langevin, Grenoble, France) which is a time-of-flight spectrometer
+with incident wavelength of 4 to 5.9 Å with corresponding energy resolution from 50
+µeV to 170 µeV. The maximum momentum transfer available is 2.6 Å$^{-1}$.
+3
+EXPERIMENTAL AND SIMULATED SYSTEMS SETUP
+3.1 sample production
+3.1.1 Protein expression and purification
+In the following we will discuss the methods used to produce samples for both neutron and
+in silico experiments.
+Both approaches demand a wide knowledge of techniques some of which have been already
+presented in the previous chapters. The experimental samples also need some preliminary
+steps for their own production which require knowledge in molecular biology. The discussion
+of these aspects in detail would be beyond the scope of this thesis, nevertheless, this part of
+the work has been fundamental for the following experimental steps as it allowed us to setup
+a stable protocol whose yield was adapted to neutron experiments.
+The protocol reported here followed the usual scheme for protein production which can be
+summarized in a very simplified way, as follows:
+- Cloning of the part of the genomic DNA from both Methanococcus jannaschii and
+Saccharomyces cerevisiae which encodes the a/eIF6 proteins.
+- Massive expression of the identified gene in a host organism, here E. coli, to produce
+large amounts of protein.
+- Purification of the protein solution obtained from the host organism to obtain a
+solution, as pure as possible, containing only the a/eIF6 proteins.
+cloning Two cloning experiments have been performed to produce the genes encoding
+eIF6 and aIF6 proteins. Following the nomenclature found in literature we will call TIF6 the
+gene that encodes for eIF6. For M. jannaschii, the genomic DNA fragment encompassing the
+aIF6 gene was obtained from TIGR/ATCC Bult et al. [18]. The resulting cDNA was then
+amplified by PCR amplification using the nucleotides shown in Table (6).
+For S. cerevisiae, TIF6 construct was produced by PCR amplification using genomic DNA
+from S. cerevisiae as a template. Cloning experiments were performed using the nucleotides
+47
+48 experimental and simulated systems setup
+Table 6: Primers used for the PCR amplification of the aIF6 and TIF6 genes.
+aIF6-forward AAA CAT ATG ACC ATG ATT ATA AGA AAA TAC TTC TC
+aIF6-reverse TTT TGC GGC CGC TCA TTA AAT CAG GCC TAA AGC ATC TT.
+TIF6-forward CGG GAT CCC ATA TGG CTA CCA GGA CTC AA
+TIF6-reverse GGG AAT TCC TAT GAG TAG GTT TCA ATC AA
+shown in Table (6).
+The forward primers introduced an NdeI restriction site and the reverse primers introduced a
+NotI restriction site. The aIF6 and TIF6 PCR products were cloned into a pET28a expression
+vector (Novagen). This plasmid contains a kanamycin resistance gene for selection of
+transformed cells, and a pBR322 replication origin. The target gene is placed under the control
+of the T7 RNA polymerase promoter, and is expressed as a fusion with an N-terminal hexahis-
+tidine tag followed by a thrombin cleavage site. Escherichia coli strain BL21(DE3) (Stratagene)
+chemically competent cells were transformed with this plasmid in order to express the protein.
+The DE3 gene encodes for the T7 RNA polymerase (under the control of the galactose operon).
+Transformation was done by heat shock: 1ng of plasmid DNA was mixed with 100µl of
+competent cells, and then incubated on ice for 20min. Following adsorption of the plasmid
+onto the cell membrane, cells were placed at 42 °C for 45 sec, and then on ice for 2 min. 500µl of
+SOC medium was added and the cells were incubated 1 h at 37 °C. To select cells which have
+been properly transformed, the culture was then plated on LB-agarose plates containing
+kanamycin (10 mg/l).
+The plates were incubated at 37◦C overnight. The next day 20 ml of LB containing 10 mg/l
+kanamycin were inoculated with 1 colony. The cells were grown until the OD600 reached 0.6
+AU. 1 ml of the cell suspension was complemented with 100µl of sterilized glycerol, and the
+mix was frozen by immersion into liquid nitrogen. The aliquot was stored at -80 °C.
+protein expression The expression was carried out in Erlenmeyer flasks. A 50ml
+preculture was prepared on the previous day by inoculating 50 ml LB (with 10 mg/l
+kanamycin) with cells scraped from the top of the frozen stock. For cultures in Erlenmeyer
+flasks, 2.5 l flasks were filled with 1 l of LB media complemented with 10 mg/l kanamycin.
+3.1 sample production 49
+Each flask was inoculated with 10 ml preculture, then incubated at 37◦C with 200 rpm
+agitation until the OD600 reached 0.6-0.8 AU. The temperature was then decreased to
+23 °C for 30 min, and 0.5 ml of isopropyl-thiogalactoside (IPTG) 1 M (0.5 mM final) was
+added to induce expression of the cloned protein (via induction of the T7 RNA polymerase).
+Incubation was continued in the same conditions for 5 h. The cells were pooled into 1 l
+bottles and harvested by centrifugation for 15 min at 5000 g. Cell pellets were frozen by flash
+cooling in liquid nitrogen and stored at -80◦C.
+protein purification For each protein preparation 10 g of frozen cellular paste were
+resuspended in 40 ml of lysis buffer + 40mg of lysozyme (Appendix A). 3 pills of antiprotease
+complete EDTA free cocktail and 4 µl of Benzonase enzyme were added. The bacterial
+suspension was incubated 20 min on ice with agitation. Then, the cells were lysed twice by
+cell disruption (Constant System) at 1.4 kbar. 1mM β-mercaptoethanol was added to the
+solution. Here two different approaches were used for aIF6 and eIF6: i) the crude extract
+expressing aIF6 was incubated for 1 hour at 75◦C taking advantage of its heat resistance
+properties; ii) the eIF6 was rapidly brought to the next step to reduce the probability of
+proteolytic cleavage (see next paragraph). The soluble and insoluble fractions of aIF6 and eIF6
+were separated by ultra-centrifugation (1.5 h, 250000 g) for both preparations. The soluble
+part of the crude extract was then incubated with 3 ml Talon superflow Cobalt affinity resin
+(Clontech) previously equilibrated with lysis buffer; incubation was done at 4 °C for 1.5 h
+with gentle agitation. The resin was transferred to a column and washed successively with 10
+column volumes of wash solution (Appendix A, 1M NaCl) by gravity. The histidine tagged
+IF6 protein was then eluted from the resin using 8 volumes of elution buffer (Appendix A,
+250 mM imidazole), and collected in 1.5 ml fractions. Fractions were loaded on a denaturing
+gel to check for presence of the overexpressed IF6 protein.
+Fractions containing the protein were pooled and dialysed twice for 2 h against imidazole
+free, dialysis buffer (Appendix A). The protein concentration was determined by measuring
+the OD280 of the solution and thrombin was added (1 u per 150 µg of protein) to
+selectively cleave the N-terminal histidine tag of the protein. The cleavage step was done by
+incubation overnight (approx. 16 h) at room temperature, and stopped by addition of 0.2
+mM (final concentration) phenylmethylsulfonyl-fluoride (PMSF). The completeness of the
+proteolysis was checked by SDS-PAGE. The protein was concentrated to 10 mg/ml using an
+UltraFree (Millipore) ultrafiltration device (5 kDa membrane cutoff) prior to size exclusion
+50 experimental and simulated systems setup
+MW Clys Fractions
+Figure 12: Denaturing gel verification of overexpressed IF6 protein. Cell lysate shown as reference.
+chromatography. Gel filtration was performed using a Superdex-75 HR 10/30 (Pharmacia)
+column previously equilibrated in the protein storage buffer (appendix 1). Both OD280
+(optical density at 280nm) and OD260 were monitored during the chromatography to control
+the absence of nucleic acids and 500 µl fractions were collected. Peak fractions were pooled
+and concentrated a last time using a Centricon (Millipore) ultra-filtration device with a
+membrane cutoff of 10 kDa.
+poly-histidine tag The use of polyhistidine tags helped to obtain a considerable yield
+from the above protocol which allowed a reliable protein concentration to be maintained even
+for neutron scattering measurements in high pressure systems where a large solution volume
+is necessary. Nevertheless, for technical reasons the selective cleavage of this tag was not
+suitable for large volume solutions. For this reason, the cleavage procedure explained above
+was performed only on ambient pressure measurements where more convenient volumes
+could be used. As a consequence, this protocol must be considered as a first effort toward a
+more satisfactory procedure adapted to neutron scattering experiments.
+The presence of the histidine tag is not expected to have strong effects on protein structures,
+as proved by Carson and coworkers [23] on a wide set of crystallographic structures, but it
+could significantly affect the global protein dynamics. For this reason, as shown in Results,
+some supplemental tests have been performed to quantify the dynamical contribution of the
+tag in the case of a/eIF6.
+3.1 sample production 51
+cleavage of carboxyl-terminal tail in eif6 During some preliminary tests for
+protocol optimization, a proteolytic cleavage of the eIF6 protein was observed (see Figure 13
+for the corresponding SDS-PAGE verification), both in the soluble and in the insoluble fractions
+of the cell lysates.
+Figure 13: SDS-PAGE verification of partial cleavage in eIF6 samples. Cell lysate shown as reference.
+Due to its apparent small molecular weight, the cleaved fragment detected in this work
+was supposed to be the same found by Groft and coworkers [66]. The latter reported that
+attempts to express and purify S.cerevisiae eIF6 were complicated by proteolytic cleavage of
+the divergent C-terminus. They also remarked that truncation beyond residue 224 eliminated
+this problem, and eIF6(1-224) could be purified using the same aIF6 purification scheme.
+Interestingly, the cleaved part of eIF6 contained a tail made of 21 amino acids, with sequence
+shown in Table 7, which can be found only in eukaryotic homologues of IF6 and very little is
+known about its structure.
+A preliminary characterization of the fragment was performed by means of the Basic
+Local Alignment Search Tool (BLAST) which compares the amino acid sequence of the
+fragment against sequence databases in order to find some similarities with other known
+proteins. For eIF6, the only significant scores were obtained from other IF6 homologues
+meaning that this sequence fragment must be strictly peculiar for the function of this class of
+52 experimental and simulated systems setup
+Table 7: Sequence of the C-terminal fragment of eIF6 (CTAIL). Numbers of residues start at 225,
+according to the sequence in eIF6.
+Glu225 Asp226 Ala227 Gln228 Pro229 Glu230 Ser231 Ile232
+Ser233 Gly234 Asn235 Leu236 Arg237 Asp238 Thr239 Leu240
+Ile241 Glu242 Thr243 Tyr244 Ser245
+initiation factor or of its evolutionary history.
+In order to obtain more insights into the native conformation of this C-terminal tail, a test of
+secondary structure prediction was performed with two distinct methods:
+- PSIPRED server [101], which performs structure predictions based on position-specific
+scoring matrices
+- APSSP2 server [156], which predicts secondary structure conformations using nearest
+neighbor and neural network approaches.
+Both methods found a reasonably probable formation of an α-helix in the ending part
+of the fragment, in the region Asp238 Thr239 Leu240 Ile241. These results are also
+corroborated by the inspection of the hydrophobic profile of the fragment with the help of
+the Kyte/Doolittle hydrophilicity scale [122] which shows an increasing hydrophobicity in
+the regions Pro229-Ser231 and Asp238-Glu242.
+These results lead to the conviction that the fragment could have a significant role either
+in dynamics or structure stability of eIF6 and thus also in protein function. This idea is
+supported by recent results which indicate that C-terminal subdomains contribute to the
+localization in the cellular nucleus of eIF6 [6].
+This outcome suggested the importance of maintaining the 21-residue C-terminal fragment as part
+of the investigated sample. For this purpose, several tests on the production of eIF6 were
+performed in order to limit the proteolytic cleavage during the production itself without
+effect on the total final yield.
+The protocol presented here gave the best results with a cleavage reduced to around 30%
+as resulted from the preliminary MALDI mass spectrometry analysis reported in Figure 14
+where two large peaks are evident at molecular weights equal to both the entire protein and
+the truncated structure (1-224). The height of these peaks gives an estimation of the relative
+3.1 sample production 53
+Voyager Spec #1=>BC=>NF0.7=>SM21[BP = 28472.8, 442]
+28469.98
+100
+90
+80
+8667.46
+70
+60
+10648.91 28654.25
+50
+14238.52
+40 16653.33
+11525.53
+8246.39
+30 10141.64 14332.58 27129.39
+28870.80
+20 13561.33 27269.91
+10
+0
+7999.0 13399.4 18799.8 24200.2 29600.6
+Mass (m/z)
+Figure 14: MALDI-MS assay on eIF6 solution.
+amount in solution.
+stability of eif6 When performing studies on the effects of extreme conditions on
+protein structure and dynamics it is important to know beforehand the boundaries which
+define the normal conditions for the specific protein of interest.
+Nevertheless, in the case of IF6 homologues, there is a scarcity of works on the general
+chemical properties with respect to temperature and pressure changes. Although aIF6 is
+presumably able to reversibly respond to high temperature and high pressure values, very
+little can be said about the eIF6. In an early paper on biological properties of eIF6, Valenzuela
+and coworkers [199] reported that anti-association factor 6 from calf liver was found to
+undergo a cessation of its activity at temperature of ∼ 60◦C. As the inactivation of a protein
+function may not correspond to the total and irreversible denaturation of the protein itself,
+the latter was tested here by means of dynamic light scattering measurements in the range of
+interest of the present work. The measurements of the hydrodynamic radius of eIF6 were
+performed with a DynaPro-Titan© fixed-angle light scattering system. The results, listed
+in Table 8, show that, at 50 °C, eIF6 forms aggregates or partially unfolds. Moreover, when
+brought back to 30◦C it does not find its initial state, suggesting that the transition is not
+reversible.
+These preliminary results together with the outcome of the work made by Valenzuela and
+% Intensity
+54 experimental and simulated systems setup
+coworkers, suggested limiting all neutron scattering experiments on eIF6 to the non-
+denaturing temperature range. However, as explained in the next sections, some in silico
+experiments have been performed on eIF6 also at high temperature and high pressure
+to verify the presence or more simply the beginning of a denaturing process. It is also
+worth noting that the reported values of hydrodynamic radius for eIF6 at 20◦C correspond
+only to an effective value due to a spherical approximation of the whole protein structure:
+the conserved pseudo-globular part formed by residues 1-224 and the C-terminal tail of 21
+amino acids.
+Table 8: Variation of the hydrodynamic radius of eukaryotic eIF6
+20◦C 30◦C 50 ◦C back to 30 ◦C
+RH [nm] 3.32 3.61 29.76 24.23
+final samples For both aIF6 and eIF6, deuterated protein solutions were prepared at a
+concentration of ∼ 40mg/ml and pD ∼ 7.0. All labile hydrogen atoms in the samples were
+exchanged overnight by dialysis and then filtered with an Amicon Filter Ultra (membrane
+cutoff 5kDa) against a thirty-fold excess of pure deuterated solvent. The final solution was
+centrifuged to eliminate possible aggregates. The final concentration was measured by
+UV-VIS absorption at 280nm. The latter measurement gave results with a possible systematic
+error greater than 10% due to the very low amount of chromophore amino acids (such as
+tryptophan, tyrosine, phenylalanine and histidine) in the sequence of both proteins. Although
+the limits for solution concentration of both samples were not known from literature, several
+preliminary DLS assays seemed to support the observation of monodisperse solutions of eIF6
+around 40mg/ml.
+3.2 neutron scattering measurements setup
+In this work the reported measurements of neutron scattering spectra were performed in
+order to investigate the effects of the pressure and temperature changes on the dynamics of
+3.2 neutron scattering measurements setup 55
+proteins. For quasielastic neutron scattering experiments (QENS), the easiest way to apply
+pressure to a biological sample is to put it in a liquid solution and then compress the
+volume in which it is contained. This is usually done in sample containers with a cylindrical
+geometry. In this work, two different sample containers of this shape have been used for
+the measurements at ambient and higher pressure, respectively. The relatively wide range
+of temperature values, explored in measurements, imposed for both sample containers, the
+choice of materials which do not undergo significant structural changes at high temperature
+that could modify, for example, their mechanical resistance.
+Moreover, when performing QENS experiments on samples in solution, one often needs
+to use high concentrations to maintain the signal due to the sample itself significantly
+distinguishable from the one coming from the buffer. For biological macromolecules this fixes
+a constraint to the total solution volume used in the experiment as the biological samples
+are often available in small quantity mainly due to expression protocols yields. In the case of
+a/eIF6, although the protocol presented in the previous section was conceived to obtain a
+maximum amount of samples, this was still a limiting factor for the total volume available for
+measurements. For this reason the sample containers used in this work were also chosen for
+their effective volume.
+Ambient pressure An approximate scheme of the sample container used for these
+measurements is shown in Figure 15 (panel A). The container is made of two concentric
+hollow aluminum cylinders with a diameter of 19mm and 20mm, respectively. The irradiated
+region was ∼ 50mm in height. The space between the walls of the two cylinders was
+filled by the samples and closed on the top by a disc made of Teflon© in order to prevent
+the sample from leaving the space due to capillary effects. The Teflon© cap was supposed
+to be out of the irradiated region. The total volume available for samples was limited to 1.2ml.
+High pressure The pressure cell was developed at the Institut Laue Langevin in Grenoble
+(France) and was conceived to carry out experiments on liquid solutions at moderate high
+pressure. In particular the dimensions of the cylindrical geometry were determined to
+withstand pressure up to 2kbar: internal diameter of 10mm and wall thickness of 1.5mm. The
+global geometry of the cell, shown in Figure 15 (panel B), was inspired by another one
+previously used for high pressure studies on lysozyme and reported in [20].
+In contrast to the latter, however, here the pressure is applied without transmitting media
+and directly on the sample which is compressed by a pump connected to the pressure cell by
+a very thin capillary (0.1mm diameter). Moreover, the irradiated part of the cell was made of
+56 experimental and simulated systems setup
+Figure 15: Sample can for high pressure measurements
+an alloy of copper-beryllium which permitted the wall thickness to be significantly reduced
+without affecting its mechanical resistance. In order to reduce the multiple scattering due to
+the protein solution an insert with a diameter of 9 mm was used. As a whole the pressure
+system required a total volume of ∼ 3ml of protein solution which is considerably smaller
+than the volume commonly used in this type of QENS experiments and suitable for the
+typical amount of a/eIF6 production yields.
+instrumental resolution The QENS measurements reported in this thesis have
+been performed mainly to investigate the internal dynamics of proteins. For this purpose
+it was important to filter out of the quasielastic spectra all other contributions coming for
+example from the global translation and rotation of proteins in solution. The standard method
+to accomplish this task is the choice of an adequate experimental energy resolution which
+should be larger than the width HWHM (half-width at half-maximum) of quasielastic signal
+due to global motions. The energy width of the latter can be estimated from knowledge of
+the translational and rotational diffusion constant of the protein. Unfortunately in the case
+3.2 neutron scattering measurements setup 57
+of a/eIF6 no reference can be found in literature and these values could only be estimated
+from the available crystallographic structures. Nevertheless, as reported in Results, some a
+posteriori finer estimations have been made by means of molecular dynamics simulations.
+The values obtained for the conserved structure (residues 1-224) in aIF6 and eIF6 were around
+$8.4 \cdot 10^{-3}$ Å$^2$/ps which correspond, in terms of HWHM, to an energy width of 20 µeV for
+a value of $q_{el} = 1$ Å$^{-1}$. This result should be however corrected by a factor 0.20 due to the
+higher viscosity of D2O with respect to that of H2O. The experimental resolution chosen for
+measurements at the spectrometers FOCUS (Paul Scherrer Institut) and IN6 (Institut Laue
+Langevin) reported with other experimental settings in Table 9, was not sufficient to totally
+eliminate the effects of global motions to the protein spectrum but was enough to significantly
+reduce it with respect to the quasielastic signal corresponding to internal diffusive motions.
+In this discussion only the translational diffusion constant was taken into account. To estimate
+the influence of rotational diffusion on the measured QENS spectra the following formula for
+the diffusion constant for rotational diffusion [36] was used:
+\begin{equation}
+\gamma_r = \frac{k_B T}{4\pi\eta R_H^3}. \tag{3.1}
+\end{equation}
+The above relation is used assuming that the approximation of eIF6 as a spherical-shaped
+protein is reliable1. Here RH is the radius of the protein and η is the shear viscosity of
+the solvent (water). For a/eIF6, which has a radius of RH = 2.81 nm, one obtains γr =
+$0.14 \cdot 10^{8}$ s$^{-1}$ at T = 293 K. This corresponds to a width of $6 \cdot 10^{-5}$ meV, which is far below the
+instrumental resolution. Therefore, spectral contributions from the global rotational diffusion
+are expected to be largely within the chosen energy resolutions.
+Table 9: Instrumental settings used in this work.
+Incident wavelength Energy resolution Sample environment Time per run
+[Å] HWHM [meV] [hours]
+FOCUS 5.92 ∼ 0.020 ambient pressure 15
+IN6 5.98 ∼ 0.020 high pressure ∼ 10
+1 In the Results, I will show that a better approximation of IF6’s shape can be given by the Perrin correction to
+Stokes’ law for the diffusion of a sphere. This refinement will not, however, change the considerations made here.
+58 experimental and simulated systems setup
+3.2.1 Data analysis
+The usual procedure for the analysis of data from neutron scattering measurements is
+preceded by some preliminary steps, as follows:
+- Normalization to the total number of incident neutrons during a single measurement.
+This normalization is needed to account for the differences in time length and in incident
+neutron flux for each measurement
+- Correction for the detector efficiencies. It is performed in two steps. Firstly by the
+normalization to the spectrum of vanadium performed with the same experimental
+environment which corrects for relative efficiencies of detectors with respect to each
+other. Secondly a correction is made with respect to the energy dependent efficiency of
+detectors. A vanadium spectrum is used for the first calibration because it is a completely
+elastic incoherent scatterer in the range of q of interest in time-of-flight experiments.
+- Grouping of spectra over angles is made to increase the statistics related to data.
+The latter procedure was crucial because the signal-to-noise ratio in measurements of
+biological samples in solution is usually very low.
+In QENS measurements on protein solutions, the detected signal does not come exclusively
+from the protein but shows also significant contribution from the bulk solvent and from
+the sample environment, like for example, the sample containers and background noise.
+The spurious contributions are usually subtracted from the total signal to obtain scattering
+functions related only to the protein dynamics. This procedure can be summarized by the
+following relation:
+$$\tilde{S}_{\mathrm{protein}}(q,\omega) = \left(S_S(q,\omega) - \tau\, S_E(q,\omega)\right) - (1-\alpha)\left(S_B(q,\omega) - \tau\, S_E(q,\omega)\right) \qquad (3.2)$$
+where τ takes into account the transmission of the protein solution2 and α is the volume
+fraction of the protein and its first hydration shell in the solution sample. The latter must be
+known to apply a correct subtraction of solvent contribution in protein solution spectra.
+The parameter α was estimated from the following relation between the mass density of
+proteins and their molecular weight $M$ (in kDa) [54]:
+$$\rho(M)\,[\mathrm{g/cm^3}] = 1.41 + 0.145 \cdot \exp\left(-\frac{M(\mathrm{kDa})}{13}\right) \qquad (3.3)$$
+2 Through out this thesis the transmission of the protein solution was approximated to the one of the buffer alone
+3.3 molecular dynamics setups 59
+For a/eIF6 one obtains ρ = 1.43g/cm3, which gives a specific volume ν = 0.70cm3prot /g.
+Multiplying by the estimated concentration of 40mg/ml one has the volume fraction α =
+0.028. The hydration shell needs to be included as part of the protein because the dynamics
+of water molecules in this shell is different from the one of bulk water due to the weak
+interactions occurring between the protein and solvent molecules.
+Gerstein and Chothia [63] showed that hydration water volume is equal to 24 Å3 which
+means it is 20% smaller than the volume of bulk water. Hence, the increase of protein specific
+volume due to its first hydration shell can be estimated as follows:
+ν = νprot + νshellN
+where N is the number of protein molecules in the unit volume and
+νshell = rshell ·Awater
+In the above equation rshell represents the radius of the spheres with the same volume of
+water molecules in the first hydration shell and Awater is the surface area of the protein
+accessible to solvent molecules with radius rshell. For lack of more precise estimations, in the
+case of IF6, the value of νshell was approximated with the Solvent Accessible Surface Area
+(SASA) calculated on the crystallographic structure of aIF6. The obtained value corresponds
+to a hydration layer composed by approximately 850 water molecules per protein molecule.
+Hence, the final volume fraction α was found equal to 0.04.
+As stated at the end of the previous section, the measurement of the protein concentration
+in the final samples was made very difficult by the poor UV-VIS absorption of a/eIF6. As
+a consequence, all values obtained from the considerations made above, which are strictly
+dependent on the knowledge of the real protein concentration, have to be considered here as
+strong approximations and they will be used only as references in the Results.
+3.3 molecular dynamics setups
+We performed all the stages of the molecular dynamics simulations using the AMBER9
+simulation code[27]. The whole set of final simulations for both the homologues used the
+AMBER99SB force field [86]. The latter is an upgraded version of the AMBER94 force field,
+usually used for protein molecular dynamics, and it contains a reparametrization of the back-
+60 experimental and simulated systems setup
+bone torsion terms and achieves a better balance of the different secondary structure elements.
+3.3.1 System Setup
+aIF6
+The initial configuration of the IF6 protein issued from the M.Jannaschii was taken from a
+crystal structure with a refined resolution of 1.30 Å(available from the Protein DataBank with
+the code: 1G61)[66] together with all the water molecules found within a distance of 2nm
+from the protein center of mass in the crystallographic data. The coordinates of the missing
+hydrogen atoms were added using the algorithms implemented in the LEaP program from
+the AMBER9 package.
+The protein was placed in an orthorhombic periodic box filled with water molecules
+parametrized as TIP3P. The crystallographic water represented by oxygen atoms, within a
+distance of 2nm from the protein center of mass, were replaced by the same type of water
+molecule models. The final total amount of water molecules was 8136. The whole system
+includes also 14 sodium (Na+) counterions in order to obtain a neutral global charge for the
+Ewald calculations.
+The whole system was initially minimized in two steps with combined use of steepest-
+descent and conjugated-gradient algorithms: i) 200 cycles of conjugated-gradient after 4 steps
+of steepest-descent with position restraint on protein atoms and counter ions; ii) 200 cycles
+of conjugated-gradient after 4 steps of steepest-descent for the whole system without restraint.
+As a preliminary step of the real molecular dynamics simulation, we first performed
+a system equilibration step in which the simulated system attained a stable equilibrium
+conformation compatible with the environmental constraints, i.e. constant pressure and
+temperature. For this purpose, a short simulation of 150ps in a NVT ensemble, i.e. with
+fixed total volume and temperature kept equal to 300K was performed, followed by a 700ps
+long simulation in the final NPT ensemble, with T = 300K and P = 1bar. In all simulations
+performed in this work the time-step used for the integration of motion equation was equal
+to ∆t = 0.001ps = 1fs (fs is femto-seconds). The equilibration in the NVT ensemble was
+made with the calculation of the contribution of the forces slowly-varying in space only every
+3.3 molecular dynamics setups 61
+two steps, resulting in a shorter CPU-time without significant changes in the total energy of
+the system.
+From the equilibration at 300K and 1bar all other simulations branched to other NPT
+conditions of interest. In every case the equilibration steps were followed by production
+simulations of length equal to 2ns which was used for the calculation of dynamical properties
+of the system itself.
+In each simulation the control of temperature was performed with a Langevin thermostat3
+with a collision rate of 3.5ps−1, whereas pressure was constrained by a Berendsen barostat
+with relaxation time τp = 1.5ps.
+3.3.2 eIF6
+The initial configuration of the IF6 protein issued from the S.cerevisiae was taken from a
+crystal structure with a refined resolution of 2.5 Å(available from the Protein DataBank with
+the code: 1G62)[66]. Nevertheless, the crystallographic data contained in the original PDB
+file did not give the atom positions of the 21 amino acids long C-terminal tail which was
+not crystallized with the rest of the proteolytic cleavage protein because of the structural
+instability that was encountered in this work during the sample production, as mentioned in
+Section 3.1.1. The presence of this tail, even though it does not seem to influence the function
+of eIF6 [66], certainly has some effects on protein mobility [6].
+The construction of the complete structure of eIF6 required some supplementary steps with
+respect to the case of aIF6. Firstly the structure of the C-terminal tail (CTAIL, in the following)
+was modeled and partially folded. Secondly the complete structure was assembled and
+equilibrated to an appropriate equilibrium state.
+Both steps of this preliminary procedure were performed by means of molecular dynamics
+simulations with implicit solvent in order to significantly reduce the CPU-time [198]. This
+method consists of the substitution of the explicit calculation of the dynamics of solvent
+molecules -usually very time-consuming - with an additional mean forces term in the protein
+force-field which should take account of all solvent effects on the protein. This approach
+3 The chosen collision rate for Langevin thermostat did not produce artifacts on IF6 dynamics as verified
+by comparison of effective friction constant calculated from NPT ensemble with the one obtained from a
+NVE (constant energy) simulation of the same system. Friction constant was estimated by memory function
+calculation[118].
+62 experimental and simulated systems setup
+clearly contains some strong approximations and it does not always give the right description
+of dynamics if compared with explicit solvent calculations [146] but it is however a valuable
+tool to rapidly explore the configuration space of large systems in order to find an appropriate
+equilibrium state. The implicit solvent model used throughout this thesis was the pairwise
+Generalized Born solvation model (GB), developed by Hawkins and coworkers [70, 71],
+where mean forces are obtained from the estimation of the total solvation free energy of the
+molecule into water. A complete description of the method can be found in many textbooks
+on methods in computational physics and biology [12].
+ctail folding Here a brief summary of the protocol used for the modeling and the
+initial folding of CTAIL is reported. The whole procedure was performed using the LEaP and
+Sander programs from the AMBER9 package.
+. A "linear" configuration was firstly created for the polypeptide with sequence shown in
+Table 7.
+. Initial folding of the linear structure was then performed in a NVT ensemble with the pro-
+tocol for the temperature re-scaling shown in Table 10. The time step for the integration
+of equation of motion was varied between 0.1 and 0.5 fs, in order to reduce the extent
+of force variation and thus the probability of unnatural atom contacts which would
+prevent the CTAIL from folding correctly.
+Table 10: Temperature re-scaling protocol used for the initial folding of CTAIL
+Total time Partial time Initial T Final T time step
+[ps] [ps] Kelvin Kelvin [fs]
+10 10 0 50 0.1
+260 250 50 100 0.5
+510 250 100 150 0.5
+560 50 150 200 0.5
+610 50 200 250 0.5
+660 50 250 300 0.5
+3.3 molecular dynamics setups 63
+. The final step of this procedure was a very long equilibration simulation in which the
+protein fragment could fold. The total time length of this simulation was ∼ 40ns. A
+shorter simulation with explicit solvent was also performed to verify the absence of
+solvent-specific effects in CTAIL folding.
+Interestingly, the final folded structure of CTAIL, shown in Figure 16 (Panel A), contains a
+small helix in the region 14-18 whose shape is similar to an α-type. The inclusion of this helix
+into the protein sequence corresponds to the one found in Section 3.1.1 by means of structure
+prediction and hydrophobic arguments.
+Figure 16: Modeling of CTAIL in implicit solvent. Panel A shows structure folded without constraints.
+Panel B: structure folded with a position restraint in amino-terminus. Color scheme: purple
+for α-helix, blue for 310-helix, cyan for turns and white for random coil.
+It is worth noting that the folded configuration obtained here might not correspond to the
+one that CTAIL would reach when folded together with the rest of the protein sequence. For
+this reason, the same procedure was repeated with the amino-terminal position fixed in space
+by a harmonic force, F = −Kx, with K = 10 kcal mol−1 Å−2 . The resulting final structure
+was compared with the previous one in order to better understand the effects of the spatial
+constraints in the folding pathways. The resulting structure after a total simulation time of
+40ns is shown in Figure 16 (Panel B). Inspection by eye reveals that secondary and tertiary
+structures are slightly different. This comparison indicates that CTAIL folding is very sensitive
+64 experimental and simulated systems setup
+to the number of degrees of freedom available for its three-dimensional configurations.
+modeling of eif6’s complete structure The above paragraph showed the
+importance of an ultimate verification of the actual conformations of CTAIL when the latter is
+joined to the rest of the protein. A complete study on this subject would be out of the scope
+of this thesis and would need a more exhaustive simulation of folding of the whole protein.
+Here I would like to focus on more qualitative considerations about the effects induced on
+the rest of the eIF6 structure by the presence of CTAIL. For this purpose, in the following it
+will be supposed that the conserved region of aIF6 and eIF6 (residues 1-224) does not attain a
+different fold in the presence of CTAIL. This assumption seems to be confirmed as reliable by
+homology modeling study of different homologues of IF6 from a wide range of different
+organisms [66].
+On these bases, another molecular dynamics simulation with implicit solvent was
+performed on the system composed by CTAIL directly joined to the rest of "already-folded"
+eIF6 structure. The initial configuration used for this simulation was composed by CTAIL
+folded through the procedure described above and the crystallographic structure of eIF6.
+The binding of the two subunits of the system was performed by the creation of the peptide
+bond between the carbon atom in the C-terminus of the residue 224 and the nitrogen atom
+in the N-terminus of CTAIL. The latter structure was then minimized with restraints in
+atom positions in residues from 1 to 200 and with fixed hydrogen covalent bond-length (the
+SHAKE algorithm[35] for rigid molecule dynamics was used here). The procedure consisted
+of 900 steps of minimization using the steepest-descent gradient method followed by 1100
+steps performed with the conjugated-gradient algorithm.
+The energy minimization was followed by a short equilibration run of molecular dynamics
+(30ps) in a NVT ensemble, i.e. with constant volume and temperature. The Langevin
+thermostat was used to keep temperature constant. Here, in order to significantly improve the
+thermal coupling between the system and the thermostat, a very high friction constant value
+(γ = 500 ps−1) was used. A short time step (∆t = 0.5 fs) for the Leapfrog integrator was used in order to
+avoid improper fluctuations of potential energy which would result in total energy divergence.
+Local optimization of the protein conformation found through the previous steps, was
+performed using the simulated annealing method which consists, as for the real annealing of
+3.3 molecular dynamics setups 65
+matter, in a sequence of heating and cooling phases. This method, which is commonly used
+for finding the global minimum of potential surfaces in the case of small molecules, was
+shown to not be reliable for systems with a broad distribution of energy scales. Nevertheless,
+several works demonstrated that it remains a very useful method for local optimization of
+the conformations of larger molecules, such as proteins, because unlike minimization methods, it is
+able to locate local minima even far away from the initial conformation[208]. The sequence of
+annealing steps used in this work is shown in Table 11 and was performed with the same
+parameters settings as the previous equilibration step.
+Table 11: Simulated Annealing of eIF6’s complete structure
+Total time Partial time Initial T Final T time step
+[ps] [ps] Kelvin Kelvin [fs]
+50 50 300 400 0.5
+100 50 400 400 0.5
+150 50 400 500 0.5
+200 50 500 500 0.5
+250 50 500 300 0.5
+300 50 300 300 0.5
+Figure 18 shows the time evolution of RMSD for the region 1-224 (hydrogens not taken
+into account) with respect to the initial equilibrated conformation, expressed as a function of
+time by the relation:
+$$\mathrm{RMSD}(t) = \sqrt{\frac{\sum_{i=1}^{N} \left(R_i(t) - R_i(0)\right)^2}{N}} \qquad (3.4)$$
+where Ri(t) represents the position vector of the atom i at time t. In the same figure the
+evolution of total potential energy during the simulated annealing is shown. Both results give
+evidence of a new conformation far from the initial one and with a slightly lower energy. The
+final structure is shown in Figure 17.
+It is worth noting that, after minimization and simulated annealing, the root-mean-square-
+deviation of the eIF6 backbone in region 1-224 with respect to the original crystallographic
+66 experimental and simulated systems setup
+Figure 17: Final structure issued from the minimization and simulated annealing procedures.
+structure is however small (1.5Å), meaning that, although the core region of eIF6 moved away
+from its initial minimum, its global arrangement is not significantly changed by the presence
+of CTAIL, at least on the time scale explored here.
+The structure resulting from the sequence of procedures discussed above, was used as
+initial structure for molecular dynamics simulations performed with explicit solvent and
+with the same protocol used in the case of aIF6.
+supplemental samples In order to compare results from molecular simulations with
+the experimental measurements and to obtain more insights into the dynamical and structural
+effects of CTAIL, two other samples were modeled and analyzed (they are reported here with
+the short names used through out this thesis to refer to them):
+. eIF6-NoCTAIL: the eIF6 simulated without the attached CTAIL. The crystallographic
+structure was used as initial configuration after a preliminary step of minimization to
+let it attain an equilibrium conformation compatible with the buffer environment. Due
+to the low resolution of x-ray data, no crystallographic water was found in the initial
+PDB file. All buffer molecules were modeled as made for aIF6.
+3.3 molecular dynamics setups 67
+Figure 18: Time evolution of RMSD for the region 1-224. Insert: evolution of potential energy of
+the whole protein during the annealing procedure. Both quantities use the previously
+equilibrated conformation as reference (see text for more details).
+. aIF6-htagged: As explained in Section 3.1.1, for technical reasons due to the specific experi-
+mental setup, high pressure measurements were performed on samples produced with
+a specific tag of six consecutive histidines (His-tag) which significantly improved the
+yield of the production protocol. In order to compare these measurements with those
+obtained from molecular dynamics, the structure of aIF6 complexed with the His-tag
+was modeled following the same procedure used for the global structure of eIF6.
+Both samples were simulated following the protocol used for aIF6 and eIF6.
+
+4
+CHARACTERIZATION OF PROTEIN STRUCTURE
+In the next chapters a new method for the characterization of protein secondary structure
+will be presented. The development of this method, called ScrewFit, was inspired by the task
+of finely characterizing the environmental effects on protein structures.
+ScrewFit was then found to be able to make precise assessments on protein secondary
+structure motifs and also to find local and global structural effects induced by ligand binding.
+The text proposed here has been already published or is under review as scientific articles
+in international peer-reviewed journals. The original text is reprinted here together with
+supplemental data and notes at the end of each article.
+Next chapters formerly appeared as the following scientific articles:
+Kneller, G.R. and Calligari, P. Efficient characterization of protein secondary structure in
+terms of screw motions. Acta Crystallographica D, 62, 302-311 (2006).
+Calligari, P. and Kneller G.R., ScrewFit: a novel approach for continuum protein secondary
+assessments. Submitted (2008).
+Another application of the method ScrewFit can be found in:
+Calligari, P. et al., Inhibition of viral group-1 and group-2 neuraminidases by oseltamivir:
+a comparative structural analysis by the ScrewFit algorithm. Biophysical Chemistry,
+accepted for publication (2008).
+69
+
+5
+EFFICIENT CHARACTERISATION OF PROTEIN SECONDARY
+STRUCTURE IN TERMS OF SCREW MOTIONS
+We present a simple and efficient method to describe the secondary structure of proteins in
+terms of orientational distances between consecutive peptide planes and local helix parame-
+ters. The method uses quaternion-based superposition fits of the protein peptide planes in
+conjunction with Chasles’ theorem, which states that any rigid body displacement can be
+described by a screw motion. From the best superposition of consecutive peptide planes we
+derive the helix parameters, and the “worst” fit is used to define the orientational distance.
+Applications are shown for standard secondary structure motifs of peptide chains, for some
+proteins belonging to different fold classes, and for a description of structural changes in
+lysozyme under hydrostatic pressure. In the latter case we use published reference data which
+have been obtained by X-ray crystallography and by structural NMR measurements.
+71
+72 efficient characterisation of protein secondary structure in terms of screw motions
+5.1 introduction
+The determination and characterisation of protein secondary structure is a fundamental
+task in molecular biology, crystallography and in simulation studies. In many situations
+arises the necessity to quantify in particular structural changes of a protein, which are due
+to a change of its environment. The influence of temperature or pressure on the fold of a
+protein is a typical example. Standard motifs in protein secondary structure are traditionally
+described in terms of two torsional angles, φ and ψ, per residue, which define for each
+Cα-atom the rotation of the left and right peptide plane about the N−Cα and Cα −C
+bond, respectively [187]. In the past different methods have been developed to determine
+secondary structure elements [106, 163, 57, 190] and to describe their geometry in more
+detail [9, 181, 194]. A rigorous mathematical description of protein secondary structure
+can be obtained by applying the theory of screw motions, where the winding of the protein
+backbone is described in terms of local helix parameters. The theory of screw motions goes
+back to the mathematician M. Chasles [32, 33], and a useful recent introduction can be found
+in the book by Selig [176]. In a recent paper, Quine [155] uses screw motion theory and
+constructs local helix parameters for a protein from the torsion angles φ and ψ. An important
+step is the introduction of quaternions which can be related to the (φ,ψ)-angles on one hand,
+and to the rotation/helix axis on the other hand.
+In this article we present an efficient method for the characterisation of protein secondary
+structure, which is based on quaternion superposition fits of consecutive peptide planes.
+From the resulting quaternion parameters we construct the local helix geometry of the protein
+backbone, and we show that the superposition method may also be used to define a scalar
+measure for the orientational distance between consecutive peptide planes. The latter allows
+to distinguish between all common secondary structure motifs, such as different helix types
+and β-strands, except for handedness.
+In the following section the method is briefly explained and applications are presented in
+Section 5.3. The first one concerns an illustration for simple model structures, such as right-
+and left-handed α-helices and β-strands. We show then how our method works for proteins
+which fall into different fold classes, and discuss finally in more detail how it can be used
+to quantify changes in the secondary structure of lysozyme which are caused by external
+pressure. For this purpose we use published reference structures which have been obtained
+from X-ray crystallography and from structural NMR measurements. The essential results are
+summarised and discussed in Section 5.4. In the Appendix we recall the essential properties
+5.2 method 73
+of quaternions and give a short constructive proof of Chasles’ theorem, which demonstrates
+the usefulness of quaternion calculus.
+5.2 method
+As stated in the introduction, our method for the description of protein secondary structure
+relies on quaternion-based superposition fits of molecular structures. The method is well
+established, and we refer to articles by Kearsley [111] and by Kneller [115] for details. Here
+we use that the quaternion method does not only yield the “best” fit, from which local helix
+parameters describing the winding of the protein backbone can be constructed, but also the
+“worst” fit, from which an orientational distance measure can be derived.
+5.2.1 Quaternion superposition fits
+Suppose that $\{\vec r_\alpha\}$ and $\{\vec r\,'_\alpha\}$ are two sets of vectors describing the positions of atoms repre-
+senting equivalent molecular structures A and B, respectively. Both structures contain the
+same number of atoms and are somehow placed in space. A rigid-body displacement A→ B
+can be defined as an optimisation problem, where structure A is fitted onto structure B in a
+least squares sense. In case that both structures are identical, the resulting fit error will be
+zero. One starts by constructing the translation vector $\vec t = \vec R\,'_c - \vec R_c$ connecting the two centres
+of rotation, C and C ′, which are to be chosen in the same way for A and B, and computes
+the coordinate sets $\{x_\alpha\}$ and $\{x'_\alpha\}$ containing the relative atomic positions to the respective
+rotation centres. Here and in the following the prime refers to the target structure B. The
+optimal rotation is obtained by minimising the target function
+$$m(q) = \sum_{\alpha=1}^{N} w_\alpha \left(D \cdot x_\alpha - x'_\alpha\right)^2 \qquad (5.1)$$
+with respect to a set of angular variables which parametrise the orthogonal rotation matrix
+D. Each atom is assigned a positive weight $w_\alpha$, with $\sum_\alpha w_\alpha = 1$. A convenient set of
+angular variables are normalised (real) quaternion parameters, $q \equiv \{q_0,q_1,q_2,q_3\}$, with
+$q_0^2 + q_1^2 + q_2^2 + q_3^2 = 1$. In this case D takes the form [4]
+$$D(q) = \begin{pmatrix} q_0^2+q_1^2-q_2^2-q_3^2 & 2(-q_0q_3+q_1q_2) & 2(q_0q_2+q_1q_3) \\ 2(q_0q_3+q_1q_2) & q_0^2+q_2^2-q_1^2-q_3^2 & 2(-q_0q_1+q_2q_3) \\ 2(-q_0q_2+q_1q_3) & 2(q_0q_1+q_2q_3) & q_0^2+q_3^2-q_1^2-q_2^2 \end{pmatrix} \qquad (5.2)$$
+74 efficient characterisation of protein secondary structure in terms of screw motions
+and describes a proper rotation with det(D) = +1. Using the orthogonality of D, the target
+function m(q) can be written as a quadratic form in the quaternion parameters,
+$$m(q) = q^T \cdot M \cdot q, \qquad (5.3)$$
+where $q = (q_0,q_1,q_2,q_3)^T$ is a column vector and M is a positive semi-definite matrix. The
+superscript “T” denotes a transposition. The matrix M has the form [111, 115]
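+$$M = \sum_{\alpha=1}^{N} w_\alpha \begin{pmatrix} (x_\alpha - x'_\alpha)^2 & u_\alpha^T \\ u_\alpha & P_\alpha \end{pmatrix}, \qquad (5.4)$$
+where uα and Pα are given by
+$$u_\alpha = 2\, x_\alpha \wedge x'_\alpha, \qquad (5.5)$$
+$$P_\alpha = x_\alpha \cdot x'^{T}_\alpha + x'_\alpha \cdot x^{T}_\alpha. \qquad (5.6)$$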
+The minimization of m(q) with respect to the quaternion parameters must be performed
+with the side constraint qT · q = 1. Using the method of Lagrange multipliers one is led
+to the eigenvector problem
+M · q = λq. (5.7)
+Since $m(q) \geq 0$ the matrix M is positive semi-definite, and one obtains a set of four real eigen-
+values, $\{\lambda_j\}$, with $\lambda_j \geq 0$ ($j = 1, \ldots, 4$), and a set of corresponding orthonormal eigenvectors,
+$\{q_j\}$, with $q_j^T \cdot q_k = \delta_{jk}$. Here $\delta_{jk}$ is the Kronecker symbol. It follows from (5.3) and (5.7) that
+m(qj) = λj. (5.8)
+The eigenvalues are thus the residuals of the fit and can be ordered such that
+$$\lambda_1 \leq \lambda_2 < \lambda_3 \leq \lambda_4. \qquad (5.9)$$
+The quaternion corresponding to the smallest eigenvalue, λ1, is thus the solution for the
+optimal fit, and the quaternion parameters $q_1$ describe the relative orientation of $\{x'_\alpha\}$ with
+respect to {xα}.
+We note that one obtains two twofold degenerate eigenvalues if the structures to be
+superposed are linear. In this case one has [115]
+$$\lambda_{a,b} = \sum_\alpha w_\alpha \left( |x_\alpha|^2 + |x'_\alpha|^2 \mp 2|x_\alpha||x'_\alpha| \right), \qquad (5.10)$$
+5.2 method 75
+where a = 1, 2, b = 3, 4, and both the rotation leading to the minimum and maximum distance
+are not uniquely determined. Any normalized linear combination of the two eigenvectors
+associated with λa and λb, respectively, describes an equivalent rotation.
+The use of quaternion parameters is not only very convenient for finding a rigid-body
+transformation between two sets of coordinates, but the result can also be directly related to
+conventional representations of rotations. Here the following relation is of importance:
+$$q \equiv \begin{pmatrix} q_0 \\ q_v \end{pmatrix} = \begin{pmatrix} \cos(\phi/2) \\ \sin(\phi/2)\, n \end{pmatrix}. \qquad (5.11)$$
+From the scalar part of a quaternion, q0, one obtains thus directly the rotation angle and
+the rotation axis can be extracted from the vectorial part, qv. It should be noted that the
+transformation φ → φ+ 2π, which leaves the rotation matrix D(n,φ) invariant, leads to a
+global change in sign of the quaternion parameters. One verifies easily that q(n,φ+2π) = −q.
+The pair of quaternions {Q,−Q} is thus mapped onto the same rotation matrix D(q).
+5.2.2 Orientational distance
+The eigenvalue describing the “worst” superposition – λ4 according to the ordering scheme
+(5.9) – can be used to define an orientational distance between two molecular structures via
+$$\Delta\Omega = \sqrt{\frac{M_{11}}{\lambda_4}}. \qquad (5.12)$$
+Eq. (5.4) shows that the matrix element $M_{11}$ contains the squared Euclidean distance between
+the vector sets $\{\vec x_\alpha\}$ and $\{\vec x\,'_\alpha\}$, and therefore ∆Ω is the Euclidean distance normalised to its
+maximum possible value. Consequently,
+$$0 \leq \Delta\Omega \leq 1. \qquad (5.13)$$
+It is important to note that definition (5.12) yields a unique orientational distance of two
+linear molecular structures, whose relative orientation has no unique description in terms
+of angular variables. Supposing that |x ′α| = |xα| for α = 1, . . . ,N, we see from eq. (5.10) that
+for linear rigid bodies ∆Ω = 0 in the parallel configuration and ∆Ω = 1 in the anti-parallel
+configuration. We note here that λb, as given by eq. (5.10), is a strict upper limit for the
+Euclidean distance of two molecular structures in general [116].
+76 efficient characterisation of protein secondary structure in terms of screw motions
+5.2.3 Chasles’ theorem
+Let $r = (x,y,z)^T$ be a column vector containing the coordinates of a radius vector $\vec r = \overrightarrow{OP}$
+of a point P in a rigid body, where O is the origin of the coordinate system. An arbitrary
+rigid-body displacement is described by a rotation about a point C, which is not necessarily
+located inside the rigid body, and a subsequent translation. Let $R_c$ be the coordinates of
+the radius vector $\vec R_c = \overrightarrow{OC}$ and let t be the coordinates of the translation vector $\vec t = \overrightarrow{CC'}$,
+where C ′ is the centre of rotation after the translation. The coordinates of P after a rigid body
+displacement are then given by
+r ′ = Rc +D · (r−Rc) + t, (5.14)
+where D is an orthogonal 3× 3 matrix. In the following only proper rotations with det(D) =
++1 will be considered. If $n = (n_x, n_y, n_z)^T$ contains the components of the unit vector $\vec{n}$,
+pointing in the direction of the rotation axis, and φ is the angle of rotation, the corresponding
+rotation matrix can be written as
+D(n,φ) = P‖ + cos(φ)P⊥ + sin(φ)N, (5.15)
+where $P_\parallel = n \cdot n^T$ and $P_\perp = 1 - P_\parallel$ are, respectively, the projectors onto $\vec{n}$ and its complement,
+and N is the antisymmetric matrix
+$N = \begin{pmatrix} 0 & -n_z & n_y \\ n_z & 0 & -n_x \\ -n_y & n_x & 0 \end{pmatrix}$. (5.16)
+The theorem of Chasles states that one can find a reference point X, whose radius vector
+$\vec{R}_x = \overrightarrow{OX}$ has the coordinates $R_x$, such that
+r ′ = Rx +D(n,φ) · (r−Rx) +αn. (5.17)
+This coordinate transformation describes a screw motion, with translation α parallel to
+the axis of rotation. For the following considerations we introduce the difference vector
+$\vec{u} = \vec{R}_x - \vec{R}_c$. Equating relations (5.14) and (5.17) and using that n is an eigenvector of D, one
+finds that the coordinates of ~u satisfy the following set of linear equations
+(1 −D) · u = t⊥. (5.18)
+Here t⊥ = P⊥ · t. As shown in Section 5.5, the above equation has a linear manifold of
+solutions,
+u(λ) = u⊥ + λn, λ ∈ R, (5.19)
+5.3 applications 77
+where u⊥ is perpendicular to n and has the explicit form
+$u_\perp = \frac{1}{2}\left( t_\perp + \cot(\phi/2)\, n \wedge t \right)$. (5.20)
+In absolute coordinates the axis of the screw motion is given by
+Rx = Rc + u⊥ + λn, (5.21)
+and
+R⊥x = Rc + u⊥ (5.22)
+contains the coordinates of the radius vector $\vec{R}^\perp_x$ relating the origin with the point $X^\perp$ on the
+helix axis which is closest to the reference point C. In the following $X^\perp$ will be referred to
+as the centre of screw motion. The radius ρ of the corresponding screw motion is given by the
+Euclidean length of $\vec{u}_\perp$, since the latter is the vector pointing from $\vec{R}_c$ to $X^\perp$. Using (5.20) one
+finds
+$\rho = \frac{|t_\perp|}{2} \sqrt{1 + \cot^2(\phi/2)}$. (5.23)
+It should be noted that ρ diverges if φ is a multiple of 2π, corresponding to pure translations,
+and if $|t_\perp| \neq 0$.
+5.3 applications
+5.3.1 Screw motion description of protein main chains
+The method described above, which will be referred to as ScrewFit in the following, is now
+applied to define the local helical structure of polypeptides and proteins. The rigid bodies are
+here the triangles formed by the atoms {O,C,N} in the backbone of polypeptides – see Fig. 19
+– which define the so-called peptide planes. Here the C-atoms are the centres of rotation, and
+the translation vectors are thus the position differences between the C-atoms in consecutive
+amino acids, ti = RC(i+1) −RC(i). The quaternion parameters qi are obtained from the fit of
+the {O,C,N}-triangle of peptide bond i onto the one of peptide bond i+ 1. From each set of
+quaternion parameters the direction n~ of the rotation axis and the rotation angle φ can be
+computed from relation (6.4).
+The following parameters are used to define the local helix structure of a polypeptide:
+• The helix radius ρ defined in eq. (6.6).
+78 efficient characterisation of protein secondary structure in terms of screw motions
+• The number of amino acids per turn,
+$\tau = \frac{2\pi}{\phi}$. (5.24)
+• The pitch, which is defined as
+$p = |R^\perp_{x,i+1} - R^\perp_{x,i}|\, \tau$. (5.25)
+Here $\vec{R}^\perp_{x,i}$ is the radius vector pointing from the origin to the centre $X^\perp_i$ of the screw
+motion relating peptide plane i and peptide plane i+ 1.
+• The handedness, which is defined as the sign of the projection of the translation vector
+$\vec{t}_i$ onto the direction $\vec{n}_i$ of the local helix axis,
+$h = \mathrm{sign}(n_i^T \cdot t_i)$. (5.26)
+• The straightness parameter σ of the local helix axis. For residue i the latter is defined as
+$\sigma_i = \mu_i^T \cdot \mu_{i+1}$, (5.27)
+where
+$\mu_i = \frac{R^\perp_{x,i+1} - R^\perp_{x,i}}{|R^\perp_{x,i+1} - R^\perp_{x,i}|}$. (5.28)
+• The orientational distance between the peptide planes {O,C,N} in residues i and i+ 1,
+which is defined through relation (6.5).
+5.3.2 Model structures
+We apply ScrewFit first to well-known model structures for polypeptides which have been
+taken from the Image Library of Biological Macromolecules in Jena 1. Table 13 shows the
+corresponding local helix parameters which have been defined in the previous section. All
+model peptides are polyalanine molecules containing 10 residues, except for the extended
+conformation, which is represented by the alanine-tripeptide shown in Fig. 19. In all cases
+the N-terminus is the starting point of the respective polypeptide chain. In the context of our
+study all motifs are considered as helices, a β-strand being simply a thin left-handed helix
+with 2 amino acids per turn2.
+1 Institute-of-Molecular-Biotechnology-Jena:http://www.imb-jena.de/IMAGE.html
+2 See also note 5.6 at the end of this article.
+5.3 applications 79
+Figure 19: A tri-peptide with two peptide bonds in the extended conformation, where the symbol “R”
+stands for non-specified side-chains. The screw motion relating the yellow triangles formed
+by the {O,C,N} atoms of the peptide planes defines the local helix which is schematically
+represented by the cylinder in purple and the corresponding screw arrow. The radius of the
+cylinder corresponds to the radius of the screw motion.
+Table 12: Helix parameters for different model structures. Here ρ is the helix radius with the C-atom
+of the peptide plane on the helix surface, $\rho_{C\alpha}$ is the corresponding radius if the C-atom is
+replaced by the Cα-atom, τ is the number of residues per turn, h is the handedness, and σ
+the straightness parameter. The latter equals 1 for all model structures, since none is curved.
+The straightness parameter for the extended conformation cannot be defined, since the model
+structure for the latter consists of only three residues (see Fig. 19). More explanations are
+given in the text.
+Motif ρ [nm] $\rho_{C\alpha}$ [nm] τ pitch h σ $\Delta_\Omega$
+α-helix (R) 0.171 0.227 3.62 0.556 + 1 0.582
+α-helix (L) 0.171 0.227 3.62 0.556 − 1 0.582
+3-10 helix 0.146 0.203 3.28 0.589 + 1 0.670
+π-helix 0.178 0.258 4.16 0.558 + 1 0.471
+β-strand 0.055 0.093 2.03 0.671 − 1 0.875
+extended 0.037 0.055 2.00 0.725 − 0.754
+80 efficient characterisation of protein secondary structure in terms of screw motions
+The parameters concerning the different secondary structure motifs shown in Table 13 may
+be compared to those published in the study of Barlow and Thornton [9]. Here one must pay
+attention to the fact that the helix radius depends on the reference point which is chosen to
+lie on the helix surface. In our case this is the carbon atom in the {O−C−N} peptide plane.
+If the carbon Cα-atom is chosen instead, we find the values given in the column with the
+header “$\rho_{C\alpha}$”.
+The parameters we find for the right-handed α-helix are very close to the ones given
+by Barlow and Thornton, who compare different standard definitions with average values
+computed from a set of 291 helices in “real” proteins. The parameters listed in the above
+reference are in the intervals 0.23 ≤ ρ ≤ 0.24, 3.54 ≤ τ ≤ 3.67, and 0.52 ≤ p ≤ 0.55,
+respectively, using our notation and units (ρ and p in nm). In case of the 3-10 helix the
+spread of the parameters given by Barlow and Thornton is 0.18 ≤ ρ ≤ 0.20, 3.0 ≤ τ ≤ 3.2,
+and 0.58 ≤ p ≤ 0.60. Parameters for π-helices are not listed. It should be noted that the
+orientational distance takes well distinguishable values for the different secondary structure
+motifs, but left and right-handed motifs cannot be distinguished by this parameter.
+5.3.3 Proteins in different fold classes
+In the following we will show the results of ScrewFit for proteins which fall into the four
+main fold classes according to the SCOP scheme [145]:
+1. Carbonmonoxy-myoglobin (PDB code 1A6G), which belongs to the “all alpha” class.
+2. Protease inhibitor ecotin (PDB code 1ECY), which belongs to the “all beta” class.
+3. Triose phosphate isomerase from chicken muscle (PDB code 1TIM), which belongs to
+the “alpha/beta” class. Proteins falling into this class consist mainly of parallel β-sheets,
+which are separated by α-helices.
+4. Hen egg white lysozyme (PDB code 193L), which falls into the “alpha + beta” class. Pro-
+teins of this type contain mainly anti-parallel β-sheets and separated regions containing
+α-helices.
+The latter application is postponed to the next section, where we consider structural changes
+of lysozyme under pressure. In this context the ScrewFit parameters will also be discussed in
+more detail. Here we give only an impression of the results, as compared to DSSP.
+Figs. 20 to 22 show the comparison for the first three proteins in the list given above. In each figure
+we give the local orientational distance, ∆Ω, the local helix radius, ρ, and the straightness
+5.3 applications 81
+Figure 20: ScrewFit description of the main chain of Carbonmonoxy-myoglobin (PDB code 1A6G, “all
+alpha” in the SCOP scheme). The vertical green stripes indicate α-helices found by the
+DSSP method and the horizontal lines indicate the reference values given in Table 13.
+Figure 21: ScrewFit description of the main chain of Protease inhibitor ecotin (PDB code 1ECY, “all
+beta” in the SCOP scheme). The vertical blue stripes indicate β-strands found by the DSSP
+method and the horizontal lines indicate the reference values given in Table 13.
+82 efficient characterisation of protein secondary structure in terms of screw motions
+Figure 22: ScrewFit description of the main chain of Triose phosphate isomerase (PDB code 1TIM,
+“alpha/beta” in the SCOP scheme). The vertical green and blue stripes indicate, respectively,
+α-helices and β-strands found by the DSSP method. The green and blue horizontal lines
+indicate the respective reference values from Table 13.
+parameter, σ. All calculations have been performed on the basis of the respective entries in
+the Brookhaven Protein Data Bank (PDB). The vertical stripes correspond to the secondary
+structure motifs found by the DSSP method by Kabsch and Sander, which is based on
+hydrogen bonding criteria and which is widely used for the determination of secondary
+structure elements in proteins [106]. The colouring scheme indicates α-helices in light green
+and β-strands in light blue.
+One recognises that the ScrewFit method often leaves some ambiguity concerning the
+boundaries of secondary structure elements. This is simply due to the fact that it is sensitive
+to deviations from ideal geometries. This effect is in particular visible in the behaviour of
+the straightness parameter. Similar observations have been made by comparing the method by
+Barlow and Thornton with DSSP [9].
+5.3.4 Lysozyme under hydrostatic pressure
+In the following we apply our method to visualise structural changes in lysozyme due to the
+application of an external pressure. For this purpose we consider protein structures which
+have been obtained from X-ray crystallography and from NMR measurements. The X-ray
+structures are taken from the entries 193L and 3LYM of the Brookhaven Protein Data Bank
+(PDB), which contain the atomic coordinates of hen egg-white lysozyme at pressures of,
+5.3 applications 83
+respectively, 1 bar and 1 kbar [202, 121]. The NMR structures are taken from PDB entries
+1GXV and 1GXX, corresponding to 1 bar and 2 kbars, respectively [159]. Fig. 23 shows
+the backbone of lysozyme at 1 bar (blue tube) obtained from the crystal structure together
+with the line joining the centres of screw motion mapping each peptide plane onto the
+consecutive one (red line). The centres of the screw motions have been constructed according
+to expression (5.22). Inspection by eye shows that the red line passes right through the
+geometrical centres of the helices.
+More details can be obtained from Figs. 24 and 25 which show the same parameters as
+in Figs. 20 to 22. In both cases the curves corresponding to the structures under pressure
+are given in red. The green and blue horizontal lines correspond again, respectively, to the
+reference values for an α-helix and a β-strand given in Table 13. Here the vertical stripes
+indicate the secondary structures according to the PDBsum data base. The latter uses the
+PROMOTIF program for secondary structure determination [89], which is itself based on the
+DSSP method. In addition to α-helices we indicate also 3-10 helices in dark green.
+For the crystal structure entries 193L and 3LYM the PDBsum database displays three long
+helices in the residue intervals {5− 14}, {25− 36}, and {89− 99}, and four short ones in the
+residue intervals {80− 84}, {104− 107}, {109− 114}, and {120− 123}. In addition three short
+β-strands of 2–3 residues are displayed in the regions {43 − 45}, {51 − 53}, and {58 − 59},
+respectively. We note here that only the long helices are described in the work by Barlow and
+Thornton [9]. Concerning the NMR structures, the PDBsum database lists again the three
+long helices ({5− 14}, {25− 36}, {89− 98}), but only two short ones ({80− 84}, {109− 114}). In
+contrast, the short β-strands are displayed at almost the same positions as for the crystal
+structures ({44− 46}, {50− 53}, {58− 59}). As for the crystal structures, the structural motifs
+are found for both pressures at identical positions.
+Looking first at Fig. 24 displaying the parameters corresponding to the crystal structures
+shows that the orientational distance is a good measure to localise rapidly secondary structure
+elements in the amino acid sequence of a protein. For the moment we discuss only the
+structure at ambient pressure. The analysis of the helix radius and the straightness gives
+more detailed information. The three long helices and also the three short β-strands are
+easily localised. We find that the first helix ({5− 14}) is straight only in the region {5− 11}.
+Towards the C-terminus the straightness drops considerably and the orientational distance
+rises. The helix radius stays approximately constant up to about residue number 15. We
+find that the second helix ({25− 36}) is deformed as well towards its C-terminus, but here
+the orientational distance stays more or less constant, whereas the helix radius and the
+84 efficient characterisation of protein secondary structure in terms of screw motions
+Figure 23: Minimal model for Lysozyme at normal pressure. The red line joins the centres of screw
+motions, X⊥, mapping each peptide plane onto the following one.
+straightness change considerably. We consider this helix to be straight in the range {25− 32}.
+Similar observations can be made for the third long helix, which we find to be straight in the
+range {89− 96}. We note here that Barlow and Thornton consider the first of the above helices
+as “irregular” and the others as “curved”, using, however, different criteria. Concerning the
+shorter helices, which are not considered helices by Barlow and Thornton, we confirm less
+well defined helices in the ranges {80− 84}, {104− 107}, {119− 123}, and {109− 114}. According
+to the orientational distance, the first three of them are 3-10 helices. As for the β-strands, our
+analysis would confirm the short one in the range {58− 59}, but yield longer strands in the
+regions {42− 46} and {50− 53}. It is worthwhile mentioning that the straightness parameter
+indicates hairpin turns between the β-strands, leading to antiparallel β-sheets.
+Applying ScrewFit to the NMR structure of lysozyme at ambient pressure yields the
+following results: the three long helices indicated by PDBsum are retrieved, and, using the
+orientational distance as criterion, we confirm less well defined helices in the ranges {80− 84}
+(3-10 helix) and {109− 114} (α-helix). According to our analysis the first β-strand is longer
+than the one displayed in the PDBsum database (approximately in {41− 45}).
+Let us now look at the changes in secondary structure of lysozyme due to the exertion
+of an external pressure. We start with the analysis of the crystallographic data by Kundrot
+and Richards [121]. The black line in Fig. 26 shows that the structural change obtained from
+the crystal structures is localised at residue no. 72. All parameters show a change in the
+5.3 applications 85
+Figure 24: ScrewFit description of Lysozyme for crystallographic structures at pressures of 1 bar (black
+line) and 1 kbar (red line) (PDB entries 193L and 3LYM) [202, 121]. According to the SCOP
+scheme lysozyme falls into the “alpha+beta” class. The horizontal lines show the reference
+values given in Table 13 and the vertical stripes indicate here the secondary structures
+according to the PDBsum database. More explanations are given in the text.
+Figure 25: The same as Fig. 24, but for NMR structures at 1 bar (black line) and 2 kbar (red line) [159].
+86 efficient characterisation of protein secondary structure in terms of screw motions
+same place. Fig. 27 shows the change of straightness of the crystal structure of lysozyme in a
+tube representation, using a colouring scheme where red corresponds to a negative change,
+green to no change, and blue to a positive change. In their study Kundrot and Richards
+perform a difference distance matrix analysis of the structural changes and report that the
+least changes are seen in helix 2 ({25− 36}) and in the loop and β-sheet region {42− 60},
+whereas a stronger structural change is seen in region {61− 87}, which appears to expand.
+We note here that Kundrot and Richards call this region “loop region”, not counting the short
+3-10 helix {80− 84}. This observation is coherent with ours, which shows in particular a strong
+rise of the local helix radius at residue 72, corresponding to a swelling of the corresponding
+loop region.
+Figure 26: Differences for the parameters shown in Figs. 24 and 25 (X-ray crystallography = black line,
+NMR = magenta line).
+The corresponding analysis for the NMR structures is less clear (see Fig. 25, magenta
+lines). Here the orientational distance and the helix radius do not exhibit significant changes,
+whereas the straightness shows a strong decrease at residue no. 60, which is located at the
+very beginning of the long loop in residue range {60 − 80}. Refaee et al. report the most
+extensive deformations in the loop and what they call “β-sheet domain” ({40− 88}), which is
+certainly in agreement with a very localised change in secondary structure at residue no. 60.
+We do, however, not see considerable changes in the hairpin turns {47− 49} and {54− 57} seen
+by Refaee et al.. Fig. 28 shows the change in straightness for the NMR structure of lysozyme
+in a tube plot in which the same colouring scheme is used as in Fig. 27.
+5.4 conclusion 87
+Figure 27: Change in straightness between the crystallographic structure of lysozyme at 1 kbar and
+1 bar. The colouring scheme is chosen such that blue, green, red correspond to, respectively
++2 (maximum positive change), 0, and -2 (maximum negative change).
+Figure 28: Change in straightness between the NMR structure of lysozyme at 2 kbar and 1 bar. The
+colouring scheme is the same as in Fig. 27.
+5.4 conclusion
+We have presented a simple method – ScrewFit – for the characterisation of protein secondary
+structure which uses quaternion-based superposition fits of consecutive peptide planes in
+88 efficient characterisation of protein secondary structure in terms of screw motions
+the backbone. The combined use of the quaternion fit method and Chasles’ theorem allows
+to express protein secondary structure in terms of local helix parameters. The superposition
+method yields also an orientational distance measure for consecutive peptide planes. The
+latter is obtained from the “worst” possible quaternion fit and yields a simple measure for the
+rapid localisation of secondary structure elements along the protein backbone. The analysis
+of standard motifs of protein secondary structure and of proteins belonging to different fold
+classes showed that all common motifs are well discriminated by the orientational distance
+measure, and that the straightness parameter and the helix diameter are useful to characterise
+non-ideal secondary structure elements, keeping a minimal set of parameters.
+Using ScrewFit to study conformational changes in Lysozyme due to application of an
+external pressure revealed different localised changes in the loop regions. The structural
+changes extracted by difference distance matrix analysis from the crystallographic data could
+be confirmed, giving, however, a more precise description of these changes. Concerning the
+NMR structures, we find the essential conformational changes in a different position than the
+authors of the reference article, although both results agree in so far, as the changes are found
+in the same region. Prior to these analyses we tested that the localisation of the essential
+secondary structural elements found by crystallography and NMR is confirmed.
+ScrewFit allows to pinpoint secondary structure changes precisely, which is more difficult
+to achieve by the standard analysis of positional differences. The reason is that the latter
+might indicate important structural differences in a large region, although the corresponding
+position differences are induced by one single localised change in the winding of the protein
+backbone.
+A point which should also be mentioned is the numerical efficiency of the quaternion-
+based superposition algorithm we use as a basis of our method. The superposition of two
+molecular structures can be performed in a few milliseconds [115], and this fact has been
+exploited in many studies of rigid body motions in molecular systems, using the molecular
+dynamics analysis package nMoldyn [120, 166]. Using the method presented in this article,
+the characterisation of the secondary structure of a protein can be done in about a second on
+a normal PC, and this efficiency could for example be used in database-oriented applications
+and for analyses of molecular dynamics trajectories of proteins. In this context it is important
+to note that the protein backbone can be completely reconstructed from the helix parameters
+defined in this article. This is an interesting aspect for homology modelling. Another useful
+application could be the characterisation of structural variability in different structural models
+which are used to construct protein 3D structures from NMR distance data.
+5.5 mathematical background 89
+5.5 mathematical background
+5.5.1 Quaternions
+Quaternions are hypercomplex numbers which are composed by linear superposition of one
+real unit element 1 and three imaginary unit elements I, J, K. The latter satisfy
+the non-commutative algebra $I^2 = J^2 = K^2 = -1$ and $IJ = -JI = K$ (cycl.). An arbitrary
+quaternion Q is written as $Q = q_0 1 + q_1 I + q_2 J + q_3 K$, where $q_j \in \mathbb{R}$ (j = 0, . . . , 3). The
+component $q_0$ is called the scalar component, and $\{q_1, q_2, q_3\}$ are the vectorial components.
+It is useful to introduce the column vector $q_v = (q_1, q_2, q_3)^T$ comprising the three vectorial
+components of a quaternion. Analogously to complex numbers, the length of a quaternion is
+defined as $\|Q\| = \sqrt{q_0^2 + q_1^2 + q_2^2 + q_3^2}$ and its conjugate is given by $Q^* = q_0 1 - q_1 I - q_2 J - q_3 K$.
+Let A and B be quaternions with components {a0,a1,a2,a3} and {b0,b1,b2,b3}, respec-
+tively. The components of C = A±B are obtained by cj = aj ± bj (j = 0, . . . , 3) and from the
+algebra of the imaginary elements one finds that the components of the product C = AB are
+givenby   
+c   a b − aT0 0 0 v · bv = ,
+cv a0bv + b0av + av ∧ bv
+where “∧” denotes a vector product. In general AB 6= BA. The inverse of a quaternion A is
+defined as
+$A^{-1} = \frac{A^*}{\|A\|^2}$.
+Due to the non-commutative algebra of quaternions one has in general $A^{-1}B \neq BA^{-1}$.
+Similarly to complex numbers of unit length, which represent rotations in the plane,
+normalised quaternions represent rotations in space. Let $r = (x, y, z)^T$ be a column vector
+comprising the components of a radius vector $\vec{r}$, let $R = xI + yJ + zK$ be the corresponding
+spatial quaternion and let Q be a normalised quaternion with ‖Q‖ = 1. One finds that the
+scalar component of R ′ = QRQ∗ vanishes too, and that the vectorial components of R ′ are
+given by
+r ′ = D · r,
+where D represents the rotation matrix (6.2). The bilinear transformation R ′ = QRQ∗ repre-
+sents thus a rotation in space.
+90 efficient characterisation of protein secondary structure in terms of screw motions
+5.5.2 Helix parameters in Chasles’ theorem
+Chasles’ theorem can be easily proven using quaternion algebra. For this purpose we start
+from Eq. (5.18) and introduce the spatial quaternions U and T⊥, representing, respectively,
+the column vectors u and t⊥. Expressed in quaternions, Eq. (5.18) becomes
+U−QUQ∗ = T⊥.
+Multiplication with Q from the right and using that Q∗Q = 1 yields
+UQ−QU = T⊥Q.
+Using the multiplication rule for quaternions, the above equation can be expressed in the
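+form
+$\begin{pmatrix} -u^T \cdot q_v \\ q_0 u + u \wedge q_v \end{pmatrix} - \begin{pmatrix} -q_v^T \cdot u \\ q_0 u + q_v \wedge u \end{pmatrix} = \begin{pmatrix} -t_\perp^T \cdot q_v \\ q_0 t_\perp + t_\perp \wedge q_v \end{pmatrix}$.
+Here we can make use of relation (6.4)
+$\begin{pmatrix} q_0 \\ q_v \end{pmatrix} = \begin{pmatrix} \cos(\phi/2) \\ \sin(\phi/2)\, n \end{pmatrix}$,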
+from which we conclude that t⊥ · qv = 0, since t⊥ ⊥ n. We are thus left with the vector
+equation   
+ 0   0 =  ,
+2u∧ qv q0t⊥ + t⊥ ∧ qv
+which can be reduced to
+1( )
+n∧ u = − cot(φ/2)t⊥ + n∧ t⊥ (5.29)
+2
+if φ 6= 2kπ (k ∈ Z). Now one can apply on both sides a vectorial multiplication with n, using
+that $n \wedge (n \wedge a) = -a_\perp$ for an arbitrary column vector a, where $a_\perp = P_\perp \cdot a$. This yields
+$u_\perp = \frac{1}{2}\left( t_\perp + \cot(\phi/2)\, n \wedge t \right)$,
+if one uses that n∧ (n∧ t⊥) = −t⊥ and that n∧ t⊥ = n∧ t. Relation (5.20) is thus proven.
+The general solution of Eq. (5.29) has obviously the form
+u(λ) = u⊥ + λn, λ ∈ R,
+5.5 mathematical background 91
+which shows that u⊥(λ) is the solution of minimum length.
+Acknowledgements: All figures containing molecular graphics have been generated using
+the VMD code for molecular dynamics simulation and visualisation of biomolecules [88]. The
+screw motion calculations have been performed with modules from the MMTK package [79].
+92 efficient characterisation of protein secondary structure in terms of screw motions
+5.6 notes
+[i] It is worth noting here that, in the context of the ScrewFit algorithm, all motifs are
+considered as helices, a β-strand being simply a thin left-handed helix with 2 amino acids
+per turn. This fact can be easily seen in Fig. 29 where the blue cylinder represents the extent of
+the helix obtained according to the definition of the C-atom of the peptide plane lying on the
+helix surface, for the right-handed α-helix and the β-strand.
+Figure 29: Visualisation of a straight right-handed α-helix (left-side) and a straight β-strand (right-side)
+in terms of the local helix parameters given in Table 1. The arrow indicates the direction of
+the helix axis. Here the hydrogen atoms.
+6
+SCREWFIT: A NOVEL APPROACH FOR CONTINUUM PROTEIN
+SECONDARY STRUCTURE ASSESSMENTS
+We present a novel approach for the detection of protein secondary structure elements,
+which combines a description of the protein backbone in terms of screw motions (Acta
+Cryst. 62, p. 302-11 (2006)) with a statistical approach, yielding confidence ranges for the
+corresponding helix parameters on the basis of natural variations. To establish these ranges
+for each type of secondary structure element, we analyzed several databases of protein
+structures, exhibiting each well defined structural profiles. The method allows for a continuous
+assessment of protein secondary structure elements and is proved to be stable with respect to
+both structural variations found in NMR data and resolution problems in crystallographic
+data. The comparison with other methods supports its reliability and accuracy. A structural
+analysis of bovine pancreatic trypsin inhibitor in three different crystal forms illustrates the
+capability of the method to detect secondary structure elements in noisy data and to describe
+at the same time small but systematic structural variations in the latter.
+93
+94 screwfit : a novel approach for continuum protein secondary structure assessments
+6.1 introduction
+In the last decades, a variety of new methods has been developed for the analysis of experimen-
+tal and simulation data in structural biology. One of the standard tasks is the determination
+of secondary structure elements in proteins, in particular for the characterization of changes
+in protein structure. Such conformational changes may be induced by binding of ligands or
+by external stress, such as temperature, hydrostatic pressure, or chemical agents.
+Traditionally secondary structure elements are described in terms of two torsional angles
+per residue, φ and ψ, which define for each Cα-atom in the protein backbone the rotation of
+the left and right peptide plane about the N−Cα and Cα −C bond, respectively [187]. This
+approach is, however, not well suited to describe non-ideal secondary structure elements,
+such as kinked or curved helices, which occur in any protein fold, nor does it easily allow to
+detect and to describe structural changes in protein structure. In the past, different methods
+have been developed to determine secondary structure elements in polypeptide chains
+[106, 163, 57, 190] and to describe their geometry in more detail [9, 181, 194]. One of the
+most frequently used methods is the dictionary of protein secondary structure (DSSP) which
+detects secondary structure elements through typical hydrogen bond patterns [106, 89]. The
+method allows in principle to distinguish eight of the most common motifs, both in secondary
+and supersecondary structures, but the results are often biased by the fact that DSSP makes
+assessments on protein structure using average hydrogen-bond distances as references which
+implicitly include the effects of static and dynamical disorder in crystallographic data. Like
+other, so-called “discrete methods”, DSSP assesses secondary structure elements on the basis
+of a “true-false” decision, which follows geometrical criteria. All patterns which meet these
+criteria within certain thresholds are safely detected by all discrete methods [40], but they
+run into difficulties if the natural variability in the secondary structure of a given protein
+is too important. Methods like DSSP are, for example, not able to reproduce the variations
+between different NMR models which correlate with thermal disorder and local mobility of
+structure motifs. This fact has already been observed by Andersen and coworkers [5] [25]
+who presented a new method, derived from DSSP, which is called DSSPcont. The suffix
+“cont” indicates that the method uses a description of protein secondary structure in terms of
+a set of parameters which vary continuously in a predefined range of values. It has been
+pointed out in the literature that this continuous approach can more easily distinguish between
+natural conformational variations and effective changes in secondary structure profiles [5].
+Indeed, Andersen and coworkers proved that a major improvement of the DSSP method
+6.1 introduction 95
+could be obtained simply substituting the single threshold-based definition per secondary
+structure element by a quasi-continuum spectrum of assessments obtained by running the
+discrete DSSP method with different hydrogen bond distance thresholds. The resulting series
+of assessments leads to the final assignment probability of each residue to belong to one of
+the eight DSSP classes: the three helix types (α, 310 and π); β strands; helix-turns; β bridges;
+bends and not-structured loops.
+With these assumptions, DSSPcont was refined in order to maintain a high consistency with
+respect to the influences of small structural variations caused by the experimental setups or
+by the natural thermal fluctuation of structures.
+Motivated by the task to pinpoint changes in the secondary structure of proteins, we have
+recently developed the ScrewFit-algorithm [114]. The algorithm uses the Cartesian atomic
+coordinates of a protein as input and expresses its secondary structure in terms of screw
+motions relating consecutive peptide planes in the protein backbone. In this work we present
+further developments of this method which demonstrate that ScrewFit does not only allow
+to quantify changes in protein configurations but can also be used to detect all common
+secondary structure elements.
+By construction, ScrewFit belongs to the so-called continuous methods for secondary
+structure assignment, since the local helix parameters quantifying the screw motions are
+continuous functions of the residue number.
+Nevertheless, the ScrewFit method proposes a new approach to the continuous assignments as
+it does not relate to any threshold-based definition but only to simple geometrical criteria that
+define the set of parameters. The latter run over continuous ranges of values whose interpre-
+tation is not biased by an a priori division into classes and which are simply obtained from an
+empirical observation of the natural variations of the parameters in some appropriate protein
+structure databases. Moreover, this approach does not limit the values of the parameters which
+can vary beyond the ranges found for the most common secondary structure elements and
+still be useful to finely characterize the secondary level of uncommon structural configuration.
+In the following sections we will first present the ScrewFit-algorithm and then we will
+show that structure definitions obtained by this algorithm are as precise as those obtained by
+the DSSP discrete method and are less biased by finite resolution of crystallographic data.
+96 screwfit : a novel approach for continuum protein secondary structure assessments
+In a second application we will compare ScrewFit with the DSSPcont method mentioned
+above in order to verify the stability of our set of parameters with respect to the variations
+observed in NMR models due to experimental technique and thermal fluctuations.
+Finally, as an example of a typical application, we will show the secondary structure profile
+of bovine pancreatic trypsin inhibitor (BPTI) in its three different crystal forms and we will
+compare the results with those detected with DSSPcont. This example will be useful to
+illustrate the advantages of this novel approach which allows to make assessments on protein
+secondary structure and also quantitatively characterize all changes it can undergo as an
+effect of different external conditions.
+6.2 methods
+6.2.1 The ScrewFit algorithms
+To synthetically describe protein secondary structure, we use the algorithm ScrewFit, which is
+based on quaternion superposition fits for molecular structures [50, 115, 116] and Chasles’
+theorem on rigid-body displacements [33, 32]. In this section we sketch the main features of
+the method and refer to [114] for more details.
+In the following two consecutive peptide planes A and B, containing the atoms {O,C,N},
+are considered as rigid bodies. The latter are superimposed by minimizing the target function
+$$ m(q) = \sum_{\alpha=1}^{3} \left( D \cdot x_\alpha - x'_\alpha \right)^2 , \tag{6.1} $$
+where $\{x_\alpha\}$ and $\{x'_\alpha\}$ are the atomic positions of the reference (the atoms {O,C,N} in plane A)
+and the target structure (plane B), respectively.
+The symbol D denotes an orthogonal matrix describing a proper rotation. Both coordinate
+sets are defined with respect to a reference point, which is chosen to be the position of
+atom C in the respective peptide plane {O,C,N}. Using the fact that a rotation matrix can
+6.2 methods 97
+be expressed in the components of a normalized quaternion $q \equiv \{q_0, q_1, q_2, q_3\}$, where
+$q_0^2 + q_1^2 + q_2^2 + q_3^2 = 1$ [4],
+$$ D(q) = \begin{pmatrix}
+q_0^2 + q_1^2 - q_2^2 - q_3^2 & 2(-q_0 q_3 + q_1 q_2) & 2(q_0 q_2 + q_1 q_3) \\
+2(q_0 q_3 + q_1 q_2) & q_0^2 + q_2^2 - q_1^2 - q_3^2 & 2(-q_0 q_1 + q_2 q_3) \\
+2(-q_0 q_2 + q_1 q_3) & 2(q_0 q_1 + q_2 q_3) & q_0^2 + q_3^2 - q_1^2 - q_2^2
+\end{pmatrix} , \tag{6.2} $$
+the function (6.1) is to be minimized with respect to these four parameters. As demonstrated
+in previous work [50, 115, 116], the constrained minimization problem can be mapped onto
+an eigenvector problem for a positive semi-definite matrix $M \equiv M(\{x_\alpha, x'_\alpha\})$,
+M · q = λq, (6.3)
+whose eigenvalues λj = m(qj) are four possible errors of the superposition fit between the
+two peptide planes, defined by (6.1). The smallest eigenvalue is the solution for the optimal fit,
+and the components of the corresponding eigen-quaternion describe the relative orientation
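+of $\{x'_\alpha\}$ with respect to $\{x_\alpha\}$. Writing
+$$ q \equiv \begin{pmatrix} q_0 \\ \mathbf{q}_v \end{pmatrix} = \begin{pmatrix} \cos(\phi/2) \\ \sin(\phi/2)\,\mathbf{n} \end{pmatrix} , \tag{6.4} $$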
+one sees that the resulting quaternion defines the rotation angle φ and the corresponding
+rotation axis n, which is at the same time the direction of the screw motion, according to the
+theorem of Chasles. The proof of the latter can be elegantly given by using the quaternion
+calculus [114]. The largest eigenvalue λmax describes the “worst” superposition and gives
+the maximal Euclidean distance between the two peptide planes. We use the latter to define a
+unique orientational distance via
+$$ \Delta = \sqrt{ \frac{ \sum_{\alpha=1}^{3} \left( x_\alpha - x'_\alpha \right)^2 }{ \lambda_{\max} } } . \tag{6.5} $$
+By definition $0 \le \Delta \le 1$.
+To characterize protein secondary structure we use the following parameters:
+1. The orientational distance of consecutive peptide planes, which is defined in Eq. (6.5).
+2. The radius of the cylindrical surface on which the reference atom (atom C) moves
+performing the screw motion between two consecutive peptide planes,
+$$ \rho = \frac{|t_\perp|}{2} \sqrt{1 + \cot^2(\phi/2)} . \tag{6.6} $$
+Here t⊥ is the component of the vector t relating the C-atoms, which is perpendicular
+to the rotation axis defined by n.
+98 screwfit : a novel approach for continuum protein secondary structure assessments
+3. The straightness parameter σ. For residue i the latter is defined as
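+$$ \sigma_i = \mu_i^{T} \cdot \mu_{i+1} , \tag{6.7} $$
+where
+$$ \mu_i = \frac{ R^{\perp}_{i+1} - R^{\perp}_{i} }{ \left| R^{\perp}_{i+1} - R^{\perp}_{i} \right| } \tag{6.8} $$
+and $R^{\perp}_{i}$ is the point on the helix axis, which is closest to the C-atom of peptide plane i.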
+The straightness gives information about the curvature of a secondary structure element.
+Figure 30(Panel A) gives an illustration of the helix (screw motion) parameters defined above.
+By definition the C-atoms of the peptide planes are on the surface of the cylinder defining
+the envelope of the screw motion. Figure 30 (Panel B) gives a sketch of a typical ScrewFit
+profile of a protein (in this figure, bovine pancreatic trypsin inhibitor).
+Figure 30: Panel A)A tri-peptide with two peptide bonds in the extended conformation. The yellow
+triangles formed by the atoms {O,C,N} of the peptide planes define the local helix structure
+of the polypeptide. The green spheres, labeled with “R”, indicate dummy atoms replacing
+the side-chains. The radius of the cylinder shown in figure defines the radius ρ of the screw
+motion relating the two consecutive peptide planes. Panel B) A typical ScrewFit profile for
+a protein structure. In this figure the three parameters refer to the BPTI (PDB code: 4PTI).
+The colored stripes on the bottom of the figure indicate the secondary structure motifs
+determined by DSSP method (β-strands: blue; α-helices: red; 3− 10-helices: green). Vertical
+stripes superimposed on ScrewFit plots represent motifs detected by the latter method
+(same coloring scheme as for the DSSP).
+6.2 methods 99
+6.2.2 Availability
+ScrewFit is implemented in a Python open-source code which uses several modules from the
+Molecular Modelling Toolkit library [81]1. A Web-based implementation is under construction.
+6.2.3 Databases
+We created two subsets of the SCOP structural classification with “all-α” and “all-β” pro-
+teins [145], which contain protein domains whose sequences have less than 40% identity
+and whose structure elements are essentially α-helices and β-strands, respectively. For this
+purpose we used a subset of the ASTRAL [31] database which contains PDB-style files for
+each SCOP classified domain. From the original database, all structures with non-canonical
+atom notations were corrected or erased.
+After these reductions we obtained two databases:
+- A, containing 1027 all-α domains
+- B, containing 1336 all-β domains
+Every item in these databases consists only of the structurally significant domains and
+not of the whole protein structure. The distributions for the ∆ and ρ parameters obtained
+with these databases are represented in Figure 31.
+To validate the variation of the ScrewFit parameters and their accuracy obtained by the
+approach described in the next section we will use three other sets of proteins with a limited
+overlap with our original databases and with a greater structural heterogeneity. For this
+purpose we chose:
+- C, a subset from the database PDBSelect25[84], containing 2144 chains with sequence
+homology lower than 25% and non-redundant folds
+- D, a subset obtained directly from the PDB by the culling server PISCES [203][204],
+containing 2477 chains with sequence homology lower than 25% and experimental
+resolution in the range 0.5–2.0 Å
+- E, a subset also obtained via PISCES, containing 1829 chains with sequence homology
+lower than 25% and experimental resolution in the range 2.1–3.5 Å
+1 Both codes are freely available at http://dirac.cnrs-orleans.fr/software.html
+100 screwfit: a novel approach for continuum protein secondary structure assessments
+Each entry in these databases C,D,E is chosen according to the same rules which were applied
+to constitute databases A and B. The database C is intended for reproduction of most of the
+structural heterogeneity present in the whole PDB database.
+Finally, a finer comparison between ScrewFit and DSSPcont will be performed to verify
+the consistency of assessments made by ScrewFit. For this purpose, we will refer to the same
+database of NMR entries used in the original work by Andersen et al. [5]. We will call it :
+- F, containing 211 chains from NMR structures each containing at least ten models.
+6.3 results and discussion
+6.3.1 Evaluation of natural parameters
+The algorithm described above has already been tested in [114] for model structures of
+polypeptides taken from the Jena Library of Biological Macromolecules (available at 2) and
+the resulting parameters will be considered as ideal values in the following. Comparison with
+values obtained from real protein structures shows that the parameters fluctuate substantially
+around the ideal values, even in well defined structural motifs [114]. Secondary structure
+should, therefore, be associated with a range of possible values of the three parameters. In
+order to find these ranges we have applied ScrewFit to the large number of protein domains
+of known and well classified structures, which belong to databases A and B (see Figure 31 ).
+Each peak of the distributions corresponds to the dominant structural pattern in the respec-
+tive database and its width gives an estimation of the natural variation of the geometrical
+parameter which is considered. To quantify the latter we fitted the dominant peaks in each
+distribution by a Gaussian function,
+$$ y = a \cdot \exp\left[ -\frac{(x - m)^2}{s^2} \right] . \tag{6.9} $$
+Here m is the position of the peak and s its width, which is to be compared with the
+parameters for model structures listed in Table 13.
+The reader should be aware that 310 and π helices are sometimes present in all-α domains,
+but they are clearly under-represented in our database A. As shown in [114], these secondary
+structure elements can however be unambiguously distinguished by ScrewFit applied on
+their ideal structures. The same is true for the extended conformation with respect to the
+2 Available at http://www.imb-jena.de/IMAGE.html
+6.3 results and discussion 101
+Figure 31: Panel A) : Normalized distributions for Orientational Distance ∆ in A (in black) and in B (in
+red). Fitted Gaussian functions are shown in dashed lines. Correlation coefficients between
+distributions and fitted curves are between 0.90 and 0.96. Panel B) : Normalized distribution
+for the helix radii ρ in A (in black) and in B (in red). Fitted Gaussian functions are shown
+in dashed lines. Correlation coefficients are between 0.94 and 0.96.
+β-strand. From Figure 31 (Panel b), it is also evident that ρ parameter distribution for each
+database presents an additional peak at values far from the dominant one. This fact is due to
+the presence of some residues in the extended conformation and reverse turns (α, β and γ
+type) in both databases.
+Table 13: ScrewFit parameters for different structure motifs from model polypeptide and from database
+evaluation. Values for 310 and π are only derived from the model polypeptide as given in [114].
+More details in the text.
+Motive ρideal ρ ∆ideal ∆
+α-helix 0.171 0.168 ± 0.020 0.582 0.537 ± 0.041
+3-10 helix 0.146 0.146 0.670 0.670
+π-helix 0.178 0.178 0.471 0.471
+β-strand 0.055 0.041 ± 0.018 0.875 0.850 ± 0.062
+extended 0.037 (0.041 ± 0.018) 0.754 0.800 ± 0.057
+102 screwfit: a novel approach for continuum protein secondary structure assessments
+Figure 32: Normalized distributions of ∆ (panel A) and ρ (panel B) parameters calculated on a
+heterogeneous selection of protein structures obtained from the PDBselect25 database (C).
+The full-colored bins represent the natural values obtained from calculation on A and B.
+The hollow bins represent the ideal values reprinted from Table 13. The color-scheme used is: red
+for α-helices, blue for β-strands, violet for extended conformations, green for 310-helices
+and brown for π-helices.
+Figure 32 shows the normalized distributions of the parameters ∆ and ρ obtained from the
+application of ScrewFit to the database C introduced in the previous section. Despite their
+origin from a wider spectrum of structural domains, these distributions are very similar to a
+superposition of those obtained from A and B. Interestingly, the peaks from C are also very
+close to those from A and B which are reported in Figure 32 as full-colored bins.
+The ideal values reported in Table 13 and obtained from previous works [114] are also reported
+in Figure 32 as hollow bins. Here it is worth noting that 310 and π helices, which were
+under-represented in our original databases A and B, have ideal values slightly different from
+the natural value obtained for the α-helices6.5. This observation supports the assumption that
+even using these ideal values one can easily characterize a helicoidal pattern and distinguish
+if it belongs to one of the three most frequent classes.
+As a whole, these facts confirm that the empirical definitions made for structural elements
+and summarized in Table 13 allow one to distinguish the structural elements in several types of
+protein folds.
+6.3 results and discussion 103
+6.3.2 Reliability and consistency of ScrewFit assignments
+In the following we want to confirm the reliability of the natural parameters in Table 13,
+comparing ScrewFit to other methods and with respect to the refinement of experimental
+resolution.
+It is worth noting here that a wide variety of methods have been used in the past to make
+discrete secondary structure assessments based on different approaches: intra-backbone hy-
+drogen bonds (DSSP), expert assignments and backbone dihedral angles (STRIDE[57]),
+Cα coordinates (P-SEA[123] and DEFINE[163]) and protein curvature (P-curve [181]). Ob-
+servations made by Colloc’h et al. [40] showed that DSSP, DEFINE and P-curve share the
+same assessment in 63% of cases whereas DSSP and STRIDE agree for 96%. As for several
+reasons, DSSP is commonly considered the standard reference in the field, we will limit our
+comparison to it, in its discrete (simply DSSP in the following) and continuous (DSSPcont, in
+the following) forms, and two other methods with different approaches and assume that all
+other comparisons can be inferred using the results shown in [40].
+In their original work, Kabsch and Sander [106] applied DSSP on three different crystallo-
+graphic structures of decreasing resolution from 1.5 Å to 3.0 Å in order to study its accuracy
+against experimental resolutions. In this work we use the same three structures to compare
+our method with DSSP and with the method by Levitt and Greer (LG) [128] also referred in
+[106]. The latter is another method based on distance dependent definitions of the secondary
+structure motifs and all results obtained from its application are simply reprinted from
+reference [106] . The reader should be aware that two of these structures have now been
+superseded by new and more accurate ones. Here we use the older structures to refer
+directly to the original work by Kabsch and Sander as this will not affect our conclusions.
+Nevertheless we also compare the ScrewFit analysis on one of these structures ( PDB code:
+2ADK ) with its homologue obtained by the more refined structure ( PDB code: 3ADK) to
+make further assessments of the effects of the experimental resolution on our method.
+Table 14 shows the results of ScrewFit on pancreatic trypsin inhibitor at 1.5 Å resolution (PDB
+code: 3PTI) and cytochrome c550 at 2.5 Å resolution (PDB code: 155C).
+The comparison of ScrewFit assignments with those taken from [106] for DSSP and LG,
+shows that the three methods are globally equivalent in detecting secondary structure motifs
+on the structure at higher resolution but some relevant discrepancies among them begin to
+appear at the 2.5 Å resolution structure. In particular, this fact is evident in the region 26-31
+of cytochrome c550, where LG and DSSP do not find the same β-strand and ScrewFit detects
+104 screwfit: a novel approach for continuum protein secondary structure assessments
+Table 14: Comparison of ScrewFit assignments with two other methods (Levitt&Greer and
+DSSP/DSSPcont) for two structures of decreasing resolution. Assessments for both DSSP
+and DSSPcont are shown only when they differ. Comments column refers to additional
+information obtained by ScrewFit analysis. LG stands for Levitt and Greer method.
+Structure LG DSSP/DSSPcont ScrewFit comments
+3PTI Res. 1.5 Å
+310-helix 2-7 3-6 2-5
+β-strand 14-25 18-24 16-23
+β-strand 28-37 29-35 29-34
+β-strand 43-46 45 45 β-turn
+α-helix 47-55 48-55 48-57
+155C Res. 2.5 Å
+α-helix 4-16 6-12 6-10
+310-helix - 11-13/ - 11-13
+β-strand 17-23 19-20 19-20
+β-strand 26-31 - 26-30 extended conf.
+β-strand 33-39 35-37 -
+α-helix 40-44 - -
+α-helix 55-65 56-64 57-63 curved C-term.
+α-helix 71-80 73-80 72-82 310-like C-term
+α-helix 81-90 - -
+α-helix 106-118 107-117 106-116 curved C-term.
+a region of some β-strand conformations alternated with some extended ones. Equivalent
+results are obtained also for α-helices in regions 57-63, 72-82 and 106-116 where ScrewFit
+can give quantitative assessments on the curvature and other terminal deformations of each
+motif.
+6.3 results and discussion 105
+Table 15: ScrewFit assignments for the same protein structure with two different experimental
+resolutions. Assessments for both DSSP and DSSPcont are shown only when they differ and
+assessments by DSSP are printed in italics.
+2ADK Res. 3.0 Å 3ADK Res. 2.1 Å
+Struct. DSSPcont STRIDE P-SEA ScrewFit DSSPcont STRIDE P-SEA ScrewFit
+α-helix 2-7 2-7 2-6 2-6 2-6 1-7 2-7 2-6
+β-strand 10-14 10-14 9-13 10-14 10-15 10-15 9-16 7-16
+α-helix 23-30/23-31 21-31 23-31 23-29 21-31 21-32 21-31 17-30
+β-strand 35-38 35-38 34-38 35-381 35-38 35-38 34-38 33-38
+α-helix 39-48 39-49 41-49 39-47 39-49 39-49 39-49 38-49
+α-helix 52-62 52-62 52-62 52-61 52-61 52-63 52-63 52-61
+β-strand - - - - - - 65-68 65-68
+α-helix 69-83 69-84 69-83 70-83 69-81 69-82 69-83 72-81
+β-strand 90-93 90-93 89-92 86-93 90-93 90-93 89-93 88-93
+α-helix 101-108 101-107 101-108 101-108 99-108 99-108 99-108 99-108
+β-strand - - - - - - 109-112 109-112
+β-strand 114-118 114-118 114-121 113-118 114-119 114-119 114-117 113-120
+α-helix 122-132 122-133 122-133 122-130 122-136 122-136 122-136 122-136
+α-helix 143-157 143-166 144-155 143-155 146-156 145-157 144-155 145-155
+α-helix 160-167 - - 156-165 158-164 159-165 158-167 159-164
+β-strand 170-173 170-173 168-175 170-173 170-174 170-174 170-173 170-174
+α-helix 179-193 179-193 182-193 179-193 179-191 179-192 179-192 178-191
+106 screwfit: a novel approach for continuum protein secondary structure assessments
+In both cases assignments made by DSSP and DSSPcont did not show any significant
+differences. A more detailed comparison with respect to experimental resolution is made in
+Table 15. The accuracy of ScrewFit assignments on adenylate kinase structure at different
+resolution ( PDB codes: 2ADK and 3ADK) was compared with those made by the means of
+three other methods: DSSP, STRIDE and P-SEA.
+Globally the effects of resolution on these methods are the same and only some discrepancies
+in N- and C- edges were encountered. This fact is already well known in literature as an
+artifact due to the different definitions [40].
+Nevertheless, a more accurate analysis of this comparison shows different response of each
+method to the improved resolution. Firstly, at low resolution the assignments made by
+ScrewFit overlap very well with those made by DSSP except for a slightly deformed β-strand
+in 35-38 which makes ScrewFit assessment quite uncertain. Secondly, DSSP and ScrewFit
+detect also two α-helices instead of one unique helix in the region 143-167. This outcome is
+confirmed for the four methods at higher resolution.
+Additionally, from Table 15 it is also evident that P-SEA and ScrewFit improve their accuracy
+with resolution detecting two new β-strands in 65-68 and 109-112.
+These results confirm those previously shown in reference [114] and suggest that ScrewFit
+performance is equivalent to those obtained by the more refined distance-dependent methods
+if it is applied on a structure at low resolution. If the resolution is improved on the same
+structure, ScrewFit shows instead a significant conservative refinement with respect to the
+lower resolution structure and it also adds some new motifs with partial convergence with
+the common distance-dependent methods.
+To confirm the consistency of ScrewFit assignments with respect to the experimental
+resolution, we plotted the normalized distribution of values obtained for the parameters
+∆ and ρ calculated over all structures in databases D (resolution less than 2.0 Å) and E
+(resolution between 2.1 Å and 3.5 Å). As shown in Figure 33 the effect of a better resolution is
+the slight narrowing of some peaks in the distributions, in particular for those corresponding
+to the α-helices values. Interestingly, assignments on β strands seem to be not affected by
+the experimental resolution. It is worth noting instead that although the shape of the peak
+distributions slightly changed, the position of their maxima stands unchanged. As a whole,
+the outcome of the comparison shown in Table 15 and the calculation over the databases D
+and E proved that the efficiency of ScrewFit assessments is globally quite insensitive to the
+experimental resolution with which the structural data were obtained.
+6.3 results and discussion 107
+Figure 33: Normalized distributions of ∆ (panel A) and ρ (panel B) parameters calculated over
+databases D (experimental resolution lower than 2.0 Å; black lines) and E (experimental
+resolution greater than 2.1 Å; red lines).
+6.3.3 Comparison with DSSPcont
+As we mentioned in the Introduction, the main problem with the most common methods for
+the secondary structure assignments is the use of threshold-based definitions which recast
+the structural conformation heterogeneity of protein backbones into eight or less classes
+without accounting for the effect of the natural variations that could occur into the structures
+due, for example, to thermal fluctuations.
+Andersen and coworkers [5] presented an improved version of the DSSP method in which
+the discrete assignments were substituted by continuous ones obtained from the former
+ones by varying the hydrogen-bond distance thresholds defined for each of the eight DSSP
+structural classes. The efficiency of DSSPcont method in capturing the effects of thermal
+fluctuations in NMR structure models has been shown to be higher than that of the discrete
+DSSP [5].
+Here we discuss the consistency of the ScrewFit assessments with the same criteria used by
+Andersen and coworkers and in particular we verify the stability of our set of parameters
+over the database F.
+For each NMR structure in F, we first calculated (for both parameters ∆ and ρ) the
+standard deviation of values over all the models. We then grouped these results when the
+corresponding mean values of the parameters fell within one of the ranges defined in Table
+13. The averages over these groups gave an estimation of the stability of parameters ∆ and ρ
+108 screwfit: a novel approach for continuum protein secondary structure assessments
+as a function of their values and could be compared to those obtained for DSSPcont in [5].
+Results for α-helices, β-strands and extended conformation are presented in Table 16.
+Table 16: Comparison of assessment consistency between ScrewFit and DSSPcont by the means of the
+root mean square deviation from average assignments. Value for DSSPcont are reprinted
+from [5]. Lines labeled with def refer to amplitudes of the ranges presented in Table 13 with
+respect to the corresponding parameter’s value. Extended conformation is given with the
+same values of β-strands when a differentiation between the two cannot be made. All values
+are in percentage.
+α-helix β-strand extended
+DSSPcont 13.1 11.3 11.3
+ScrewFit -ρ - NMR 13.7 29.3 29.3
+ScrewFit -ρ - def 11.9 44.0 44.0
+ScrewFit -∆ - NMR 9.1 4.4 8.2
+ScrewFit -∆ - def 7.6 7.2 7.1
+The first outcome of this analysis is that consistency of assignments in ScrewFit seems to
+be higher than in DSSPcont only for parameter ∆ and not for ρ. In fact, for the latter, the
+large deviation from the average values is clearly due to the lack of two distinct ranges for
+β-strands and for extended conformations. This is a direct effect of using continuous ranges
+of natural values for the definition of secondary structure elements and these differences
+between parameter consistency prove that in ScrewFit the combination of the two parameters,
+∆ and ρ, (combined with σ) is essential to make precise assessments.
+Moreover, Table 16 shows that, independently of the type of structural element, the root
+mean square differences for NMR models is coherent with the relative amplitudes of the
+ranges defined in Table 13. Nevertheless, it is worth noting that the use of ranges did not
+permit the same calculation for less represented structural elements like 310 and π helices
+and the comparison with DSSPcont with respect to the consistency of assignments remains
+incomplete. Corresponding work is in progress in order to obtain comparison also on the
+other DSSP structural classes.
+6.3 results and discussion 109
+6.3.4 Application
+In the following we will show a simple application of our method. This example underlines
+the combined approach which allows assessments on the protein secondary structure and
+a quantitative characterization of its changes within the same tool and without any further
+data treatment.
+BPTI Crystal forms
+As reported in our previous work [114], ScrewFit can be used to pinpoint small conformational
+changes due to several causes ranging from different experimental techniques to external
+environment changes like, for example, ligand binding or variation in pH. As an example we
+will consider here the case of the three different crystal forms of bovine pancreatic trypsin
+inhibitor (BPTI) which are known to be originated by different pH condition: pH values lower
+than 9.35 favor the form I and II crystals whereas higher pH values favor the form III.
+These three different crystal structures induce some small changes in protein conformation
+as reported in [209, 210]. In the original works, the authors compared the three structures
+of BPTI by means of inter-atomic distances in the backbone and/or in the side-chains. The
+outcome of this type of analysis was the finding of several local changes induced by the
+different crystal forms. Nevertheless, a detailed structural characterization of those changes
+was not possible.
+Here, we will first analyze the secondary structure assignments made by ScrewFit on the
+structure obtained from the crystal form I and we will then discuss the differences with the
+other two structures.
+For the determination of secondary structure motifs, we confront again the ScrewFit
+parameters with the secondary structure elements found by the DSSPcont method. The
+results are shown in Figure 30 (Panel B). The motifs found by DSSPcont are shown on the
+bottom of the figure. We used the same color scheme for both methods: red for α-helices,
+blue for β-strands and green for 3-10 helices. Visual inspection shows that most of the motifs
+found by DSSPcont correspond to the regions where the ScrewFit parameters are enclosed
+by the natural variations. Interestingly, our method is able to identify very well the α-turn
+between the two beta strands 19-25 and 30-36. These regions are highlighted in Figure 30
+(Panel B) with colored vertical bands. Minor discrepancies can, however, be observed in some
+regions, especially in the extreme residues of each element. In particular, ScrewFit finds that
+the assignment of the 310 helix between residues 3 and 6 is quite uncertain due to the highly
+110 screwfit: a novel approach for continuum protein secondary structure assessments
+Figure 34: ScrewFit profile for bovine pancreatic trypsin inhibitor (BPTI) in its three different crystal
+forms. This figure shows how ScrewFit is able to pinpoint small differences between similar
+structural configuration of the same protein. Here Crystal form I (black solid line, PDB:
+4PTI), form II (red solid line, PDB: 5PTI) and forms III (green solid line, PDB: 6PTI) are
+represented. Horizontal stripes define the natural variations for β-strands (colored in blue)
+and α-helices (colored in red).
+6.3 results and discussion 111
+deformed C-terminus which is characterized by abnormally high values for this structural
+element in parameters ∆ and ρ and by the value of σ very close to zero in residue 6 which
+evidently stands for a kink in the backbone profile.
+Let us now look at the effects of the three crystal forms on the structure of the BPTI. Figure
+34 shows the parameters calculated in the three different conformations of the protein. In
+each plot, the horizontal stripes indicate the range of variation for the ScrewFit parameters
+as found in databases A and B (the usual color-code is used here: α-helix highlighted in
+red; β-strands highlighted in blue; 310-helix highlighted in green). In the original works the
+authors reported some major differences between form I and form II in the regions 15-19,
+26-29, 39-41 and 47-50 and between form II and form III mainly localized in residues 15 and 26.
+It is worth noting that deviations of backbone close to residue 15 are particularly interesting,
+since this residue is part of the active site of the BPTI. The application of ScrewFit to the
+three structures confirms some of the differences mentioned above and allows them to be better
+characterized. In particular, changes around both residue 15 and 26 show major discrepancies
+between the conformation in crystal form III and the other two. In residue 15, parameter ∆
+changes, from form I and II to form III, toward values closer to a helix-turn conformation
+but the absence of equivalent changes in the other two parameters proves that this change is
+only due to a different relative orientation of the peptide planes related to a reorientation of
+the side-chains between residues 15 and 16. The analysis of parameters’ values for residue
+26 leads to similar conclusions. A confirmation of these findings can be done with a direct
+visualization of the structure as shown in Figure 34. Additionally, ScrewFit reveals also a
+difference between the crystal form II and the other two at the C-terminus of the α-helix
+in region 47-53. In this case the parameter σ shows that in form II the helix axis is rather
+straight whereas in the other two forms it clearly bends.
+The application of DSSPcont on the same structures confirmed that the major differences
+between crystal form I and crystal form II were localized in the regions around residues 15
+and 26, where a higher probability is reported, in form II rather than in form I, of having
+respectively a non-structured and a helix-turn conformation. Nevertheless, DSSPcont does
+not find any relevant change between crystal form II and form III which was detected by
+ScrewFit.
+112 screwfit: a novel approach for continuum protein secondary structure assessments
+6.4 conclusion
+We presented the ScrewFit method for the analysis of the secondary structure level of proteins,
+which describes the latter in terms of local helix parameters obtained by the screw motions
+relating consecutive peptide planes. By construction, this method represents, ipso facto, a
+new approach to the so-called continuous methods for the secondary structure assessments
+because it does not relate to beforehand threshold-based definitions but only to geometrical
+criteria which are verified a posteriori on natural secondary structure elements.
+To establish confidence levels for the definition of all types of elements, we applied our
+method to different well defined selections of protein structures. The natural variations in
+parameters of ScrewFit have been shown to be coherent with the ideal values obtained in a
+previous work.
+We have then confirmed the reliability of our definitions by applying our method on a
+heterogeneous set of proteins with different type of folds. In order to show the efficiency and
+accuracy of ScrewFit we compared it with other methods, in particular with DSSP and DSSPcont.
+The outcome of this comparison showed that ScrewFit can be considered as accurate as
+DSSP/DSSPcont as a function of crystallographic resolution. As an example, we analyzed the
+three different crystal forms of the bovine pancreatic trypsin inhibitor by means of ScrewFit.
+This application has shown that ScrewFit finds essentially the same structural elements
+as DSSP, but gives also a more detailed description of them, leading in some cases to a
+different assessment of secondary structure elements. It is worth noting that the method is
+also shown to be efficient in detecting some kind of reverse turns and random coils. Further
+improvements to permit more detailed assignments also of these motifs are the subject of
+work in progress.
+As a whole, with the same application we showed that ScrewFit is able to pinpoint small
+structural changes and to give a global view of the structural rearrangements of the protein
+as a response to external changes.
+In this context, another important feature of the method is the fact of combining in the same
+tool a method for detecting secondary structure and a way to find and characterize any
+induced structural change.
+It should be mentioned that while ScrewFit was developed for the analysis of protein
+secondary structures, with some minor improvements, it may also be used to characterize the
+protein supersecondary motifs and the folds of DNA and RNA molecules. Corresponding
+work is also in progress.
+6.5 notes 113
+6.5 notes
+[i] It can be easily verified that the ranges found for the parameter for ρ in α-helices and
+in 310-helices are fully compatible with those obtained by Barlow and Thornton [9] [ see
+section 5.3.2] on a rather smaller set of ∼ 100 structures.
+
+7
+RESULTS
+As stated in the introduction, one of the principal aims of this work was the characterization
+of both dynamical and structural aspects in protein adaptation to environmental conditions.
+In the present chapter, results obtained in this thesis for the particular case of the IF6s will be
+presented and discussed.
+After a summary on the samples used in this work and the environmental conditions
+investigated, the discussion will focus on the analysis of structural and dynamical effects of
+pressure and temperature on each sample. The results will be used to determine both local
+and global effects of the environmental conditions on IF6 homologues. The link between the
+assessment of both types of effects will be assured by the complementarity of the insights
+obtained by molecular dynamics (MD) and quasielastic neutron scattering (QENS).
+The samples that have been studied either by MD simulations or by QENS experiments are:
+- aIF6: the extremophile IF6 homologue from Methanococcus jannaschii.
+- aIF6-HTag: the extremophile homologue with the supplemental N-terminal poly-
+histidine tag (HTag). This sample was used in the high pressure QENS experiments and
+was needed during the production phase in order to enhance the expression protocol
+yield.
+- eIF6: the modeled mesophile IF6 homologue from Saccharomyces cerevisiae.
+- eIF6-NoCTAIL: the mesophile homologue with the C-terminal tail cleaved.
+The different environmental conditions used in MD are listed in Table 17, whereas those
+used in QENS measurements are shown in Table 18. It is worth noting here that the number
+and the variety of experimental measurements was largely constrained by several technical
+facts, as will be explained later in this chapter. Nevertheless, a comparison with the results obtained
+from MD was possible through a limited set of measurements. The environmental
+conditions listed in Tables 17 and 18 will be selectively chosen in the next section to present
+different aspects. Unless explicitly mentioned, the results shown here were obtained from
+115
+116 results
+molecular dynamics simulations.
+Table 17: Set of MD simulations of each sample performed with different environmental configurations
+aIF6 eIF6 eIF6-NoCTAIL
+300K - 1bar 300K - 1bar 300K - 1bar
+300K - 250bar 320K - 1bar 300K - 500bar
+300K - 500bar 350K - 1bar 350K - 1bar
+350K - 1bar 350K - 500bar 350K - 500bar
+350K - 250bar
+350K - 500bar
+Table 18: Set of QENS measurements of each sample performed with different environmental configu-
+rations
+aIF6 eIF6 aIF6-HTag
+300K - 1bar 300K - 1bar 300K - 250bar
+350K - 1bar 350K - 1bar 300K - 500bar
+350K - 250bar
+350K - 500bar
+7.1 effects of pressure and temperature change on if6s structure
+The following section presents a study of the structural response of IF6s to changes in
+pressure and temperature.
+7.1 effects of pressure and temperature change on if6s structure 117
+When high pressure and high temperature are applied to protein solution, one of the main
+effects that one would expect to see is the change in molecular volume and molecular surface
+exposed to the solvent.
+Figure 36 shows the volume change induced in aIF6 and eIF6 by a pressure change
+equivalent to 500bar at 300K and 350K. Here the molecular volume was estimated by the
+volume related to the surface accessible to solvent molecules. The extremophile IF6 structure
+seems to be less sensitive to environmental changes than its mesophilic counterpart. This
+observation is also corroborated by Figure 37 which shows the variation of the radius of
+gyration (Rgyr) in eIF6 and aIF6, respectively. This quantity, defined by
+$$R_{gyr} = \sqrt{\frac{1}{N}\sum_{i=1}^{N}\left(R_i - R_{CM}\right)^2}, \qquad (7.1)$$
+is the root mean square distance of atoms from the protein center of mass (RCM). Although
+Rgyr is commonly used to give insight into the global shape of proteins, here it cannot be
+used to give an exact representation of IF6s, as the latter has a torus-like shape (see Figure 35)
+and the atomic mean distance does not distinguish between changes in either the internal
+or the external radius of the torus. Nonetheless, Rgyr can be used to give a qualitative
+representation of shape changes in IF6s. Indeed Rgyr of aIF6 varies in a narrow range from
+16.45 to 16.75 Å, indicating that the protein structure is rather insensitive to environmental
+changes. In eIF6, Rgyr does not significantly change at 300K when pressure is applied
+whereas it shows a very large variation when pressure is applied at high temperature (350K).
+Interestingly radial values of aIF6 at extremophilic natural conditions (350K and ∼ 500bar) are
+very similar to those of eIF6 in mesophilic natural conditions (300K and 1bar).
+Similar observations can be made with respect to the solvent accessible surface area (SASA) shown
+in Figure 38. The differences in variation of SASA between the two homologues at 350K
+reveal that the changes found in Rgyr of eIF6 must be mainly related to the increase of the
+total surface exposed to the solvent.
+7.1.1 Local effects
+The local effects produced by pressure and temperature on IF6s structures can be probed
+using the root mean square fluctuations $\mathrm{RMSF}(i) = \sqrt{\langle (R_i(t) - \langle R_i \rangle)^2 \rangle}$, where i can refer to
+either an atom or a group of atoms (e.g., backbones or sidechains); in the latter case an
+118 results
+Figure 35: Cartoon representation of IF6 structure.
+300K 1bar
+45.5
+300K 500bar A)
+350K 1bar
+45 350K 500bar
+44.5
+44
+43.5
+43
+42.5
+0 500 1000 1500 2000
+time [ps]
+300K 1bar
+45.5
+300K 500bar B)
+350K 1bar
+45 350K 500bar
+44.5
+44
+43.5
+43
+42.5
+0 500 1000 1500 2000
+time [ps]
+Figure 36: Molecular volume of IF6s with respect to pressure and temperature. Panel A: aIF6. Panel B:
+eIF6.
+Volume [Å3] Volume [Å3]
+7.1 effects of pressure and temperature change on if6s structure 119
+17 17300K 1bar
+A) 300K 500bar B)
+350K 1bar
+16.9 16.9
+350K 500bar
+16.8 16.8
+16.7 16.7
+16.6 16.6
+16.5 16.5
+300K 1bar
+300K 500bar
+16.4 16.4
+350K 1bar
+350K 500bar
+16.3 16.3
+0 500 1000 1500 2000 0 500 1000 1500 2000
+time [ps] time [ps]
+Figure 37: Radius of gyration of IF6s as a function of time. Panel A: aIF6. Panel B: eIF6. Only residues
+from 1 to 225 are taken into account.
+11600 300K 1bar 11600 300K 1bar
+300K 500bar A) B) 300K 500bar
+350K 1bar 350K 1bar
+11400 11400350K 500bar 350K 500bar
+11200 11200
+11000 11000
+10800 10800
+10600 10600
+10400 10400
+0 500 1000 1500 2000 0 500 1000 1500 2000
+time [ps] time [ps]
+Figure 38: Solvent accessible surface area of IF6s as a function of time. Panel A: aIF6. Panel B: eIF6.
+Radius of gyration [Å]
+Solvent Accessible Surface Area [Å^2]
+Solvent Accessible Surface Area [Å^2] Radius of gyration [Å]
+120 results
+average over the atoms of the group is performed.
+A) B)
+Figure 39: Root-mean-square-fluctuation (RMSF) of carbon Cα in aIF6 backbone.
+A) B)
+Figure 40: Root-mean-square-fluctuation (RMSF) of carbon Cα in eIF6 backbone. Panel A: Region
+1-224. Panel B: Region 1-245.
+The RMSF of carbon Cα in aIF6’s backbone (Figure 39) shows that at 300K atomic fluc-
+tuations of residues are slightly reduced by pressure on the whole structure but a more
+significant variation is found in the region 80-90 . The latter region corresponds to the α-helix
+of one of the five pseudo-symmetric subdomains which compose the IF6 structure. No
+7.1 effects of pressure and temperature change on if6s structure 121
+significant differences are found between RMSF at 250bar and 500bar whereas at 350K the
+same region 80-90 shows RMSF increased by pressure. Moreover, as one would expect the
+general effect of temperature is to increase RMSF.
+The changes due to pressure found in aIF6 are not present in eIF6 where instead RMSF in
+region 80-90 is increased by temperature but reduced by pressure.
+In both cases, these results lead to the conviction that pressure and temperature can induce
+large changes in the exposure to the solvent of the α-helix in region 80-90 which results in a
+higher or lower RMSF of Cα atoms in the region. This observation is supported by visual
+inspection of both aIF6 and eIF6 sequences which reveals that the α-helix is highly charged
+and thus it has a high propensity for interaction with solvent.
+Figure 40 shows that eIF6, at both 300K and 350K, has a higher baseline for Cα fluctuations,
+probably due to the presence of the C-terminal tail of 21 amino acids (CTAIL) which could
+transmit supplemental fluctuations to the rest of the protein structure. In the same context, it
+is worth noting that at high temperature this baseline is particularly increased for residues
+from 100 to 220, as shown in Figure 40.
+7.1.2 Secondary structure changes
+Even though the calculation of RMSF allowed several qualitative assessments on the effects
+of pressure and temperature on IF6s’ structures, a finer method is necessary to quantify
+them. For this purpose, the ScrewFit method will be used here to characterize the response
+of IF6s to the environmental changes. In particular the method will be used to analyze the
+molecular structures obtained by time-averaging of the atomic trajectories issued from the MD
+simulations in order to make assessments on the local flexibility of the secondary structure of
+IF6.
+The first application of ScrewFit on the time-averaged structure of both aIF6 and eIF6 at 300K
+and 1bar allows one to distinguish the very similar secondary structure of the five subdomains
+which compose the IF6 structure (Figure 41 shows the aIF6’s profile). The inspection by eye
+allows the five motifs to be found through their regular profiles. Here, the discussion will be
+limited to the motif in the region 52-100 but the same conclusions can be obtained also from
+any of the other structural subdomains.
+Groft and coworkers [66], who reported the presence of subdomains in a five-axis pseudo-
+symmetry in IF6 structures, stated also that the almost invariant secondary structure profile of
+these subdomains was made of a long α-helix, a shorter one (alternatively a 310-helix was also
+122 results
+found) and three β-strands. Here the analysis of the orientational distance and of the radius
+of the helix of screw motion, seems to confirm the presence of a tight α-helix or more likely
+a 310-helix in residues 57-60 followed by two β-strands in the region 60-75 (See previous
+chapters for reference values). The latter have, however, a very variable straightness, meaning
+that they have a very curved form, as one can verify by visual inspection on molecular
+structure.
+Residues 78-90 clearly form a long and straight α-helix as evident from the comparison
+of values of the three parameters. Nonetheless, the C-terminus of this long α-helix shows
+a curved region as shown again by the straightness parameter which attains values close
+to zero. This result confirms and completes the observation made on the RMSF in the
+region around residue 90 in both aIF6 and eIF6. Indeed, variations found in the RMSF
+must correspond to changes in the curvature of the C-terminal region of the α-helix. The
+subdomain ends with a rather straight short β-strand from residue 90 to 100.
+1
+0.9
+0.8
+0.7
+0.6
+0.5
+0.4
+0 20 40 60 80 100 120 140 160 180 200 220
+0.4
+0.3
+0.2
+0.1
+0
+0 20 40 60 80 100 120 140 160 180 200 220
+1
+0.5
+0
+-0.5
+0 20 40 60 80 100 120 140 160 180 200 220
+Residues
+Figure 41: Secondary structure profile of aIF6 as detected by ScrewFit algorithm. The subdomain
+52-100 is highlighted by grey stripes.
+Straightness
+Helix Radius Orientational distance
+7.1 effects of pressure and temperature change on if6s structure 123
+Once the profile of IF6 secondary structure is characterized by ScrewFit parameters,
+one can observe the changes of the same parameters under the effect of high pressure and
+temperature. Nevertheless, as reported in [22], a direct comparison of the structures of eIF6
+and aIF6 will not be possible due to the presence of several deletions and insertions in
+sequences of both homologues which do not permit a direct structural alignment of the two
+IF6s without gaps.
+Figures 42 and 43 show the effects of temperature and pressure on both structures by means
+of differences of ScrewFit profiles. Profiles at high temperature or pressure were subtracted
+from the profile at 300K and 1bar to obtain the differences shown in figures. The outcome of
+the analysis of these figures is listed in the following. In both cases distinct effects due to
+temperature or pressure have been observed.
+aIF6
+- At 350K-1bar aIF6 shows a higher value of orientational distance in region around residue
+60 and between residue 120 and 130. In both cases this reflects a significant distortion of
+the helical conformation without change in the local curvature of backbone as evidenced
+by a rather small variation in straightness values.
+- High pressure (500bar), induces a significant change in residues 90-95. The inspection of all
+parameters seems to confirm that pressure induces a more curved structure and locally
+residues assume a conformation more similar to the neighbor α-helix 78-90 rather than
+to β-strand 90-100.
+- The combination of high temperature and high pressure has another significant effect
+around residue 50 where a transition towards a more curled conformation is evident
+from values of orientational distance and helix radius.
+eIF6
+- Large variations of all parameters in the region 220-245 are clearly due to the large fluctua-
+tions of CTAIL. These variations increase, as expected, with temperature.
+- Different variations in the region 170-180 are shown as effects of both temperature and pres-
+sure when applied separately but they are not present when a simultaneous application
+of high pressure and high temperature is performed (see also Figure 44).
+124 results
+300K-1bar vs 300K-500bar
+0.2 300K-1bar vs 350K-1bar
+300K-1bar vs 350K-500bar
+0.1
+0
+-0.1
+0 20 40 60 80 100 120 140 160 180 200 220
+0.05
+0
+-0.05
+-0.1
+-0.15
+-0.20 20 40 60 80 100 120 140 160 180 200 220
+1
+0.5
+0
+-0.5
+0 20 40 60 80 100 120 140 160 180 200 220
+Residues
+Figure 42: Effects of pressure and temperature on ScrewFit parameters of aIF6 secondary structure.
+- Combination of high temperature and high pressure produces an evident change in all
+parameters in the region 35-45 which corresponds to the long α-helix of the first subdo-
+main of IF6 structure. As for region 78-90 in aIF6, also here variations are related to
+a major curvature of the C-terminus of the α-helix. Several different configurations of
+peptide planes in region 35-45 are shown by variations in orientational distance and
+helix radius.
+Interestingly, changes in ScrewFit profiles of eIF6 and aIF6 appear in different regions. The
+former is more affected in residues between 160 and 245 and between 1 and 50, whereas the
+latter is more significantly affected in the central region 50-140.
+7.1.3 Relation between local structural effects and IF6 function
+Very little is known about how IF6 performs its functions. Only a few insights were reported
+by Basu et al. [11] and by Groft et al. [66]:
+• Serines 174 and 175 are found to play an essential role in nuclear localization of IF6s
+which must be related to the phosphorylation of these two residues.
+Straightness Helix Radius Orientational Distance
+7.1 effects of pressure and temperature change on if6s structure 125
+300K-1bar vs 300K-500bar
+300K-1bar vs 350K-1bar
+300K-1bar vs 350K-500bar
+0.4
+0.2
+0
+-0.2
+-0.40 20 40 60 80 100 120 140 160 180 200 220 240
+0.3
+0.2
+0.1
+0
+-0.1
+-0.2
+0 20 40 60 80 100 120 140 160 180 200 220 240
+2
+1
+0
+-1
+-20 20 40 60 80 100 120 140 160 180 200 220 240
+Residues
+Figure 43: Effects of pressure and temperature on ScrewFit parameters of eIF6 secondary structure.
+Figure 44: Time-averaged structures of eIF6 at 300K-1bar and 300K-500bar. The structure of the C-
+terminal region of the α-helix is significantly changed by pressure. This variation affects the
+position of Serine 174 and Serine 175. Color scheme: red for eIF6 structure at 300K-1bar and
+blue for structure at 300K-500bar. Cartoon representations of secondary structure elements
+are built following the DSSP assignments.
+Straightness Helix Radius Orientational Distance
+126 results
+• Arginine 61 in eIF6 is found to close the central hollow of IF6 structure and prevent
+water molecules passing through it. This fact could have effects on the global stability
+of IF6s structures.
+• The C-terminal region (to be distinguished from CTAIL which is formed by residues
+224-245) encompassing the evolutionarily conserved arginines and tyrosines Arg 67,
+Tyr 113, Arg 223 and Tyr 202 represents an excellent candidate for the participation in a
+biologically relevant protein-protein interaction. Indeed it is suggested as the binding
+site for the 60S ribosomal subunit.
+Some of the structural changes found in this work and induced by pressure and/or
+temperature involved the residues mentioned above, meaning that the corresponding
+structural re-arrangements could be related to the functional adaptation of IF6.
+In particular it was reported that the region including the two serines 174 and 175 undergoes
+structural changes at high pressure (Figure 44) and high temperature separately but it assumes
+its normal configuration when both pressure and temperature are increased. This result seems
+to be crucial for the assessment of the function of eIF6 under extreme conditions similar to
+those of warm deep seas. The C-terminal is obviously also largely influenced by the presence
+of CTAIL which induces fluctuations in eIF6 that are not present in aIF6. Also this fact
+will be used in the following to discuss the ability of eIF6 to adapt its function to extreme
+environments. As a whole, aIF6 seems to show a higher stability with respect to the change
+of the thermodynamic variables. Nonetheless, it shows some significant changes in backbone
+conformation in regions apparently not related to protein function.
+Finally, the comparison of RMSF and ScrewFit parameters for Arg 61 did not give any
+significant result in structural changes on the time scales used in this work.
+7.1.4 Comparison between ScrewFit profiles of eIF6 and eIF6-NoCTAIL
+In order to better understand the role of CTAIL in (de)stabilizing eIF6 structure, a supple-
+mental MD simulation was performed on eIF6’s structure without its C-terminal tail. The
+protocol used for this simulation was mentioned in the chapter on system setups.
+Comparison of ScrewFit profile of eIF6-NoCTAIL (Figure 45) with that of complete eIF6, reveals
+the absence of variations that characterized eIF6 in the previous paragraphs. Moreover, the
+variations in ScrewFit parameters in eIF6-NoCTAIL are more similar and closer in sequence
+localization to those shown for aIF6.
+7.1 effects of pressure and temperature change on if6s structure 127
+The observations made above lead to the conclusion that CTAIL could play an important
+role in structural adaptation of IF6 to extreme environment. In particular it seems that the
+presence of this C-terminal tail induces thermal fluctuations to the backbone of the rest of
+IF6 structure leading to a lower protein stability. As will be shown later in this chapter, the
+effects of pressure and temperature induced through CTAIL fluctuations do not cause only
+structural changes but also a different scheme of IF6 dynamical response to environmental
+changes.
+300K-1bar vs 300K-500bar
+300K-1bar vs 350K-1bar
+0.6 300K-1bar vs 350K-500bar
+0.4
+0.2
+0
+-0.2
+0 20 40 60 80 100 120 140 160 180 200 220
+0.2
+0.1
+0
+-0.1
+-0.20 20 40 60 80 100 120 140 160 180 200 220
+0.5
+0
+-0.5
+0 20 40 60 80 100 120 140 160 180 200 220
+Residues
+Figure 45: Effects of pressure and temperature on ScrewFit parameters of eIF6-NoCTAIL secondary
+structure.
+7.1.5 Comparison between ScrewFit profiles of aIF6 and aIF6-HTag
+As recalled at the start of this chapter, high pressure QENS experiments were performed on
+aIF6 with an attached supplemental N-terminal tail of 21 amino acids (HTag). This tail was
+essential to improve the yield of protein production. The same sample (aIF6-HTag) was also
+studied by MD simulations to make comparison with experimental data possible. aIF6-HTag
+Straightness Helix Radius Orientational Distance
+128 results
+time-averaged structure was initially analyzed by ScrewFit in order to identify differences
+with other samples and to verify the structural effect of the HTag on the protein itself.
+ScrewFit differences between structures of aIF6-HTag at different pressures and temperatures
+are shown in Figure 46. Here the beginning of the residue sequence was shifted to -20 in
+order to maintain the usual numbers in the conserved part of the structure.
+First of all, the effect of the HTag is clearly present in all parameters as large variations in the
+region from -21 to 0 but in contrast to the effects produced by CTAIL on eIF6 structure, here
+these changes are localized only in the region of the HTag and do not propagate over the rest
+of the structure.
+Moreover, the region between residues 40 and 50 seems to undergo the same changes found
+in aIF6, meaning that this region is intrinsically sensitive to environmental changes probably
+due to its exposure to solvent.
+300K-1bar vs 300K-500bar
+300K-1bar vs 350K-1bar
+0.4 300K-1bar vs 350K-500bar
+0.2
+0
+-0.2
+-20 0 20 40 60 80 100 120 140 160 180 200 220
+0.2
+0.1
+0
+-0.1
+-0.2
+-20 0 20 40 60 80 100 120 140 160 180 200 220
+2
+1.5
+1
+0.5
+0
+-0.5
+-20 0 20 40 60 80 100 120 140 160 180 200 220
+Residues
+Figure 46: Effects of pressure and temperature on ScrewFit parameters of aIF6-HTag secondary
+structure.
+Finally, it is worth noting that the major change in the whole structure happens in region
+110-115 and is present almost in the same way in all conditions. This fact suggests that the
+Straightness Helix Radius Orientational Distance
+7.1 effects of pressure and temperature change on if6s structure 129
+latter is a structural arrangement compatible only with the structure at 300K-1bar.
+The outcome of this comparison of ScrewFit profiles as well as the others was that both
+aIF6 and eIF6 are largely affected by the possible presence of an additional sequence of amino
+acids either in their N- or C- termini. Nevertheless, the effects produced strictly depend on
+the rest of the protein structure and can be very different.
+7.1.6 Elastic Incoherent Structure Factor
+As stated in the chapter on Material and Methods, the Elastic Incoherent Structure Factor gives
+insights into the configurational space volume explored by atomic motions in macromolecules.
+As for other scattering functions, in the case of biomolecules, also the EISF is largely dominated
+by hydrogen contributions and it can be approximated as due to the motions of only one
+single representative scattering atom.
+The EISF has already been used widely to characterize the structural "flexibility" of proteins
+because it can be directly related to atomic mean square displacement (MSD). Indeed, for
+small values of the momentum transfer, it can be proved that the equation 2.42 can be
+approximated by the following expression [15]:
+$$\mathrm{EISF}(q) = \lim_{t\to\infty} I(q,t) = \exp\left(-q^2\langle x^2\rangle\right), \qquad (7.2)$$
+which has a Gaussian form. In reality the Gaussian approximation holds strictly only for
+q → 0 [15]. The above equation reveals that 〈x2〉 can be directly obtained from the EISF via:
+$$\langle x^2\rangle = -\frac{\ln \mathrm{EISF}(q)}{q^2} \qquad (7.3)$$
+Using equation 2.42, the EISF of aIF6 and eIF6 have been calculated. Here and in the
+following, the quantities of interest are calculated only on the evolutionary "conserved" part
+of the IF6, i.e. on the region 1-224, filtering out the contribution of the C-terminal tail. A first
+comparison of EISF from aIF6 ( Figure 47 - Panel A) and eIF6 ( Figure 47 - Panel B) underlines
+two main differences between the two samples:
+- In both cases pressure makes the slope of EISF only slightly change whereas temperature
+has a much more evident effect
+- Even though aIF6 shows qualitatively the same behavior as eIF6, its variations due to
+pressure are very limited. Moreover, at high temperature (350K), EISFs at 1bar and
+500bar are almost identical.
+130 results
+A) B)
+Figure 47: Elastic Incoherent Structure Factor for aIF6 and eIF6.
+Looking at these results, one would conclude that the difference between the two samples
+is mainly related to their stiffness/softness character [216], but the direct comparison of EISFs
+in Figure 48 shows also another interesting outcome: EISFs of aIF6 at high temperature are
+very similar to those of eIF6 at 300K. This means that configurational spaces explored have
+the same extent in both samples when they are both in their natural conditions.
+Furthermore, EISF from eIF6 at high temperature shows a much more rapid decrease as a
+function of the momentum transfer with respect to the other EISFs. Another interpretation
+for this result is given by the atomic position fluctuation, 〈x2〉, obtained from equation 7.3
+and shown in Figure 48 (Panel B). From this figure it seems evident that atomic fluctuations
+can be analyzed as function of the momentum transfer. This does, however, not necessarily
+mean that the Gaussian approximation given above does not hold, but only that it is not
+compatible with the assumption of one single representative scattering atom. It has, in fact,
+been shown that the Gaussian model can represent the EISF of a protein up to moderate q
+values, since such a model can account for motional heterogeneity.
+The 〈x2〉 attains larger values for eIF6 at high temperature (at both pressures), meaning that
+fluctuations increase and involve the motion of rather large group of atoms or structural
+domains (q < 20nm−1). It is also worth noting here that the EISF (and the corresponding
+〈x2〉) from eIF6 at 300K-500bar superpose slightly better than the one at eIF6-300K-1bar to
+aIF6 1bar/500bar.
+7.1 effects of pressure and temperature change on if6s structure 131
+1
+A) eIF6(1-224) 300K 1bar
+eIF6(1-224) 300K 500bar
+eIF6(1-224) 350K 1bar
+0.8 eIF6(1-224) 350K 500bar
+aIF6 300K 1bar
+aIF6 300K 500bar
+aIF6 350K 1bar
+0.6 aIF6 350K 500bar
+0.4
+0.2
+0
+0 20 40 60 80 100
+q [nm-1]
+B) eIF6(1-224) 300K 1bar
+eIF6(1-224) 300K 500bar
+0.008 eIF6(1-224) 350K 1bar
+eIF6(1-224) 350K 500bar
+aIF6 300K 1bar
+aIF6 300K 500bar
+0.006 aIF6 350K 1bar
+aIF6 350K 500bar
+0.004
+0.002
+0 20 40 60 80 100
+q [nm-1]
+Figure 48: Panel A): Comparison of EISFs from aIF6 and eIF6. Panel B): Atomic mean fluctuations as
+obtained from equation 7.3
+<x2>  [Å2]
+EISF
+132 results
+characterization of eif6-noctail and aif6-htag structure and dynamics
+In this chapter, a hypothesis on the characterization of structural and dynamical properties
+of eIF6 and aIF6 is proposed. In particular the comparison of different EISFs will be used to
+assess the existence of corresponding states between aIF6 and eIF6.
+Here, similar characterization will be sketched also for eIF6-NoCTAIL and aIF6-HTag in
+order to use them later in a more detailed discussion of the results.
+EISFs from aIF6-HTag are compared to those of eIF6 and aIF6 at different temperature and
+pressure and plotted in Figure 49. Interestingly, this result, together with the analysis made
+by ScrewFit in the previous sections, shows that aIF6-HTag has the same structural properties
+as eIF6. An opposite result was obtained from comparison of EISFs from eIF6-NoCTAIL with
+both eIF6 and aIF6 (Figure 50). Here, it seems that, even though EISFs from eIF6-NoCTAIL
+are very similar to those from aIF6, they show that the former has a less compact structure as
+shown in Figure 51.
+1
+aIF6-HTag(1-224) 300K 1bar
+aIF6-HTag(1-224) 300K 500bar
+aIF6-HTag(1-224) 350K 1bar
+0.8 eIF6(1-224) 300K 1bar
+eIF6(1-224) 350K 500bar
+aIF6 300K 1bar
+0.6
+0.4
+0.2
+0
+0 20 40 60 80 100
+q [nm-1]
+Figure 49: Elastic Incoherent Structure Factor for aIF6-HTag compared to EISFs from eIF6 and aIF6.
+EISF
+7.1 effects of pressure and temperature change on if6s structure 133
+1
+aIF6 300K 1bar
+aIF6 350K 1bar
+eIF6-NoCTAIL 300K 1bar
+0.8 eIF6-NoCTAIL 350K 500bar
+eIF6 300K 1bar
+eIF6 350K 1bar
+0.6
+0.4
+0.2
+0
+0 20 40 60 80 100
+Figure 50: Elastic Incoherent Structure Factor for eIF6-NoCTAIL compared to EISFs from eIF6 and
+aIF6.
+aIF6 300K 1bar
+aIF6 350K 1bar
+0.008 eIF6-NoCTAIL 300K 1bar
+eIF6-NoCTAIL 350K 500bar
+eIF6 300K 1bar
+eIF6-NoCTAIL 350K 1bar
+0.006
+0.004
+0.002
+0 20 40 60 80 100
+q [nm-1]
+Figure 51: Atomic mean square displacement (MSD) of eIF6-NoCTAIL as function of momentum
+transfer. Comparison with MSD from eIF6 and aIF6 is shown.
+<x2> [Å2]
+134 results
+7.2 effects of pressure and temperature on if6s dynamics
+7.2.1 Dynamical models
+The data issued from neutron scattering measurements need to be interpreted in a frame of
+physical models describing the different types of motions which compose the global status
+of the sample. The easiest assumption which is usually made is to consider every type of
+motion de-correlated with respect to the others and every atom dynamically equivalent to
+the others. For this, the position of the atom i reads:
+Ri = RCM + ri + ui (7.4)
+where RCM is the position of the center of mass (CM) of the sample, ri is the atom position
+with respect to CM and ui is the deviation from the equilibrium position RCM + ri. These
+assumptions are reliable for small molecules with some degrees of symmetry but become
+an approximation when applied to much more complex molecules like proteins. Assuming
+that the latter is acceptable, i.e. that atom i represents the average dynamical properties of all
+atoms in the sample, the intermediate scattering function can be recast as follows:
+FH(q, t) = FCM(q, t) · Frot(q, t) · Fint(q, t) (7.5)
+here the "rot" and "int" indexes refer to global rotational and internal motions, respectively.
+Fourier transformation of 7.5 gives the relation for the dynamic structure factor which reads
+now:
+$$S_H(q,\omega) = S_{CM}(q,\omega) \otimes S_{rot}(q,\omega) \otimes S_{int}(q,\omega) \tag{7.6}$$
+The term due to translation of the center of mass can be described following Fick’s law of
+diffusion of a free particle [13]. For the latter, particles positions are governed by a Gaussian
+probability and thus, the intermediate scattering function F(q, t) will have a Gaussian form
+as function of the momentum transfer [164]. The corresponding dynamic structure factor
+S(q,ω) will have a Lorentzian form:
+$$S(q,\omega) = \frac{1}{\pi}\,\frac{Dq^2}{(Dq^2)^2 + \omega^2} \tag{7.7}$$
+7.2 effects of pressure and temperature on if6s dynamics 135
+where D is the diffusion constant and the half-width-half-maximum (HWHM) is defined by
+Dq2. The contribution to equation 7.6 due to global rotational diffusion is more complicated
+to obtain because it requires a description of molecules as rigid-bodies [37]. As stated in
+Chapter 2, this term is not taken into account in our QENS measurements because it is largely
+beyond the experimental resolution used here. Finally, several models have been developed
+to analyze the internal motions of atoms in large molecules like proteins. This means that,
+in the simplest case, all types of atomic diffusion motions which can be found into large
+molecules, are averaged to find a unique dynamical property for all atoms that characterize
+the molecule. This usually results in time-correlation functions characterized by a unique
+relaxation time associated with all atoms in molecules.
+However, a discussion of all these models would be out of the scope of this thesis and accounts
+can be found in many excellent reviews. Here a brief summary will be given of the model
+used in this work to characterize atomic motions in proteins.
+7.2.2 Fractional Brownian Dynamics
+To interpret both the simulated and experimental data, the fractional Ornstein-Uhlenbeck
+(OU) process [137] is used as an analytical model for the atomic motions in a protein. The
+model describes anomalous diffusion in a harmonic potential, where the latter accounts for
+the fact that atomic motions in a protein are confined in space. The anomalous diffusion
+describes slow, non-exponential structural relaxation in the functional dynamics of proteins,
+which has been observed in the past on the microsecond to second time scale by fluorescence
+correlation spectroscopy[214] and by kinetic studies[64]. The existence of fractional Brownian
+dynamics in proteins on the nanosecond time scale has been recently demonstrated by
+analyses of molecular dynamics simulations [119] and the fractional OU process has been
+introduced in [113] for the interpretation of QENS spectra from proteins. It can be considered
+as an extension of a simple harmonic protein model, which has been used in the past to
+describe elastic neutron scattering profiles, in particular to extract the “resilience” of proteins
+in terms of an average force constant [216]. The fractional OU process (fOU) adds to this a
+description of the relaxation dynamics, which is measured in QENS experiments.
+Full details of fOU model and its application to protein dynamics can be found in previous
+works [119, 113, 19, 20] and here I will recall only the key points needed for the following
+136 results
+analysis of MD and QENS data.
+time-dependent mean-square displacement The most elementary quantity to
+be considered in the context of diffusion processes is the time-dependent mean-square
+displacement (tMSD),
+W(t) := 〈[x(t) − x(0)]2〉, (7.8)
+where x is the position of the diffusing particle and the brackets indicate a thermal average.
+In case that the dynamics of the particle is confined in space, the tMSD will tend to a plateau
+value, which is given by $2\langle x^2\rangle$. For the fractional OU process one has
+$$W(t) = 2\langle x^2\rangle \left(1 - E_\alpha(-[t/\tau]^\alpha)\right). \tag{7.9}$$
+Here $E_\alpha(z)$ is the Mittag-Leffler function [52]
+$$E_\alpha(z) = \sum_{k=0}^{\infty} \frac{z^k}{\Gamma(1+\alpha k)}, \tag{7.10}$$
+where Γ(.) denotes the generalized factorial [2]. One recognizes that for α = 1, where Γ(1+
+αk) = Γ(1+ k) = k!, the exponential function is retrieved from expression (7.10), i.e. E1(z) =
+exp(z). In this case the fractional OU process becomes the well-known standard Markovian
+OU process, which is characterized by exponential relaxation functions [205, 59, 164]. As
+indicated in [117], the fractional counterpart is characterized by non-Markovian memory
+effects, which lead to non-exponential correlation functions.
+Expressions (7.10) and (7.9) show that the proposed model contains three parameters:
+1. the position fluctuation 〈x2〉,
+2. the parameter α indicating the deviation from exponential behavior,
+3. the time scale parameter τ.
+These parameters will be considered as q-dependent and will give account of the multiple
+relaxation dynamics that characterize the internal motions of proteins.
+relaxation rate spectrum The function $E_\alpha(-[t/\tau]^\alpha)$ can be considered as a
+“stretched” generalized exponential function. The non-exponential character of this func-
+tion can be most easily visualized by writing it as a superposition of normal exponential
+functions. Using for simplicity a dimensionless time variable we have
+$$E_\alpha(-t^\alpha) = \int_0^\infty d\lambda\, p_\alpha(\lambda) \exp(-\lambda t), \tag{7.11}$$
+7.2 effects of pressure and temperature on if6s dynamics 137
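+where pα(λ) is a normalized and positive distribution function, which is of the form [64,
+117]
+$$p_\alpha(\lambda) = \frac{1}{\pi}\,\frac{\lambda^{\alpha-1}\sin(\pi\alpha)}{\lambda^{2\alpha} + 2\lambda^{\alpha}\cos(\pi\alpha) + 1}, \quad 0 < \alpha < 1. \tag{7.12}$$
+In the limit α→ 1 we have [117]
+$$\lim_{\alpha\to 1} p_\alpha(\lambda) = \delta(\lambda - 1), \tag{7.13}$$
+in agreement with $\lim_{\alpha\to 1} E_\alpha(-t^\alpha) = \exp(-t)$.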
+modeling incoherent neutron scattering In the following the dynamic struc-
+ture factor for incoherent neutron scattering will be considered,
+$$S(q,\omega) = \frac{1}{2\pi}\int_{-\infty}^{+\infty} dt\, \exp(-i\omega t)\, I(q,t), \tag{7.14}$$
+where I(q, t) is the incoherent intermediate scattering function, which depends on the position
+of the scattering atom
+I(q, t) = 〈exp(iq[x− x0])〉. (7.15)
+Here q = |q| is the modulus of the momentum transfer which the neutron transfers to the
+scattering atom in the scattering process. Within the model it is assumed that the system
+under consideration is isotropic and that, as made for EISFs, the protein dynamics, as seen
+in incoherent neutron scattering, can be described by one “representative” atom. In this
+case it suffices to consider one coordinate of the scattering atom, which is chosen to be the
+x-coordinate. In view of the predominance of incoherent scattering by hydrogen atoms, the
+representative atom in the model is a representative hydrogen atom.
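+Within the model the intermediate scattering function has the form
+$$I(q,t) = \exp(-q^2\langle x^2\rangle) \sum_{n=0}^{\infty} \frac{q^{2n}\langle x^2\rangle^n}{n!}\, E_\alpha(-[t/\tau_n]^\alpha), \quad 0 < \alpha \le 1, \tag{7.16}$$
+where $\tau_n$ is given by
+$$\tau_n = \tau\, n^{-1/\alpha}. \tag{7.17}$$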
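+The dynamic structure factor associated with the intermediate scattering function (7.16)
+reads
+$$S(q,\omega) = \exp(-q^2\langle x^2\rangle) \left\{ \delta(\omega) + \sum_{n=1}^{\infty} \frac{q^{2n}\langle x^2\rangle^n}{n!}\, \frac{1}{2\pi}\, L_{\alpha,\tau_n}(\omega) \right\}, \tag{7.18}$$
+where $L_{\alpha,\tau}(\cdot)$ is the generalized Lorentzian
+$$L_{\alpha,\tau}(\omega) = \frac{2\tau \sin(\alpha\pi/2)}{\omega\tau \left( (\omega\tau)^{\alpha} + 2\cos(\alpha\pi/2) + (\omega\tau)^{-\alpha} \right)}, \quad 0 < \alpha \le 1. \tag{7.19}$$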
+138 results
+fitting qens spectra The model introduced in previous paragraphs describes internal
+protein dynamics and to be useful for the interpretation of QENS spectra of protein solutions
+the effects of global diffusion and of finite instrumental resolution must be incorporated.
+Neglecting multiple scattering effects and absorption, and assuming that global diffusion of
+the IF6 molecules and internal motions are decoupled, one can write the measured dynamic
+structure factor as convolution product (defining $(f * g)(\omega) = \int_{-\infty}^{+\infty} d\omega'\, f(\omega - \omega')\, g(\omega')$):
+$$S_m(q,\omega) = (S * l * r)(\omega). \tag{7.20}$$
+Here S stands for the dynamic structure factor of the model, l is a Lorentzian describing
+translational diffusion (D is the diffusion constant),
+$$l(\omega) = \frac{1}{\pi}\,\frac{Dq^2}{(Dq^2)^2 + \omega^2} \tag{7.21}$$
+and r is the resolution function, which is well described by a Gaussian,
+$$r(\omega) = \frac{\exp\left(-\frac{\omega^2}{2\sigma^2}\right)}{\sqrt{2\pi}\,\sigma}, \tag{7.22}$$
+with σ > 0 and a half-width at half maximum (HWHM) of ∆E ≈ 1.17σ. Both r(.) and l(.) are
+normalized such that $\int_{-\infty}^{+\infty} d\omega\, r(\omega) = 1$ and $\int_{-\infty}^{+\infty} d\omega\, l(\omega) = 1$.
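+The convolution product (7.20) for the measured dynamic structure factor can be written
+in the following form, using for S the model (7.18),
+$$S_m(q,\omega) = \exp(-q^2\langle x^2\rangle) \left\{ (l * r)(\omega) + \sum_{n=1}^{\infty} \frac{q^{2n}\langle x^2\rangle^n}{n!}\, \frac{1}{2\pi}\, (L^{D}_{\alpha,\tau_n} * r)(\omega) \right\}. \tag{7.23}$$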
+Here $L^{D}_{\alpha,\tau_n}(\omega) = (L_{\alpha,\tau_n} * l)(\omega)$ is the convolution of a generalized Lorentzian with a normal
+Lorentzian, for which an analytical form can be given. Defining
+$$\tilde{\omega} = \sqrt{\omega^2 + (Dq^2)^2}, \quad \phi = \arg(Dq^2 + i\omega), \tag{7.24}$$
+one obtains [112]
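+$$L^{D}_{\alpha,\tau}(\omega) = \frac{2}{\tilde{\omega}}\, \frac{(\tilde{\omega}\tau)^{\alpha}\cos\phi + \cos([\alpha - 1]\phi)}{(\tilde{\omega}\tau)^{\alpha} + 2\cos(\alpha\phi) + (\tilde{\omega}\tau)^{-\alpha}}. \tag{7.25}$$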
+7.2.3 Analysis of scattering functions obtained from MD simulations
+The “natural” quantities for the analysis of MD simulations are time-dependent MSDs and
+time correlation functions, such as the intermediate scattering functions (ISF), which can be
+directly computed from the trajectories. In this thesis, the MD analysis package nMoldyn
+7.2 effects of pressure and temperature on if6s dynamics 139
+was used for this purpose [166]. All global motions (translation and rotation) were filtered
+out beforehand from all trajectories in order to avoid the presence of unwanted spurious
+contributions in the calculation of correlation functions. The procedure used to accomplish
+this task is well established and has already been explained in [115]. ISFs from aIF6 and eIF6
+for four different values of momentum transfer are shown in Figures 53 and 54 for different
+environmental conditions.
+The related time-dependent tMSD is shown in Figure 52. Data were fitted with the fOU model
+as explained in the previous section. Values for 〈x2〉 in 7.9 were fixed from direct calculation
+on MD simulations. The results of fits together with calculation of atomic 〈x2〉 are reported
+in Table 19.
+Table 19: Parameters of the fOU model from fits on eIF6 and aIF6.
+aIF6 〈x2〉 α τ eIF6 〈x2〉 α τ
+[nm2] [nm2] [ps] [nm2] [nm2] [ps]
+300K 1bar 2.84 · 10−3 0.42 115 4.13 · 10−3 0.46 225
+300K 500bar 2.96 · 10−3 0.36 198 3.88 · 10−3 0.47 168
+350K 1bar 4.32 · 10−3 0.40 114 6.56 · 10−3 0.56 143
+350K 500bar 4.46 · 10−3 0.42 142 5.36 · 10−3 0.49 168
+Inspection by eye of tMSD plots reveals that eIF6 at 300K as well as aIF6 at 350K are quite
+insensitive to pressure whereas they undergo a much more evident change at the non-natural
+temperatures. Moreover, at high temperature eIF6 shows large variations due to pressure.
+The fitted ISFs from both samples are shown in Figures 53 and 54. Here, the ISFs of eIF6 and
+aIF6 do not change appreciably with pressure when the temperature is kept at 300K and 350K,
+respectively, whereas significant variations occurred at different temperatures.
+Again also the observations made on tMSD and ISF seem to confirm the presence of
+corresponding states between the dynamical properties of the two IF6 homologues in their
+natural conditions and defined by apparent similar responses to environmental changes.
+Nevertheless, it is worth noting that here the presence of this correspondence is not found
+through similar values of these quantities but by means of homologous variations in function
+of thermodynamical variables. A further and more complete analysis of dynamical properties
+140 results
+aIF6 300K 1bar
+0.035
+aIF6 300K 500bar
+aIF6 350K 1bar
+0.03 aIF6 350K 500bar
+eIF6(1-224) 300K 1bar
+eIF6(1-224) 300K 500bar
+0.025
+eIF6(1-224) 350K 1bar
+eIF6(1-224) 350K 500bar
+0.02
+0.015
+0.01
+0.005
+0
+0 50 100 150 200
+time [ps]
+Figure 52: Comparison of time-dependent mean square displacement of aIF6 and eIF6.
+can be obtained by means of fractional Brownian dynamics model. As explained in the
+previous section, parameters α and τ given in the fOU model, define the heterogeneity of
+relaxation dynamics and are valuable tools to characterize the internal motions in proteins.
+Values of these two parameters obtained from fit with the fOU model of ISF are plotted as
+a function of momentum transfer in Figures 55 and 56. Surprisingly, the fitted parameters
+show several differences between aIF6 and eIF6:
+- τ in eIF6 is generally larger than in aIF6 by a factor of 3, meaning that its internal
+dynamics is characterized by slower motions. Moreover, its variation as function of
+pressure is of opposite sign with respect to the one in the extremophile homologue.
+- α in aIF6, although similar to the one obtained in eIF6, is systematically larger
+than the latter. Following the definition of α and expression 7.12 this could mean that
+the two homologues are characterized by different distributions of relaxation rates.
+The partial discrepancies between the values of {α, τ} from tMSDs and those from ISFs
+could be explained from the fact that tMSDs suffer much more than ISFs from the limited
+time-length of MD trajectories which do not permit a good sampling to be achieved for
+time-correlation functions.
+A key point here is the understanding of which of differences found in {α, τ} are related
+intrinsically to the differences between the two proteins and which can be taken as a possible
+MSD 
+7.2 effects of pressure and temperature on if6s dynamics 141
+1 300K 1bar 1 300K 1bar
+300K 500bar 300K 500bar
+350K 1bar 350K 1bar
+0.95
+350K 500bar 350K 500bar
+0.98
+0.9
+-1
+qel=4nm
+-1
+qel=10nm
+0.85
+0.96
+0.8
+0.94 0.75
+0.7
+0.92
+0 50 100 150 200
+0 50 100 150 200
+time [ps] time [ps]
+1 300K 1bar 1 300K 1bar
+300K 500bar 300K 500bar
+350K 1bar 350K 1bar
+0.9 350K 500bar 0.9 350K 500bar
+0.8
+0.8 -1 -1
+qel=16nm qel=18nm
+0.7
+0.7
+0.6
+0.6
+0.5
+0.5
+0.4
+0 50 100 150 200 0 50 100 150 200
+time [ps] time [ps]
+Figure 53: Intermediate Scattering Function from MD simulation on aIF6 at different q-values:
+4, 10, 16, 18nm−1.
+F(q,t) [a.u.]
+F(q,t) [a.u.]
+F(q,t) [a.u.]
+F(q,t) [a.u.]
+142 results
+1 300K 1bar 1 300K 1bar
+300K 500bar 300K 500bar
+350K 1bar 350K 1bar
+350K 500bar 350K 500bar
+0.98
+0.9
+-1
+q =4nm -1
+0.96 el qel=10nm
+0.8
+0.94
+0.7
+0.92
+0.6
+0.9
+0 50 100 150 200 0 50 100 150 200
+time [ps] time [ps]
+1 300K 1bar 1 300K 1bar
+300K 500bar 300K 500bar
+350K 1bar 350K 1bar
+0.9 0.9
+350K 500bar 350K 500bar
+0.8
+0.8
+-1 -1
+q =16nm qel 0.7 el
+=18nm
+0.7
+0.6
+0.6
+0.5
+0.5
+0.4
+0.4
+0.3
+0 50 100 150 200 0 50 100 150 200
+time [ps] time [ps]
+Figure 54: Intermediate Scattering Function from MD simulation on eIF6 at different q-values:
+4, 10, 16, 18nm−1.
+F(q,t) [a.u.] F(q,t) [a.u.]
+F(q,t) [a.u.] F(q,t) [a.u.]
+7.2 effects of pressure and temperature on if6s dynamics 143
+300K 1bar
+70
+300K 500bar
+60 350K 1bar
+350K 500bar
+τ 50
+40
+30
+20
+4 6 8 10 12 14 16 18
+0.58
+0.56
+0.54
+0.52
+α
+0.5
+0.48
+0.46
+4 6 8 10 12 14 16 18
+-1
+q [nm ]
+Figure 55: Parameters for the fOU model obtained from fits on intermediate structure factors of eIF6.
+35
+300K 1bar
+30
+300K 500bar
+25 350K 1bar
+350K 500bar
+τ 20
+15
+10
+5
+0
+0.64 4 6 8 10 12 14 16 18
+0.62
+0.6
+α 0.58
+0.56
+0.54
+0.52
+4 6 8 10 12 14 16 18
+-1
+q [nm ]
+Figure 56: Parameters for the fOU model obtained from fits on intermediate structure factors of aIF6.
+144 results
+"signature" of adaptation. As will be explained later in this chapter the sign of variations
+with respect to temperature and pressure should be related to peculiar properties of each
+homologue and more generally of each protein, whereas other qualities of these variations,
+such as their length scale dependency, could be related to evolutionary molecular adaptation.
+The analysis of EISF was very useful for finding the corresponding states but it does
+not show how dynamical properties of proteins are modified moving from unfavorable
+conditions to physiological ones. The absolute value of parameter τ which characterizes
+relaxation time as function of momentum-transfer, thus as function of length-scale, was
+shown to be a useful tool to identify differences between eIF6 and aIF6. Interestingly,
+comparing the value of τ of each protein in different environmental conditions to those
+in natural conditions, one finds that in both samples, τ variations are q-dependent and
+that their extension is related to the quality of extremeness of the particular environmental
+condition. This comparison can be made normalizing values of τ to values at natural
+conditions as shown in Figures 57 and 58. From these figures one can easily note that
+variations in τ become non-uniform as external conditions move too far from the natural
+(optimal) ones and they mainly involve the region corresponding to small momentum transfer.
+7.3 comparison with qens measurements
+In the QENS experiments performed for this thesis work a number of technical difficulties
+were encountered which severely limited the amount and the quality of data. Hence, only
+a purely qualitative comparison with MD was possible. The main problems related to
+experimental measurements were due to the lack of previous knowledge of the chemical
+properties of IF6 samples:
+eIF6 turned out to have a very low stability in the experimental setups developed for this
+work. Indeed, in high pressure experiments after some hours of measurements the
+protein started to aggregate and very few spectra were reliable for analysis. Probably
+this was due to variations in protein concentration caused by pressure application and
+the coexistence of CTAIL and the poly-histidine tag which could interfere with protein
+stability.
+The evaluation of protein concentration in solution was made very difficult by the very
+low quantity of chromophore amino acids which resulted in low UV absorption. As
+7.3 comparison with qens measurements 145
+1.6
+1.5
+1.4
+300K-500bar
+350K-1bar
+1.3
+350K-500bar
+1.2
+4 6 8 10 12 14 16 18
+-1
+q [nm ]
+Figure 57: Values of τ from fit of eIF6 normalized to value at 300K and 1bar.
+300K-1bar
+1.5 300K-500bar
+350K-1bar
+1.4
+1.3
+1.2
+1.1
+1
+0.9
+4 6 8 10 12 14 16 18
+-1
+q [nm ]
+Figure 58: Values of τ from fit of aIF6 normalized to value at 350K and 500bar.
+τ/τ350K-500bar τ/τ300K-1bar
+146 results
+a consequence, the absorption at 280nm, usually measured to estimate the protein
+concentration gave systematic errors greater than 10%.
+In addition to these limitations, one should recall also the other results found on eIF6 stability
+and reported in Chapter 3. For this reason, QENS spectra of eIF6 will not be shown here.
+Some preliminary analysis of spectra from aIF6 was, however, still possible and will be used
+here to support some of the observations made by means of MD simulations.
+7.3.1 Ambient pressure measurements
+Measurements at ambient pressure were performed on the spectrometer FOCUS (Paul
+Scherrer Institut, Switzerland) as explained in the Chapter 3. Spectra for the empty sample
+container, solvent and protein solutions were acquired. The experimental spectra were treated
+as mentioned in Chapter 3. The following procedure was used to estimate the sample
+container transmission in the presence of samples: i) firstly, the empty cell spectra were fitted
+with a normalized Gaussian function:
+$$G(\omega;\omega_0,\sigma) = \frac{\exp\left(-\frac{(\omega - \omega_0)^2}{2\sigma^2}\right)}{\sqrt{2\pi}\,\sigma} \tag{7.26}$$
+ii) secondly the Gaussian function with parameters {ω0,σ} fixed from the previous fit on
+empty cell was used to estimate the contribution of the sample container in solvent spectra
+which were fitted by the following expression:
+Ssolvent(q,ω) = A (τ G(ω;ω0,σ) + (1− τ)SB(q,ω)) (7.27)
+where A is a normalization factor and
+∑2 1 Γ2
+SB(q,ω) = i , (7.28)
+π (Γ )2 2i +ω
+i
+The expression for SB(q,ω) is intended to describe global translation and rotation of
+solvent molecules. In order to limit the systematic errors due to the technical constraints listed
+above, the resulting spectra containing the contribution of the sample container, the solvent
+and the protein itself, were fitted with the fractional Brownian Dynamics model following the
+expression:
+$$S_{mes}(q,\omega) = C\left( \alpha \left( (1 - \tau')\, \tilde{S}_P(q,\omega) + \tau'\, \tilde{S}_E(q,\omega) \right) + (1 - \alpha)\, \tilde{S}_B(q,\omega;\Gamma_1,\Gamma_2) \right) \tag{7.29}$$
+where S˜P(q,ω) was defined by expression 7.23, S˜B(q,ω; Γ1, Γ2) was obtained from previous
+fit and S˜E(q,ω) is the spectrum from the empty sample container. Here, S˜ represents
+7.3 comparison with qens measurements 147
+experimental spectra convoluted with instrumental energy resolution as estimated from
+vanadium spectra performed with the same setup of the other measurements.
+300K exp
+300K fOU ﬁt
+353K exp
+0.001 353K fOU ﬁt
+q= 17 nm-1
+0.0001
+0.01 0.1 1
+ω [meV]
+Figure 59: Log–log plot of aIF6 experimental QENS spectra for q = 17 nm−1 at 300K (hollow squares)
+and 353K (filled triangles) as a function of neutron energy gain ω. Lines represent the fits
+of the fOU model defined in the text.
+Data were fitted in the range [−1.5 : 0.1]meV . The EISF obtained from this fit is shown
+in Figure 60 together with the EISFs obtained from MD simulations. Experimental data
+seem to agree very well with those obtained from MD simulation. The diffusion constant
+estimated from 7.23 is given in Figure 61 as a function of momentum transfer. The values can
+be compared with those given by direct calculation from the IF6 molecular dimensions. Here
+it is worth noting that the spherical approximation for the usual Einstein-Stokes expression
+of the translation diffusion constant would not fit very well in the case of IF6 as the protein
+shape can be better approximated by a disk or by a torus. These corrections to the spherical
+case can be performed by means of the Perrin factor and the explicit expression for torus
+diffusion constant (Appendix B). The values obtained from aIF6 were calculated using the
+volume associated to the solvent accessible surface and are given in Table 20. In the Perrin
+factor approximation the dimensions of the disk-shape which describes the IF6 structure were
+estimated by an orthorhombic box which included the whole molecular structure. Experimental
+values have to be corrected with respect to the viscosity of D2O which is 20% higher than that
+S(q,ω) [a.u.]
+148 results
+of H2O. Hence taking into account this correction, values shown in Figure 61 are included
+between the Perrin and the torus approximations.
+Table 20: Perrin correction to spherical diffusion constant obtained from bounding box and solvent
+accessible surface volume.
+Temp&Press axis a axis b Solv. Vol Stokes-Einstein D Perrin D torus
+[Å] [Å] [103Å3] [10−3Å2/ps] [10−3Å2/ps] [10−3Å2/ps]
+300K-1bar 33.6 48.0 41.36 11.50 12.39 34.66
+350K-1bar 34.2 46.3 40.99 34.23 36.64 95.34
+1 300K ﬁt fOU
+300K MD
+353K ﬁt fOU
+0.8 353K MD
+0.6
+0.4
+0.2
+0
+0 0.2 0.4 0.6 0.8 1 1.2 1.4 1.6 1.8
+q [Å-1]
+Figure 60: EISF from QENS measurements at ambient pressure and MD simulation of aIF6.
+The values of α and τ parameters of the fOU model estimated from the fit of experimental
+QENS spectra at 300K and 350K are plotted in Figure 62. Interestingly, the values for parameter
+α are still coherent with those found from MD simulations whereas the values for τ are very
+different. The discrepancy in the evaluation of τ could be related to the limited energy range
+EISF
+7.3 comparison with qens measurements 149
+0.055
+300K
+353K
+0.05
+0.045
+0.04
+0.035
+0.03
+0.025
+0.02
+0.4 0.6 0.8 1 1.2 1.4 1.6 1.8
+q [Å-1]
+Figure 61: Diffusion coefficient as function of momentum transfer obtained from fractional Ornstein-
+Uhlenbeck from QENS measurements at ambient pressure.
+used to perform this fit which was smaller than the one accessed by the time-correlation
+functions calculated from MD trajectories.
+1
+0.9 300K
+α 0.8 350K
+0.7
+0.6
+0.5
+0.4
+0.3
+4 0.4 0.6 0.8 1 1.2 1.4 1.6 1.8
+3
+τ 2
+1
+0
+0.4 0.6 0.8 1 1.2 1.4 1.6 1.8
+q [Å-1]
+Figure 62: Parameters for the fractional Ornstein-Uhlenbeck process obtained from fits to QENS
+measurements at ambient pressure.
+Diffusion Coefﬁcient [Å2/ps]
+150 results
+7.3.2 High pressure measurements
+As mentioned in the chapter on experimental and simulated systems setups, all the QENS
+measurements performed in the pressure cell system required large volumes of protein
+solution. This was a limiting factor for the cleavage of the poly-histidine tag (HTag) used to
+enhance the expression protocol yield. For this reason, high pressure measurements were
+performed with aIF6 with HTag (aIF6-HTag). Also for these measurements the knowledge of
+precise protein concentration in sample solution would be essential for the correct analysis of
+spectra. As a consequence, a correct treatment for the analysis of quasi-elastic spectra was
+not possible. Nonetheless, acquired spectra were used to estimate EISF from aIF6-Htag with
+a qualitative approach which was however useful to partially support the observations made
+by MD simulations.
+Spectra from empty cell, solvent and protein solution were taken and the same procedure for
+the estimation of sample container transmission used for ambient pressure measurements
+was used here.
+The empty cell contribution was subtracted from solvent and protein solution spectra with a
+transmission τ = 0.90. EISF from aIF6-Htag was estimated directly from the protein solution
+spectra from the expression:
+Ssolution(q,ω) = B (β G(ω;ω0,σ) + (1−β)L(q,ω)) (7.30)
+where L(q,ω) accounts for IF6 global and internal motions as well as for solvent
+quasi-elastic contribution and G(ω;ω0,σ) is a Gaussian function which should estimate the
+EISF from aIF6-HTag. The normalized fitted EISFs at different temperatures and pressures
+are shown in Figure 63. The MD simulation of aIF6-HTag was performed in order to compare
+experimental data. After filtering out the global motions as the other MD simulations,
+the scattering functions were calculated using the nMoldyn package. The EISFs from MD
+simulation are plotted together with experimental ones in Figure 63. Experimental results
+seem to underestimate EISF with respect to MD but the variation due to pressure and
+temperature are qualitatively similar. Here, it is worth noting that in general MD simulations
+tend to overestimate EISF due to the limited time length of trajectories which is far from being
+sufficiently large to correctly evaluate this quantity. From the experimental point of view,
+however, the EISF could be susceptible to systematic errors due to an incorrect subtraction
+of the sample container. Indeed, the latter could give a different contribution from the one
+7.4 discussion and conclusion 151
+estimated from solvent spectra due to the absorption of protein sample and it could cause an
+underestimation of EISF values.
+300K 500bar IN6
+300K 250bar IN6
+1 350K 500bar IN6
+350K 250bar IN6
+300K 250bar MD
+300K 500bar MD
+0.8 350K 500bar MD300K 1bar IN6
+300K 1bar MD
+0.6
+0.4
+0.2
+00 0.2 0.4 0.6 0.8 1 1.2 1.4 1.6 1.8 2
+q [A-1]
+Figure 63: Comparison EISF from IN6 measurements and MD simulation of aIF6-HTag
+7.4 discussion and conclusion
+The effects of pressure and temperature on IF6s have been characterized here from both
+a structural and a dynamical point of view. Each approach gave different insights
+into the response of IF6s to environmental changes: i) global structural responses were
+investigated by means of radius of gyration and SASA whereas local effects were studied
+by RMSF analysis combined with ScrewFit profiles. The latter, besides giving significant
+insights into the conformational changes induced by pressure and temperature, allowed
+to assess secondary structure fluctuations induced by the same thermodynamic variables;
+ii) dynamical responses were instead investigated by means of scattering functions which
+allowed direct comparison between MD simulations and QENS experiments.
+EISF
+152 results
+For the discussion of results shown in the previous sections, it is important to underline
+the role of the definition of extreme conditions: in contrast to what it is commonly thought,
+the conditions that request a significant re-adaptation of protein structures are not only
+those which have unfavorable chemical and thermodynamical conditions in the general
+sense. In fact, as already stated in the Introduction, some proteins seem to behave better at
+their own natural conditions than in other environmental situations, even though the former
+are, in principle, chemically and physically less favorable than the latter. This observation
+is supported by works on enzyme activity which seemed to maintain corresponding states
+between different environmental conditions that required evolutionary adaptation. These
+states are usually characterized by similar conformational flexibility [92].
+structure As a whole the effects of pressure and temperature on IF6 structures showed
+that the anti-association factor 6 from Methanococcus jannaschii (aIF6) is much less sensitive
+than its mesophilic counterpart from Saccharomyces cerevisiae (eIF6) with respect to extreme
+conditions, as shown by variation in solvent accessible surface and in atomic root mean
+square fluctuations. In particular it was also found that its structural properties at high
+temperature and high pressure were very similar to those of eIF6 at 300K-1bar. This response
+is characterized by fluctuations of α-carbons in the protein backbone and by variations in
+secondary structures.
+Here, the presence of corresponding states was made evident from observations on structural
+fluctuations and by the comparison of different EISFs which proved by its relation to the
+mean square displacement that this process is linked to the change on spatial confinement of
+protein internal motions. The same type of results were obtained by Tehei and coworkers
+[191, 192] in the comparison of molecular dynamics in thermophilic and mesophilic proteins.
+As a whole, these results suggest that corresponding states are created by local structural
+re-arrangements that influence atomic motions in proteins. For this purpose, evolution plays
+on sequence point mutations to give the right adjustment of intramolecular interactions and
+thus obtain the desired effect on protein structure stability.
+Comparison between the EISFs of eIF6 and aIF6 gave the evidence that MSDs are very
+similar in the respective natural conditions. The comparison of these results with those
+previously obtained on the EISF from lysozyme [20] at ambient pressure (Figure 64), shows a
+7.4 discussion and conclusion 153
+surprising correspondence suggesting the presence of a condition for optimal "resilience" of
+protein structures.
+1
+lysozyme 300K 1atm
+eIF6(1-224) 300K 1bar
+aIF6 350K 500bar
+0.8
+0.6
+0.4
+0.2
+0
+0 20 40 60 80 100
+q [nm-1]
+Figure 64: Elastic Incoherent Structure Factor for aIF6, eIF6 and lysozyme.
+In IF6’s protein family this condition seems to be achieved thanks to a tail of 21 amino
+acids (CTAIL) attached to the C-terminus of the more evolutionarily conserved part of IF6,
+because its presence was the source of the lower stability of eIF6 in extreme conditions,
+whereas its absence made eIF6-NoCTAIL behave like aIF6. Moreover, the role of CTAIL is
+made even more important by the fact that it induces large thermal fluctuations to structural
+regions which are supposed to play a direct role in IF6 functions.
+Interestingly, similar results have been obtained on EISFs from aIF6-HTag indicating that
+even the presence of a fluctuating non-structured tail attached on the N-terminus of aIF6
+could make the latter not suited for warm deep sea environments.
+The application of the ScrewFit method to time-averaged structures allowed also some
+local effects of pressure and temperature to be detected and characterized by comparison
+with three-dimensional structures. The main outcome of this analysis revealed that pressure
+EISF
+154 results
+and temperature have locally different effects on IF6 structures. Some of these effects were
+enhanced by separate application of high pressure and high temperature, whereas they
+disappeared when both conditions were applied simultaneously.
+dynamics The investigation of the dynamical effects refined the structural results.
+Scattering functions from the MD simulations of both aIF6 and eIF6 were analyzed by means
+of fractional Brownian dynamics (fOU) model. The latter was proved in other works to be
+able to finely characterize the multiple relaxation time dynamics of proteins.
+The fOU model showed that aIF6 and eIF6 can be distinguished from each other by their
+dynamical properties. In particular it was shown that they have different characteristic
+q-dependent relaxation times and give different responses to pressure application. Indeed,
+when pressure is applied one would expect that slower diffusive motions on large length
+scales are slowed down since they require large scale spatial rearrangements which are
+increasingly hindered under pressure. Parameter τ from fit of aIF6 seems to confirm this
+behaviour whereas it does not for eIF6 in which it is lowered by pressure increase. This fact
+could be explained by the possible denaturation of eIF6, which has already been observed in
+real experiments and that could be visible already in the nanosecond time-scale.
+This outcome suggests that fOU parameters are able to capture dynamical properties of
+each protein, being able to pinpoint differences between two homologues of the same protein
+family. Moreover, it seems evident that if corresponding states can be found from the atomic
+MSD, the fOU model can characterize how unfavorable environmental conditions differ
+from the physiological one by means of the dynamical parameters.
+Indeed, if the variation of dynamical properties due to changes in pressure and temperature
+must be related to each protein's characteristics, the general framework in which this variation
+happens can somehow be a common property of protein families. In this context comparison
+of relaxation times in different environmental conditions showed that the approaching
+of a favorable environment corresponds to a non-uniform change in relaxation times.
+In particular motions involving large domains are less influenced than more localized motions.
+7.4 discussion and conclusion 155
+The limited amount and quality of experimental data did not permit complete verification of
+this hypothesis made by means of MD simulations. QENS experiments have, however, shown
+consistency with MD results. In particular, the EISF and the translational diffusion constant found
+by experiment at ambient pressure were comparable with those estimated by MD
+simulations. High pressure experiments were largely biased by technical problems and could
+not give any quantitative result. Nevertheless, a qualitative comparison with MD simulation
+was possible by estimating the EISF contribution from the protein solution spectra.
+
+8
+GENERAL CONCLUSIONS AND PERSPECTIVES
+In the introduction it was stated that this work was proposed to give an answer to the following
+questions:
+Where does the extremophilic signature come from?
+If structure cannot be the origin for this, can it be the dynamics?
+The test case for this search for an extremophilic signature was found in the structural
+and dynamical properties of the Initiation Factor 6 from Methanococcus Jannaschii, an
+archaebacterium which lives in the warm deep sea, near the hydrothermal chimneys. This
+protein was chosen for its important role in the synthesis of other proteins, through its
+participation in the biogenesis of major ribosome subunits and the limitation of association
+of the two subunits.
+The IF6 homologue from Saccharomyces cerevisiae was chosen as the "normal" counterpart for a
+detailed comparison. The approach used in this work, which combined MD simulations and
+QENS experiments, presented several new aspects to both techniques that required the
+development of novel theoretical and experimental methods. Firstly, a new computational
+method was needed to finely pinpoint even small changes in protein structures induced by
+environmental changes. For this purpose, a method based on quaternion superposition fits
+in conjunction with Chasles’ theorem on rigid body motions was developed. This method,
+called ScrewFit, proved to be efficient in finding variations in secondary structure of proteins
+and in characterizing them with respect to the deformations in protein structural motifs. The
+method found also further developments in protein secondary structure assignments and in
+finding the structural effects due to ligand binding in enzymes.
+Secondly, the two IF6 homologues were entirely new samples for QENS experiments and
+demanded new protocols for expression and purification in order to obtain adequate
+sample concentration in final solutions. The developed protocol reported here had a
+yield sufficient for neutron scattering measurements of protein solution. Nevertheless,
+it also involved other technical complications due to the presence of an N-terminal poly-
+histidine tag which was needed to improve the total yield of protein purification. The
+157
+158 general conclusions and perspectives
+cleavage of the supplemental histidine-tag in large volumes needed for high pressure mea-
+surements is prohibitive due to its efficiency, the latter being inversely proportional to volume.
+The major results of this work are related to the finding of "corresponding states" in
+structure and dynamics of each homologue in its respective natural condition. These "states"
+are characterized by very similar atomic mean square displacements, meaning that the
+atomic internal motions in respective natural conditions are confined to the same length
+scales. This type of correspondence was already found in other works on other proteins both
+experimentally [192] and by MD simulations[69]. These results were formerly interpreted as
+an indication of different "resiliences" of extremophile and mesophile proteins. In this work I
+showed that even if corresponding states are found, they do not involve the same dynamical
+behavior in extremophilic and mesophilic homologues. Nevertheless, the variation of charac-
+teristic time as function of length-scale seems to be able to capture the optimality of conditions.
+Throughout this thesis the dynamical characterization of IF6 samples modeled by MD
+simulations was pursued using a fractional Brownian dynamics model which proved to
+efficiently characterize the multi-time-scale heterogeneity in protein internal motions.
+Besides the general discussion about "corresponding states", this work showed also that in
+the case of IF6, pressure and temperature induce different local effects in protein structures.
+Some of these effects seem to affect regions that probably host functionality of IF6s. The
+structural analysis by means of ScrewFit parameter profiles showed that pressure and temper-
+ature effects are neither equivalent nor of opposite sign. They are qualitatively different. The
+present knowledge of these effects does not permit the association of the latter to the global
+effects inscribed into the formation of "corresponding states".
+The experimental results, which were very limited by the absence of adequate protocols and
+previously unknown sample instability, could nevertheless indirectly support the results obtained
+from MD simulations.
+perspectives This work proposed a new approach to the investigation of evolutionary
+adaptation of proteins to extreme environments from both a structural and a dynamical
+point of view. Nevertheless, its novelty had to face some experimental limitations. This
+did not prevent experimental results being obtained which supported the MD simulations.
+159
+Nevertheless, the results shown here should be verified by MD simulations also for longer
+time-scales in order to better explore dynamical properties of IF6s. In this context, some
+neutron backscattering experiments, which access longer time-scales, have already been
+performed during this thesis on the IN16 (Institut Laue Langevin, Grenoble, France) and
+HFBS (NIST, Gaithersburg, USA) spectrometers.
+As a whole, this work must be considered preliminary and requires further development
+both in expression/purification protocols of samples and in technical instrumentation for
+QENS experiments. In fact, the latter may become a limiting factor when performing mea-
+surements on protein solutions which require stable samples even at very high concentrations.
+This thesis suggested, however, that IF6 constitutes a very interesting sample for studies
+on molecular evolution and it is worth being further investigated both by QENS and
+other molecular spectroscopy techniques. In particular small angle scattering (X-ray and
+neutrons) should be envisaged to obtain more insights into the structural effects of different
+environmental conditions and the role of CTAIL in eIF6 stability.
+In addition to its role in molecular evolution studies, IF6 dynamical properties could be
+explored by neutron scattering also in relation to its recently uncovered role in regulating the
+human tumor cell development[172].
+Finally this work constitutes a new approach for investigating molecular evolution. Sim-
+ilar approaches have been recently used to investigate the relation between other physical
+properties of proteins and their evolutionary history[215].
+
+Part III
+APPENDIX
+
+A
+BUFFERS USED FOR PROTEIN EXPRESSION AND PURIFICATION
+Table 21: Buffers used for cell lysis and protein purification
+Lysis buffer 50mM Tris-HCl pH 7.4
+200mM NaCl
+5% Glycerol
+1mM PMSF
+Wash buffer 50mM Tris-HCl pH 7.4
+1M NaCl
+5% Glycerol
+1mM β-mercaptoethanol
+Elution buffer 50mM Tris-HCl pH7.4
+200mM NaCl
+5% Glycerol
+200mM Imidazole
+1mM β-mercaptoethanol
+163
+164 buffers used for protein expression and purification
+Table 22: Buffers for dialysis and storage
+Dialysis buffer 20mM Tris pH 7.9
+200mM NaCl
+5mM DTT
+Storage buffer 50mM Tris-HCl pH 7.4
+200mM NaCl
+5% glycerol
+5mM DTT
+B
+CORRECTIONS TO THE STOKES’ LAW FOR SPHERE DIFFUSION.
+perrin friction factors The Perrin factor is a correction to the translational friction in
+the case of a rigid spheroid characterized by an axial ratio σ = a/b where a and b are the
+axial and the equatorial semiaxis, respectively. For σ > 1 one has stick-shaped bodies and for
+σ < 1 disc-shaped bodies.
+The Perrin factor is defined through a multiplicative correction term to the friction coefficient
+of a sphere:
+$$ f_{cor} = f'_{sphere} \cdot f_P \qquad \text{(B.1)} $$
+$f'_{sphere}$ is the friction constant obtained for a sphere of equivalent volume of the spheroid
+body.
+The factor fP is defined by
+$$ f_P = \frac{2\sigma^{2/3}}{S} \qquad \text{(B.2)} $$
+where,
+$$ \sigma = \frac{a}{b} $$
+$$ S = 2 \cdot \frac{\arctan\left( \frac{\sqrt{|\sigma^2 - 1|}}{\sigma} \right)}{\frac{\sqrt{|\sigma^2 - 1|}}{\sigma}} $$
+Hence, the diffusion constant for a spheroid reads as follows:
+$$ D_{sp} = \frac{K_B T}{f'_{sphere}} \cdot \frac{S}{2\sigma^{2/3}} $$
+diffusion constant for a torus The derivation of the translational diffusion
+constant for a torus can be found in [193]. Assuming rotational and translational diffusion as
+decoupled, one obtains for the translational part:
+$$ D_{sp} = \frac{K_B T}{8\pi\mu a} \cdot \left( \log\left( \frac{8a}{b} \right) + \frac{1}{2} \right) $$
+where a and b are defined in Figure 65. µ is the viscosity.
+165
+166 corrections to the stokes’ law for sphere diffusion.
+Figure 65: Local coordinates of a Torus reprinted from reference [193]
+torus correction To perform the correction due to the toroidal shape of the protein I
+estimated the values of a and b defined as in Figure 65. The inner and outer radius are
+calculated averaging over the distance of α-carbons respectively in the residues flanking the
+central hollow and in the five opposite sides of the pentameric pseudo-symmetry.
+The values shown in the text were obtained using the following viscosities (disregarding
+the differences between heavy and light water):
+Table 23: Viscosity of water and heavy water as a function of temperature.
+Temp µH2O µD2O µD2O/µH2O
+Kelvin [10−3Pa · s] [10−3Pa · s]
+300 0.89 1.11 1.25
+350 0.35 0.45 1.29
+BIBLIOGRAPHY
+[1] F. Abe and K. Horikoshi. The biotechnological potential of piezophiles. Trends Biotechnol.,
+19(3):102–108, 2001. (Cité aux pages xviii et 20.)
+[2] M Abramowitz and IA Stegun. Handbook of Mathematical Functions. Dover Publications,
+1972. (Cité à page 136.)
+[3] MP Allen and DJ Tildesley. Computer Simulation of Liquids. 1987. (Cité aux pages xxi
+et 37.)
+[4] S.L. Altmann. Rotations, Quaternions, and Double Groups. Clarendon Press, Oxford, 1986.
+(Cité aux pages xxx, 73 et 97.)
+[5] CAF Andersen, AG Palmer, S Brunak, and B Rost. Continuum secondary structure
+captures protein flexibility. Structure, 10:175–184, 2002. (Cité aux pages 94, 100, 107
+et 108.)
+[6] A Balbo and S. Bozzaro. Cloning of dictyostelium eif6 (p27bbp) and mapping its
+nucle(ol)ar localization subdomains. Eur J Cell Biol, 85(9-10):1069–78, Sep 2006. doi:
+10.1016/j.ejcb.2006.05.010. (Cité aux pages xxiii, 25, 52 et 61.)
+[7] R.L. Baldwin. Temperature dependence of the hydrophobic interaction in protein
+folding. Proc Natl Acad Sci USA, 83(21):8069–72, 1986. (Cité à page 12.)
+[8] R.D. Ballard. Notes on a major oceanographic find. Oceanus, 20:35–40, 1977. (Cité à
+page 19.)
+[9] D.J. Barlow and J.M. Thornton. Helix geometry in proteins. J. Mol. Biol., 201:601–619,
+1988. (Cité aux pages 72, 80, 82, 83, 94 et 113.)
+[10] U Basu, K Si, J R Warner, and U Maitra. The saccharomyces cerevisiae TIF6 gene encoding
+translation initiation factor 6 is required for 60S ribosomal subunit biogenesis. Molecular
+and Cellular Biology, 75(5):1453–1462, 2001. (Cité aux pages xx et 25.)
+[11] U Basu, K Si, H Deng, and U Maitra. Phosphorylation of mammalian eukaryotic transla-
+tion initiation factor 6 and its saccharomyces cerevisiae homologue tif6p: Evidence that
+167
+168 bibliography
+phosphorylation of tif6p regulates its nucleocytoplasmic distribution and is required
+for yeast cell growth. Molecular and Cellular Biology, 23(17):6187–6199, 2003. (Cité aux
+pages 25 et 124.)
+[12] O. M. Becker, A. D. Jr. MacKerell, B. Roux, and M. Watanabe, editors. Computational
+Biochemistry and Biophysics. CRC Press, 2001. (Cité à page 62.)
+[13] M Bée. Quasielastic Neutron Scattering: Principles and Applications in Solid State Chemistry,
+Biology and Materials Science. 1988. (Cité aux pages xxi, 38 et 134.)
+[14] H.J.C. Berendsen, J.P.M. Postma, W.F. van Gunsteren, A. DiNola, and J.R. Haak. Molec-
+ular dynamics with coupling to an external bath. J. Chem. Phys., 81(8):3684–3690, 1984.
+(Cité aux pages xxvi et 36.)
+[15] J.P. Boon and S. Yip. Molecular Hydrodynamics. McGraw Hill, 1980. See eqs. (3.5.23),
+(3.5.33), (3.5.37) and the corresponding references. (Cité à page 129.)
+[16] J.F. Brandts, R.J. Oliveira, and C. Westort. Thermodynamics of protein denaturation.
+effect of pressure on the denaturation of ribonuclease a. Biochemistry, 9:1038–47, 1970.
+(Cité à page 10.)
+[17] P.W. Bridgman. The coagulation of albumen by pressure. J. Biol. Chem., 19:511–512,
+1914. (Cité à page 8.)
+[18] CJ Bult, O White, GJ Olsen, LX Zhou, RD Fleischmann, GG Sutton, JA Blake, LM FitzGer-
+ald, RA Clayton, JD Gocayne, AR Kerlavage, BA Dougherty, JF Tomb, MD Adams,
+CI Reich, R Overbeek, EF Kirkness, KG Weinstock, JM Merrick, A Glodek, JL Scott,
+NSM Geoghagen, JF Weidman, JL Fuhrmann, D Nguyen, TR Utterback, JM Kelley,
+JD Peterson, PW Sadow, MC Hanna, MD Cotton, KM Roberts, MA Hurst, BP Kaine,
+M Borodovsky, HP Klenk, CM Fraser, HO Smith, CR Woese, and JC Venter. Complete
+genome sequence of the methanogenic archaeon, Methanococcus Jannaschii. Science,
+273(5278):1058–1073, 1996. ISSN 0036-8075. (Cité aux pages xix, 23 et 47.)
+[19] V Calandrini and G Kneller. Influence of pressure on the slow and fast fractional
+relaxation dynamics in lysozyme: A simulation . . . . The Journal of Chemical Physics, Jan
+2008. (Cité à page 135.)
+[20] V Calandrini, V Hamon, K Hinsen, P Calligari, M.-C Bellissent-Funel, and G.R.Kneller.
+Relaxation dynamics of lysozyme in solution under pressure: Combining molecular
+bibliography 169
+dynamics simulations . . . . Chemical Physics, 345:289–297, Jan 2008. (Cité aux pages xxxvii,
+55, 135 et 152.)
+[21] H.B. Callen. Thermodynamics and an introduction to Thermostatistics. John Wiley, 1985.
+(Cité aux pages 9 et 10.)
+[22] PA Calligari, GR Kneller, A Giansanti, P Ascenzi, A Porrello, and A Bocedi. Inhibition
+of viral group-1 and group-2 neuraminidases by oseltamivir: a comparative structural
+analysis by the screwfit algorithm. Submitted, 2007. (Cité à page 123.)
+[23] M Carson, D Johnson, H McDonald, and C Brouillette. His-tag impact on structure.
+Acta Crystallographica Section D, 63(3):295–301, 2007. (Cité aux pages xxii et 50.)
+[24] J.V. Carter, D.G. Knox, and A. Rosenberg. Pressure effects on folded proteins in solution.
+hydrogen exchange at elevated pressures. J. Biol. Chem., 253(6):1947–53, 1978. (Cité à
+page 12.)
+[25] P Carter, CAF Andersen, and B Rost. Dsspcont: continuous secondary structure
+assignements for proteins. Nucleic Acids Research, 31(13):3293–3295, 2003. (Cité à
+page 94.)
+[26] D.A. Case, T.E. CheathamIII, T. Darden, H. Gohlke, R. Luo, K.M. Merz Jr., A. Onufriev,
+C. Simmerling, B. Wang, and R. Woods. The amber biomolecular simulation programs.
+J. Comp. Chem., 26:1668–1688, 2005. (Cité à page 30.)
+[27] D.A. Case, T.A. Darden, T.E. CheathamIII, C.L. Simmerling, J. Wang, R.E. Duke, R. Luo,
+K.M. Merz, D.A. Pearlman, M. Crowley, R.C. Walker, W. Zhang, B. Wang, S. Hayik,
+A. Roitberg, G. Seabra, K.F. Wong, F. Paesani, X. Wu, S. Brozell, V. Tsui, H. Gohlke,
+L. Yang, C. Tan, J. Mongan, V. Hornak, G. Cui, P. Beroza, D.H. Mathews, C. Schafmeister,
+W.S. Ross, and P.A. Kollman. AMBER 9. University of California, San Francisco., 2006.
+(Cité aux pages xxv et 59.)
+[28] M Ceci, C Gaviraghi, C Gorrini, L A Sala, N Offenhauser, PC Marchisio, and S Biffo.
+Release of eIF6 (p27BBP) from the 60S subunit allows 80S ribosome assembly. Nature,
+426:579–584, 2003. (Cité aux pages xx, 25 et 26.)
+[29] A. Certes. Sur la culture, à l’abri des germes atmosphériques, des eaux et des sédiments
+rapportés par les expéditions du travailleur et du talisman. Comptes Rendus, Académie
+des Sciences, 98:690–693, 1884. (Cité aux pages xviii et 19.)
+170 bibliography
+[30] A. Certes. De l’action des hautes pressions sur les phénomènes de la putréfaction et
+sur la vitalité des micro-organismes d’eau douce et d’eau de mer. Comptes Rendus,
+Académie des Sciences, 99:385–388, 1884. (Cité aux pages xviii, 8 et 19.)
+[31] JM Chandonia, G Hon, NS Walker, L Lo Conte, P Koehl, M Levitt, and S E Brenner.
+The astral compendium in 2004. Nucleic Acids Research, 32:D189–D192, 2004. (Cité à
+page 99.)
+[32] M Chasles. Note sur les propriétés générales du système de deux corps semblables
+entr’eux, et placés d’une manière quelconque dans l’espace. Bulletin des Sciences Mathé-
+matiques, Astronomiques, Physiques et Chimiques, 14:321–326, 1830. (Cité aux pages xxx,
+72 et 96.)
+[33] M. Chasles. Rapport sur les Progrès de la Géométrie en France. Imprimerie Nationale, Paris,
+1870. See p. 77. (Cité aux pages xxx, 72 et 96.)
+[34] TP Chendrimada, KJ Finn, X Ji, D Baillat, RI Gregory, SA Liebhaber, AE Pasquinelli,
+and R. Shiekhattar. Microrna silencing through risc recruitment of eif6. Nature, 447:
+823–8, 2007. (Cité à page 25.)
+[35] G. Ciccotti and J.P. Ryckaert. Molecular dynamics simulation of rigid molecules. Comp.
+Phys. Rep., 4:345–392, 1986. (Cité à page 64.)
+[36] B. Cichocki, B.U. Felderhof, and R. Schmitz. Hydrodynamic interactions between two
+spherical particles. PhysicoChemical Hydrodynamics, 10:383, 1988. (Cité à page 57.)
+[37] B. Cichocki, B.U. Felderhof, K. Hinsen, E. Wajnryb, and J. Blawdziewicz. Friction and
+mobility of many spheres in Stokes flow. J. Phys. Chem., 100(5):3780–3790, 1993. (Cité à
+page 135.)
+[38] P. Cioni and G.B. Strambini. Pressure effects on protein flexibility in monomeric proteins.
+J. Mol. Biol., 242(3):291–301, 1994. (Cité à page 12.)
+[39] M. D. Collins, G. Hummer, M.L. Quillin B.W. Matthews, and S. M. Gruner. Cooperative
+water filling of a nonpolar protein cavity observed by high-pressure crystallography
+and simulation. Proc Natl Acad Sci USA, 102(46):16668–16671, 2005. (Cité à page 14.)
+[40] N Colloc’h, C Etchebest, E Thoreau, B Henrissat, and JP Mornon. Comparison of three
+algorithms for the assignment of secondary structure in proteins: the advantages of a
+consensus assignment. Protein Eng., 6(4):377–82, 1993. (Cité aux pages 94, 103 et 106.)
+bibliography 171
+[41] A.R. Cossins and A.G. Macdonald. The adaptation of biological membranes to temper-
+ature and pressure; fish from the deep and cold. J. Bioenerg. Biomembr., 21:115–35, 1989.
+(Cité à page 20.)
+[42] T.E. Creighton. Proteins, Structure and Molecular Properties. Freeman and Company, New
+York, 5th edition, 1997. (Cité aux pages 8, 11 et 13.)
+[43] T.E. Creighton. Disulphide bonds and protein stability. Bioessays, 8(2-3):57–63, 2005.
+(Cité à page 11.)
+[44] E.P. Dahlhoff and G.N. Somero. Pressure and temperature adaptation of cytosolic
+malate dehydrogenases of shallow- and deep-living marine invertebrates: evidence for
+high body temperature in hydrothermal vent animals. J. Exp. Biol., 159:473–87, 1991.
+(Cité à page 20.)
+[45] E.P. Dahlhoff, S. Schneidemann, and G.N. Somero. Pressure-temperature interactions
+on M4-lactate dehydrogenases from hydrothermal vents fishes. Biol. Bull. Woods Hole,
+179:134–139, 1990. (Cité aux pages 20 et 21.)
+[46] S.W. de Leeuw, J.W. Perram, and E.R. Smith. Simulation of electrostatic systems in
+periodic boundary conditions. I. lattice sum and dielectric constant. Proc. R. Soc. Lond.
+A, 373:27–56, 1980. (Cité à page 33.)
+[47] H. De Smedt, H. Olbrechts, and K. Heremans. Phase transitions in artificial membranes:
+high pressure light scattering studies. Europhys. Conf. Abstr. A, Leuwen, 1:98–99, 1975.
+(Cité à page 10.)
+[48] G. Decket and P.V. Warren. The complete genome sequence of the hyperthermophilic
+bacterium aquifex aeolicus. Nature, 392:353–358, 1996. (Cité aux pages xvii et 17.)
+[49] Y. Dehouck, B. Folch, and M. Rooman. Revisiting the correlation between proteins’
+thermoresistance and organisms’ thermophilicity. Protein Eng. Des. Sel., 21(4):275–278,
+2008. (Cité à page 17.)
+[50] R Diamond. A note on the rotational superposition problem. Acta Cryst. A, 44:211–216,
+1988. (Cité aux pages xxx, 96 et 97.)
+[51] H.G. Drickamer and Franck C.W. Electronic transition and high pressure chemistry and
+physics of solids. London: Chapman and Hall, 1973. (Cité à page 11.)
+172 bibliography
+[52] A. Erdélyi, W. Magnus, F. Oberhettinger, and F.G. Tricomi. Higher Transcendental
+Functions. McGraw Hill, 1955. (Cité à page 136.)
+[53] P. Ewald. Die Berechnung optischer und electrostatischer Gitterpotentiale. Ann. Phys.,
+64:253–87, 1921. (Cité à page 33.)
+[54] H Fischer. Average protein density is a molecular-weight-dependent function. Protein
+Science, 13(10):2825–2828, Oct 2004. doi: 10.1110/ps.04688204. (Cité à page 58.)
+[55] R.J. Frankenberg, M. Andersson, and D.S. Clark. Effect of temperature and pressure
+on the proteolytic specificity of the recombinant 20S proteasome from methanococcus
+jannaschii. Extremophiles, 7:353–360, 2003. (Cité aux pages xix et 23.)
+[56] D. Frenkel and B. Smit. Understanding Molecular Simulation. Academic Press, London,
+San Diego, 1996. (Cité aux pages xxi et 37.)
+[57] D. Frishman and P. Argos. Knowledge-based secondary structure assignment. Proteins,
+23:566–579, 1995. (Cité aux pages 72, 94 et 103.)
+[58] F. Gaill. Aspects of life development at deep sea hydrothermal vents. FASEB J., 7(6):
+558–565, 1993. (Cité aux pages xvi et 16.)
+[59] C.W. Gardiner. Handbook of Stochastic Methods. Springer Series in Synergetics. Springer,
+Berlin, Heidelberg, New York, 2nd edition, 1985. (Cité à page 136.)
+[60] K. Gekko and Y. Hasegawa. Compressibility/structure relationship of globular proteins.
+Biochemistry, 25:6563–6571, 1986. (Cité à page 14.)
+[61] K. Gekko and Y. Hasegawa. Effect of temperature on the compressibility of native
+globular proteins. J. Phys. Chem., 93:426–429, 1989. (Cité à page 14.)
+[62] K. Gekko and H. Noguchi. Compressibility of globular proteins in water at 25 c. J. Phys.
+Chem., 83:2706–2714, 1979. (Cité à page 11.)
+[63] M. Gerstein and C. Chothia. Packing at the protein-water interface. Proc Natl Acad Sci
+USA, 93:10167–10172, 1996. (Cité à page 59.)
+[64] W.G. Glöckle and T.F. Nonnenmacher. A fractional calculus approach to self-similar
+protein dynamics. Biophys. J., 68:46–53, 1995. (Cité aux pages 135 et 137.)
+[65] K. Goosens, L. Smeller, and K. Heremans. Pressure tuning spectroscopy of the low-
+frequency raman spectrum of liquid amides. J. Chem. Phys., 99:5736–5741, 1993. (Cité à
+page 12.)
+bibliography 173
+[66] C M Groft, R Beckmann, A Sali, and S K Burley. Crystal structures of ribosome
+anti-association factor IF6. Nature Structural Biology, 7(12):1156–64, Dec 2000. doi:
+10.1038/82017. (Cité aux pages xx, xxi, xxii, 25, 26, 27, 51, 60, 61, 64, 121 et 124.)
+[67] M. Gross and R. Jaenicke. Proteins under pressure. Eur. J. Biochem., 221:617–630, 1994.
+(Cité aux pages 11, 13, 19 et 22.)
+[68] M. Gross, K. Lehle, R. Jaenicke, and K.H. Nierhaus. Pressure-induced dissociation of
+ribosomes and elongation cycle intermediates. stabilizing conditions and identification
+of the most sensitive functional state. Eur. J. Biochem., 218:463–468, 1993. (Cité à page 22.)
+[69] A Grottesi, MA Ceruso, A Colosimo, and A Di Nola. Molecular dynamics study of a
+hyperthermophilic and a mesophilic rubredoxin. Proteins Structure Function and Genetics,
+46(3):287–294, 2002. (Cité aux pages xvii, 18 et 158.)
+[70] G.D. Hawkins, C.J. Cramer, and D.G. Truhlar. Pairwise solute descreening of solute
+charges from a dielectric medium. Chem. Phys. Lett., 246:122–129, 1995. (Cité à page 62.)
+[71] G.D. Hawkins, C.J. Cramer, and D.G. Truhlar. Parametrized models of aqueous free
+energies of solvation based on pairwise descreening of solute atomic charges from a
+dielectric medium. J. Phys. Chem., 100:19824–19839, 1996. (Cité à page 62.)
+[72] S.A. Hawley. Reversible pressure-temperature denaturation of chymotrypsinogen.
+Biochemistry, 10:2436–42, 1971. (Cité à page 10.)
+[73] S.A. Hawley and R.M. Macleod. The effect of base composition on the pressure stability
+of dna in neutral salt solution. Biopolymers, 16:1833–35, 1977. (Cité à page 10.)
+[74] D.J. Hei and D.S. Clark. Pressure stabilization of proteins from extreme thermophiles.
+Appl. Environ. Microbiol., 60:932–939, 1994. (Cité aux pages xix, 13 et 23.)
+[75] K. Heremans and L. Smeller. Protein structure and dynamics at high pressure. Biochem.
+et Biophys. Acta, 1386:353–370, 1998. (Cité à page 8.)
+[76] L. Heremans and K. Heremans. Pressure effects on the raman spectrum of proteins:
+stability of the salt bridge in trypsin and elastase. J. Mol. Struct., 214:305–314, 1989.
+(Cité à page 11.)
+[77] L. Heremans and K. Heremans. Raman spectroscopic study of the changes in secondary
+structure of chymotrypsin: Effect of ph and pressure on the salt bridge. Biochem. et
+Biophys. Acta, 999:192–197, 1989. (Cité à page 11.)
+174 bibliography
+[78] D.M. Heyes. Electrostatic potentials and fields in infinite point charge lattice. J. Chem.
+Phys., 74:1924–29, 1981. (Cité à page 33.)
+[79] K Hinsen. The molecular modeling toolkit: A new approach to molecular simulations.
+J. Comp. Chem., 21:79–85, 2000. (Cité à page 91.)
+[80] K. Hinsen and G.R Kneller. A simplified force field for describing vibrational protein
+dynamics over the whole frequency range. J. Chem. Phys., 111(24):10766–10769, 1999.
+(Cité à page 14.)
+[81] K Hinsen and GR Kneller. Projection methods for the analysis of complex motions in
+macromolecules. Mol. Sim., 23:275–292, 2000. (Cité à page 99.)
+[82] K. Hinsen, A.-J. Petrescu, S. Dellerue, M.C. Bellissent-Funel, and G.R. Kneller. Har-
+monicity in slow protein dynamics. Chem. Phys., 261(1+2):25–38, 2000. Special Issue
+"Condensed Phase Structure and Dynamics: A combined neutron scattering and molec-
+ular modelling approach". (Cité à page 14.)
+[83] G. Hui Bon Hoa, M. Graffe, and M. Grunberg-Manago. Thermodynamic studies of the
+reversible association of escherichia coli ribosomal subunits. Biochemistry, 16(12):2800–5,
+1977. (Cité à page 22.)
+[84] U Hobohm and C Sander. Enlarged representative set of protein structures. Protein
+Science, 3:522, 1994. (Cité à page 99.)
+[85] K. Horikoshi. Barophiles: deep-sea microorganisms adapted to an extreme environment.
+Curr. Opin. Microbiol., 1:291–295, 1998. (Cité aux pages xvi et 16.)
+[86] Viktor Hornak, Robert Abel, Asim Okur, Bentley Strockbine, Adrian Roitberg, and
+Carlos Simmerling. Comparison of multiple amber force fields and development
+of improved protein backbone parameters. Proteins, 65(3):712–725, Nov 2006. doi:
+10.1002/(ISSN)1097-0134. (Cité aux pages xxv, 30 et 59.)
+[87] G. Hummer, S. Garde, A.E. Garcia, M.E. Paulaitis, and L.R. Pratt. The pressure depen-
+dence of hydrophobic interactions is consistent with the observed pressure denaturation
+of proteins. PNAS, 95:1552–1555, 1998. (Cité aux pages 13 et 14.)
+[88] William Humphrey, Andrew Dalke, and Klaus Schulten. Vmd – visual molecular
+dynamics. Journal of Molecular Graphics, 14:33–38, 1996. (Cité à page 91.)
+bibliography 175
+[89] G Hutchinson. Promotif - a program to identify structural motifs in proteins. Protein
+Science, 5:212–220, 1996. (Cité aux pages 83 et 94.)
+[90] J.K. Ichikawa and S. Clarke. A highly active protein repair enzyme from the extreme
+thermophile T. maritima. Arch. Biophys. Biochem., 358:222–231, 1998. (Cité à page 17.)
+[91] R. Jaenicke. Current perspectives in high pressure biology, pages 257–272. Academic Press,
+1987. (Cité à page 22.)
+[92] R. Jaenicke. Protein stability and molecular adaptation to extreme conditions. Eur. J.
+Biochem., 202:715–728, 1991. (Cité aux pages xvi, xvii, 16, 17, 18 et 152.)
+[93] R Jaenicke. Stability and stabilization of globular proteins in solution. J Biotechnol, 79
+(3):193–203, May 2000. (Cité aux pages xvi, xvii, 10, 16, 17 et 18.)
+[94] R Jaenicke. Do ultrastable proteins from hyperthermophiles have high or low confor-
+mational rigidity? Proceedings of the National Academy of Sciences, 97(7):2962, 2000. (Cité
+aux pages 11 et 17.)
+[95] R. Jaenicke and G. Bohm. Stabilization of proteins: what extremophiles teach us about
+protein stability. Curr. Opin. Struct. Biol., 8:738–748, 1998. (Cité aux pages 13 et 17.)
+[96] R. Jaenicke and G. Bohm. Thermostability of proteins from thermotoga maritima.
+Methods Enzymol, 334:438–469, 2001. (Cité aux pages xvii et 18.)
+[97] R. Jaenicke, G. Bernhardt, H.D. Ludemann, and K.O. Stetter. Pressure induced al-
+terations in the protein pattern of the thermophilic archaebacterium methanococcus
+thermolithotrophicus. Appl. Environ. Microbiol., 54:2375–80, 1988. (Cité à page 19.)
+[98] H.W. Jannasch and C.D. Taylor. Deep-sea microbiology. Ann. Rev. Microbiol., 38:487–514,
+1984. (Cité aux pages xviii, 19 et 21.)
+[99] J. Jonas. High-resolution nuclear magnetic resonance studies of proteins. Biochimica
+Biophysica Acta, 1595(1-2):145–159, 2002. (Cité à page 8.)
+[100] J. Jonas and A. Jonas. High-pressure nmr spectroscopy of proteins and membranes.
+Ann. Rev. Biophys. Biomol. Struct., 23:287–318, 1994. (Cité à page 15.)
+[101] DT Jones. Protein secondary structure prediction based on position-specific scoring
+matrices. J. Mol. Biol., 292:195–202, 1999. (Cité à page 52.)
+176 bibliography
+[102] W. Jones, J. A. Leigh, F. Mayer, C. R. Woese, and R. S. Wolfe. Methanococcus jannaschii
+sp. nov., an extremely thermophilic methanogen from a submarine hydrothermal vent.
+Arch. Microbiol., 136:254, 1983. (Cité aux pages xix, 22 et 23.)
+[103] William L Jorgensen, Jayaraman Chandrasekhar, Jeffry D Madura, Roger W Impey,
+and Michael L Klein. Comparison of simple potential functions for simulating liquid
+water. The Journal of Chemical Physics, 79(2):926, Jan 1983. doi: 10.1063/1.445869. (Cité à
+page 31.)
+[104] WL Jorgensen, J Chandrasekhar, JD Madura, RW Impey, and ML Klein. Comparison of
+simple potential functions for simulating liquid water. The Journal of Chemical Physics,
+79:926, 1983. (Cité à page 31.)
+[105] C. Josefiak and G.M. Schneider. Determination of reaction volumes of hydrogen-bonding
+equilibria by high-pressure near-infrared spectroscopy. 2. Self-association of phenol in
+CCl4 up to 1 kbar. J. Phys. Chem., 84:3004–7, 1980. (Cité à page 12.)
+[106] W. Kabsch and C. Sander. Dictionary of protein secondary structure: Pattern recognition
+of hydrogen-bonded and geometrical features. Biopolymers, 22:2577–2637, 1983. (Cité
+aux pages 72, 82, 94 et 103.)
+[107] C. Kato and D.H. Bartlett. The molecular biology of barophilic bacteria. Extremophiles,
+1:111–116, 1997. (Cité aux pages xvi, 16 et 19.)
+[108] C. Kato, A. Inoue, and K. Horikoshi. Isolating and characterizing deep-sea marine
+organisms. Trends Biotechnol., 14:6–12, 1996. (Cité à page 19.)
+[109] W. Kauzmann. Some factors in the interpretation of protein denaturation. Adv. Protein
+Chem, 14:1–67, 1959. (Cité à page 12.)
+[110] W. Kauzmann. Thermodynamics of unfolding. Nature, 325:723–724, 1987. (Cité à
+page 12.)
+[111] SE Kearsley. On the orthogonal transformation used for structural comparisons. Acta
+Cryst. A, 45:208–210, 1989. (Cité aux pages 73 et 74.)
+[112] G Kneller and V Calandrini. Estimating the influence of finite instrumental resolution
+on elastic neutron scattering intensities . . . . The Journal of Chemical Physics, Jan 2007.
+(Cité à page 138.)
+bibliography 177
+[113] Gerald R Kneller. Quasielastic neutron scattering and relaxation processes in proteins:
+analytical and simulation-based models. Physical chemistry chemical physics : PCCP, 7
+(13):2641–55, Jul 2005. doi: 10.1039/b502040a. (Cité à page 135.)
+[114] Gerald R Kneller and Paolo Calligari. Efficient characterization of protein secondary
+structure in terms of screw motions. Acta Crystallographica Section D, 62(3):302–311, 2006.
+(Cité aux pages xxx, 95, 96, 97, 100, 101, 102, 106 et 109.)
+[115] G.R. Kneller. Superposition of molecular structures using quaternions. Mol. Sim., 7:
+113–119, 1991. (Cité aux pages xxx, 73, 74, 88, 96, 97 et 139.)
+[116] G.R. Kneller. Comment on “Using quaternions to calculate RMSD” [J. Comp. Chem. 25,
+1849 (2004)]. J. Comp. Chem., 26(15):1660–1662, 2005. (Cité aux pages xxx, 75, 96 et 97.)
+[117] G.R. Kneller. Quasielastic neutron scattering and relaxation processes in proteins:
+Analytical and simulation-based models. Physical Chemistry Chemical Physics, 7:2641 –
+2655, 2005. (Cité aux pages 136 et 137.)
+[118] GR Kneller and K Hinsen. Computing memory functions from molecular dynamics
+simulations. J. Chem. Phys., 115(24):11097–11105, 2001. (Cité à page 61.)
+[119] GR Kneller and K Hinsen. Fractional brownian dynamics in proteins. J. Chem. Phys.,
+121(20):10278–10283, 2004. (Cité aux pages xxxvii et 135.)
+[120] GR Kneller, V Keiner, M Kneller, and M Schiller. Nmoldyn, a program package for the
+calculation and analysis of neutron scattering spectra from md simulations. Comp. Phys.
+Comm., 91:191–214, 1995. (Cité à page 88.)
+[121] CE Kundrot and FM Richards. Crystal structure of hen egg-white lysozyme at a
+hydrostatic pressure of 1000 atmospheres. J. Mol. Biol., 193:157–170, 1987. (Cité aux
+pages 14, 15, 83, 84 et 85.)
+[122] J Kyte and RF Doolittle. A simple method for displaying the hydropathic character of a
+protein. J. Mol. Biol., 157:105, 1982. (Cité aux pages xxiii et 52.)
+[123] G Labesse, N Colloc’h, J Pothier, and J P Mornon. P-sea: a new efficient assignment of
+secondary structure from c alpha trace of proteins. Comput. Appl. Biosci., 13:291–295,
+1997. (Cité à page 103.)
+178 bibliography
+[124] J.V. Landau and D.H. Pope. Recent advances in the area of barotolerant protein synthesis
+in bacteria and implications concerning barotolerant and barophilic growth. Adv. Aquat.
+Micro., 2:49–76, 1980. (Cité à page 22.)
+[125] J.V. Landau, W.P. Smith, and D.H. Pope. Role of the 30s ribosomal subunit, initiation
+factors, and specific ion concentration in barotolerant protein synthesis in pseudomonas
+bathycetes. J. Bacteriol., 130:154–59, 1977. (Cité à page 22.)
+[126] H. Le Chatelier. Sur un énoncé général des lois des équilibres chimiques. Comptes
+Rendus, Académie des Sciences, 99:786–89, 1884. (Cité à page 9.)
+[127] V. Le Tilly, O. Sire, B. Alpert, and P.T.T. Wong. An infrared study of 2H-bond variation
+in myoglobin revealed by high pressure. Eur. J. Biochem., 205:1061–1065, 1992. (Cité à
+page 12.)
+[128] M Levitt and J Greer. Automatic identification of secondary structure in globular
+proteins. J. Mol. Biol., 114:181–239, 1977. (Cité à page 103.)
+[129] SW Lovesey. Theory of Neutron Scattering from Condensed Matter, volume I. 1984. (Cité
+aux pages xxi et 38.)
+[130] P.S. Low, J.L. Bada, and G.N. Somero. Temperature adaptation of enzymes: Roles of
+the free energy, the enthalpy, and the entropy of activation. Proc Natl Acad Sci USA, 70:
+430–43, 1973. (Cité à page 21.)
+[131] E. Madelung. Das elektrische Feld in Systemen von regelmäßig angeordneten Punkt-
+ladungen. Phys. Z., 22:861–8, 1918. (Cité à page 33.)
+[132] P. Masson and C. Clery. Effect of pressure on structure and activity of cholinesterase.
+In A.S. Balasubramanian, B.P. Doctor, P. Taylor, and D.M. Quinn, editors, Enzymes of the
+Cholinesterase Family. Plenum, New York, 1995. (Cité à page 15.)
+[133] P. Masson, C. Clery, P. Guerra, A. Redslob, C. Albaret, and P.L. Fortier. Enzymes -
+hydration change during the aging of phosphorylated human butyrylcholinesterase:
+Importance of residues aspartate-70 and glutamate-197 in the water network as probed
+by hydrostatic and osmotic pressures. Biochemical Journal, 343:361–370, 1999. (Cité à
+page 14.)
+[134] B.W. Matthews. Structural and genetic analysis of protein stability. Ann. Rev. Biochem.,
+62:139–160, 1993. (Cité à page 18.)
+bibliography 179
+[135] B.W. Matthews. Studies on protein stability with t 4 lysozyme. Adv. Protein Chem, 46:
+249–278, 1995. (Cité à page 18.)
+[136] B.W. Matthews. Structural and genetic analysis of the folding and function of t4
+lysozyme. FASEB J., 10:35–41, 1996. (Cité à page 18.)
+[137] R. Metzler and J. Klafter. The random walk’s guide to anomalous diffusion: A fractional
+dynamics approach. Phys. Rep., 339:1–77, 2000. (Cité à page 135.)
+[138] P.C. Michels and D.S. Clark. Pressure enhanced activity and stability of a hyperther-
+mophilic protease from a deep-sea methanogen. Appl. Environ. Microbiol., 63:3985–3991,
+1997. (Cité aux pages xix, 13 et 23.)
+[139] P.C. Michels, D. Hei, and D.S. Clark. Pressure effects on enzyme activity and stability
+at high temperature. Adv. Protein Chem, 48:341–376, 1996. (Cité aux pages 11 et 13.)
+[140] S. Miller and J.L. Bada. Submarine hot springs and the origin of life. Nature, 342:255,
+1988. (Cité à page 17.)
+[141] S. Miller and A. Lazcano. The origin of life—did it occur at high temperatures? J. Mol.
+Evol., 41:689, 1995. (Cité à page 17.)
+[142] Zoran Minic, Valérie Serre, and Guy Hervé. Adaptation of organisms to extreme
+conditions of deep-sea hydrothermal vents. C R Biol, 329(7):527–40, Jul 2006. doi:
+10.1016/j.crvi.2006.02.001. (Cité à page 21.)
+[143] E. Mombelli, M. Afshar, P. Fusi, M. Mariani, P. Tortora, J.P. Connelly, and R. Lange. The
+role of phenylalanine 31 in maintaining the conformational stability of ribonuclease
+p2 from sulfolobus solfataricus under extreme conditions of temperature and pressure.
+Biochemistry, 36(29):8733–42, 1997. (Cité à page 8.)
+[144] V.V Mozhaev, K Heremans, J Frank, P Masson, and Claude Balny. High pressure effects
+on protein structure and function. Proteins: Structure, Function, and Genetics, 24:81–91,
+Nov 1996. (Cité aux pages xvi, 11 et 14.)
+[145] A. G. Murzin, S. E. Brenner, T. Hubbard, and C. Chothia. Scop: a structural classification
+of proteins database for the investigation of sequences and structures. J. Mol. Biol., 247:
+536–540, 1995. (Cité aux pages 80 et 99.)
+[146] A. Onufriev, D. Bashford, and D.A. Case. Modification of the generalized born model
+suitable for macromolecules. J. Phys. Chem. B, 104:3712–3720, 2000. (Cité à page 62.)
+180 bibliography
+[147] C.N. Pace, B.A. Shirley, M. McNutt, and K. Gajiwala. Forces contributing to the
+conformational stability of proteins. FASEB J., 10:75–83, 1996. (Cité aux pages xvii, 17
+et 18.)
+[148] E Paci and M Marchi. Intrinsic compressibility and volume compression in solvated
+proteins by molecular dynamics simulation at high pressure. Proc Natl Acad Sci USA,
+93(21):11609–11614, 1996. (Cité à page 14.)
+[149] A.A. Paladini, J.L. Silva, and G. Weber. Slab gel electrophoresis of oligomeric proteins
+under high hydrostatic pressure. Anal. Biochem., 161:358–364, 1987. (Cité à page 15.)
+[150] X. Peng, J. Jonas, and J.L. Silva. High-pressure nmr study of the dissociation of arc
+repressor. Biochemistry, 33:8323–8329, 1994. (Cité à page 15.)
+[151] G.A. Petsko. Structural basis of thermostability in hyperthermophilic proteins, or
+"there’s more than one way to skin a cat". Methods Enzymol, 334:469–478, 2001. (Cité
+aux pages xvi, xvii, 16 et 18.)
+[152] M. Potchka and T.M. Schuster. Determination of reaction volumes and polymer
+distribution characteristic of tobacco mosaic virus coat protein. Anal. Biochem., 161:
+70–79, 1987. (Cité à page 15.)
+[153] P.L. Privalov. In T.E. Creighton, editor, Protein folding, pages 83–126. W.H. Freeman and
+Company, New York, 1993. (Cité à page 13.)
+[154] O.B. Ptitsyn. The molten globule state. In T.E. Creighton, editor, Protein Folding, pages
+243–300. Freeman and Company, 1992. (Cité à page 15.)
+[155] J.R. Quine. Helix parameters and protein structure using quaternions. J. Mol. Struct.
+(Theochem), 460:53–66, 1999. (Cité à page 72.)
+[156] GPS Raghava. APSSP2 : A combination method for protein secondary structure
+prediction based on neural network and example based learning. CASP5, A:132, 2002.
+(Cité à page 52.)
+[157] R. Ragone and G. Colonna. Do globular proteins require some structural peculiarity
+to best function at high temperatures? J. Am. Chem. Soc., 117:16–20, 1995. (Cité aux
+pages xvii et 18.)
+[158] A. Razvi and J.M. Scholtz. Lessons in stability from thermophilic proteins. Protein
+Science, 15(7):1569, 2006. (Cité aux pages xvi, xvii, 16 et 18.)
+bibliography 181
+[159] M. Refaee, T. Tezuka, K. Akasaka, and M.P. Williamson. Pressure-dependent changes
+in the solution structure of hen egg-white lysozyme. J. Mol. Biol., 327:857–865, 2003.
+(Cité aux pages 83 et 85.)
+[160] P. Regnard. La vie dans les eaux. Paris, 1891. (Cité à page 8.)
+[161] L.E. Reichl. A modern course in Statistical Mechanics. Arnold Publishers, 1980. (Cité à
+page 10.)
+[162] R.E. Rhoads. Signal transduction pathways that regulate eukaryotic protein synthesis.
+J. Biol. Chem., 274:30337–30340, 1999. (Cité à page 22.)
+[163] FM Richards and CE Kundrot. Identification of structural motifs from protein coordinate
+data: Secondary structure and first-level supersecondary structure. Proteins, 3:71–84,
+1988. protein secondary structure recognition. (Cité aux pages 72, 94 et 103.)
+[164] H. Risken. The Fokker-Planck Equation. Springer Series in Synergetics. Springer, Berlin,
+Heidelberg, New York, 2nd reprinted edition, 1996. (Cité aux pages 134 et 136.)
+[165] K.K. Rodgers and S.G. Sligar. Mapping electrostatic interactions in macromolecular
+associations. J. Mol. Biol., 221:1453–1460, 1991. (Cité à page 11.)
+[166] T. Rog, K. Murzyn, K. Hinsen, and G.R. Kneller. nMoldyn : A Program Package for
+a Neutron Scattering Oriented Analysis of Molecular Dynamics Simulations. J. Comp.
+Chem., 24(5):657–667, 2003. (Cité aux pages 88 et 139.)
+[167] L.J. Rothschild and R. Mancinelli. Life in extreme environments. Nature, 409:1092–1102,
+2001. (Cité à page 17.)
+[168] C. Royer. Revisiting volume changes in pressure-induced protein unfolding. BBA
+Biochem. et Biophys. Acta, 1595:201–9, 2002. (Cité à page 13.)
+[169] K. Ruan, C. Xu, Y. Yu, J. Li, R. Lange, N. Bec, and C. Balny. Pressure-exploration of the
+33-kDa protein from the spinach photosystem II particle. Eur. J. Biochem., 268:2742–50,
+2001. (Cité à page 8.)
+[170] D.W. Russell and L.L. Spremulli. Purification and characterization of a ribosome
+dissociation factor (eukaryotic initiation factor 6) from wheat germ. J. Biol. Chem., 254
+(18):8796–8800, 1979. (Cité aux pages xx, 23 et 25.)
+182 bibliography
+[171] S. Samarasinghe, D.M. Campbell, A. Jonas, and J. Jonas. High-resolution nmr study of
+the pressure-induced unfolding of lysozyme. Biochemistry, 31:7773–7778, 1992. (Cité à
+page 15.)
+[172] F. Sanvito. Expression of a highly conserved protein, p27BBP, during the progression
+of human colorectal cancer. Cancer Res., 60:510–516, 2000. (Cité à page 159.)
+[173] F. Sanvito, S. Piatti, A. Villa, M. Bossi, G. Lucchini, P.C. Marchisio, and S. Biffo. The β4
+integrin interactor p27(bbp/eif6) is an essential nuclear matrix protein involved in 60s
+ribosomal subunit assembly. J. Cell Biol., 144:823–837, 1999. (Cité aux pages xx et 24.)
+[174] M.J. Schlesinger. Heat-shock proteins. J. Biol. Chem., 265(21):12111, 1990. (Cité à
+page 19.)
+[175] V. Sears. Neutron scattering lengths and cross sections. Neutron News, 3(3):26–37, 1992.
+(Cité à page 41.)
+[176] J.M. Selig. Geometrical methods in robotics. Springer, 1996. (Cité à page 72.)
+[177] B. Senger, D. L.J. Lafontaine, J-S Graindorge, O Gadal, A Camasses, A Sanni, J-M
+Garnier, M Breitenbach, E Hurt, and F Fasiolo. The nucle(ol)ar tif6p and efl1p are
+required for a late cytoplasmic step of ribosome synthesis. Molecular Cell, 8:1–20, 2001.
+(Cité aux pages xx et 24.)
+[178] K. Si and U Maitra. The saccharomyces cerevisiae homologue of mammalian translation
+initiation factor 6 does not function as a translation initiation factor. Molecular and
+Cellular Biology, 19(2):1416–1426, 1999. (Cité aux pages xx, 24 et 25.)
+[179] J.F. Siebenaller and G.N. Somero. Biochemical adaptation to the deep sea. CRC Crit.
+Rev. Aquat. Sci., 1:1–25, 1989. (Cité à page 20.)
+[180] J.L. Silva and G. Weber. Pressure stability of proteins. Ann. Rev. Phys. Chem., 44:89–113,
+1993. (Cité aux pages 14 et 15.)
+[181] H Sklenar, C Etchebest, and R Lavery. Describing protein structure: A general algorithm
+yielding complete helicoïdal parameters and a unique overall axis. Proteins: Str. Func.
+Genet., 6:46–60, 1989. (Cité aux pages 72, 94 et 103.)
+[182] G.N. Somero. Adaptations to high hydrostatic pressure. Annu. Rev. Physiol., 54:557–577,
+1992. (Cité aux pages xvi, 16 et 20.)
+bibliography 183
+[183] G.N. Somero, J.F. Siebenaller, and P.W. Hochachka. In G.T. Rowe, editor, The Sea. Wiley,
+1983. (Cité à page 21.)
+[184] J. M. Sperrazza, D. W. Russell, and L. L. Spremulli. Reversible dissociation of wheat
+germ ribosomal subunits: cation-dependent equilibriums and thermodynamic parame-
+ters. Biochemistry, 19(6):1053–1058, 1980. (Cité à page 22.)
+[185] A.S. Spirin. On the equilibrium of the association-dissociation reaction of ribosomal
+subparticles and on the existence of the so-called "60s intermediate" ("swollen 70s")
+during centrifugation of the equilibrium mixture. FEBS Letters, 14:349–353, 1971. (Cité
+à page 22.)
+[186] A.S. Spirin. Ribosomes. Cellular Organelles Series. Kluwer Academic/ Plenum Publisher,
+1998. (Cité à page 24.)
+[187] L. Stryer. Biochemistry. W.H. Freeman and Company, 1988. (Cité aux pages 8, 13, 72
+et 94.)
+[188] M.M.C. Sun, N. Tolliday, C. Vetriani, F. T. Robb, and D. S. Clark. Pressure-induced
+thermostabilization of glutamate dehydrogenase from the hyperthermophile pyrococcus
+furiosus. Protein Science, 8:1056–1063, 1999. (Cité à page 21.)
+[189] C. Tanford. Protein denaturation. Adv. Protein Chem, 23:121–282, 1968. (Cité à page 8.)
+[190] WR Taylor. Defining linear segments in protein structure. J. Mol. Biol., 310:1135–1150,
+2001. protein secondary structure recognition. (Cité aux pages 72 et 94.)
+[191] M Tehei and G Zaccai. Adaptation to high temperatures through macromolecular
+dynamics by neutron scattering. FEBS Journal, Jan 2007. (Cité aux pages xvi, 16 et 152.)
+[192] Moeava Tehei, Bruno Franzetti, Dominique Madern, Margaret Ginzburg, Ben Z
+Ginzburg, Marie-Thérèse Giudici-Orticoni, Mireille Bruschi, and Giuseppe Zaccai. Adap-
+tation to extreme environments: macromolecular dynamics in bacteria compared in vivo
+by neutron scattering. EMBO Rep, 5(1):66–70, Jan 2004. doi: 10.1038/sj.embor.7400049.
+(Cité aux pages 152 et 158.)
+[193] R.M. Thaokar. Brownian motion of a torus. Colloids and Surfaces A : Physicochem. Eng.
+Aspects, 317:650–657, 2008. (Cité aux pages 165 et 166.)
+[194] Thomas. The graduation of secondary structure elements. J. Mol. Graphics, 12:146–152,
+1994. (Cité aux pages 72 et 94.)
+184 bibliography
+[195] D.J. Tobias, G.J. Martyna, and M.L. Klein. Molecular Dynamics simulations of a protein
+in the canonical ensemble. J. Phys. Chem., 97:12959–12966, 1993. (Cité aux pages xxvi
+et 36.)
+[196] J Torrent, MT Alvarez-Martinez, F Heitz, JP Liautard, C Balny, and Reinhard Lange.
+Insights into alternative prion protein topologies induced under high hydrostatic
+pressure. J. Phys.: Condens. Matter, 16:S1059–S1065, 2004. (Cité à page 16.)
+[197] C.L. Tsou. Folding of the nascent peptide chain into a biologically active protein.
+Biochemistry, 27:1809–1812, 1988. (Cité aux pages xvii et 18.)
+[198] V. Tsui and D.A. Case. Theory and applications of the generalized born solvation model
+in macromolecular simulations. Biopolymers (Nucl. Acid. Sci.), 56:275–291, 2001. (Cité à
+page 61.)
+[199] D M Valenzuela, A Chaudhuri, and U Maitra. Eukaryotic ribosomal subunit anti-
+association activity of calf liver is contained in a single polypeptide chain protein of mr
+= 25,500 (eukaryotic initiation factor 6). J Biol Chem, 257(13):7712–9, Jul 1982. (Cité aux
+pages xx, 23, 25 et 53.)
+[200] R. Van Eldik, T. Asano, and W.J. Le Noble. Activation and reaction volume in solution
+2. Chem. Rev., 89:549–688, 1989. (Cité aux pages 11 et 12.)
+[201] L. van Hove. Correlations in space and time and Born approximation in systems of
+interacting particles. Phys. Rev., 93(1):249–262, 1954. (Cité à page 39.)
+[202] M.C. Vaney, S. Maignan, M. Ries-Kautt, and A. Ducruix. High-resolution structure (1.33
+Å) of a hew lysozyme tetragonal crystal grown in the apcf apparatus. data and structural
+comparison with a crystal grown under microgravity from spacehab-01 mission. Acta
+Crystallogr. D, 52:505–517, 1996. (Cité aux pages 83 et 85.)
+[203] Guoli Wang and Roland L Dunbrack. Pisces: a protein sequence culling server. Bioinfor-
+matics, 19(12):1589–91, Aug 2003. (Cité à page 99.)
+[204] Guoli Wang and Roland L Dunbrack. Pisces: recent improvements to a pdb sequence
+culling server. Nucleic Acids Res, 33(Web Server issue):W94–8, Jul 2005. doi: 10.1093/
+nar/gki402. (Cité à page 99.)
+[205] M.C. Wang and G.E. Uhlenbeck. On the theory of Brownian motion II. Rev. Mod. Phys.,
+17(2-3):323–342, 1945. (Cité à page 136.)
+bibliography 185
+[206] G. Weber and H.G. Drickamer. The effect of high pressure upon proteins and other
+biomolecules. Quart. Rev. of Biophys., 16(1):89–112, 1983. (Cité à page 14.)
+[207] G. Weber, F. Tanaka, B.Y. Okamoto, and H.G. Drickamer. The effect of pressure on the
+molecular complex of isoalloxazine and adenine. Proc Natl Acad Sci USA, 71:1264–66,
+1974. (Cité à page 12.)
+[208] C. Wilson and S. Doniach. A computer model to dynamically simulate protein folding:
+studies with crambin. Proteins Structure Function and Genetics, 6:193, 1989. (Cité à
+page 65.)
+[209] A Wlodawer, J Walter, R Huber, and L Sjölin. Structure of bovine pancreatic trypsin
+inhibitor. results of joint neutron and x-ray refinement of crystal form ii. J. Mol. Biol.,
+180:301–329, 1984. (Cité à page 109.)
+[210] A Wlodawer, J Nachman, GL Gilliland, W Gallagher, and C Woodward. Structure of
+form iii crystals of bovine pancreatic trypsin inhibitor. J. Mol. Biol., 198:469–480, 1987.
+(Cité à page 109.)
+[211] P.T.T. Wong and K. Heremans. Pressure effects on protein secondary structure and
+hydrogen deuterium exchange in chymotrypsinogen: a fourier transform infrared
+spectroscopic study. BBA Biochimica Biophysica Acta, 956:1–9, 1988. (Cité à page 16.)
+[212] L.C. Wood, M N Ashby, C Grunfeld, and K R Feingold. Cloning of murine translation
+initiation factor 6 and functional analysis of the homologous sequence YPR016c in
+saccharomyces cerevisiae. J. Biol. Chem., 274:11653–11659, 1999. (Cité aux pages xx et 24.)
+[213] B. Wroblowski, J.F. Diaz, K. Heremans, and Y. Engelborghs. Molecular mechanisms
+of pressure induced conformational changes in bpti. Proteins Structure Function and
+Genetics, 25:446–455, 1996. (Cité à page 13.)
+[214] H. Yang, G. Luo, P. Karnchanaphanurach, T.M. Louie, I. Rech, S. Cova, L. Xun, and
+X.S. Xie. Protein conformational dynamics probed by single-molecule electron transfer.
+Science, 302(5643):262–266, 2003. (Cité à page 135.)
+[215] S. Yokoyama, T. Tada, H. Zhang, and L. Britt. Elucidation of phenotypic adaptations:
+Molecular analyses of dim-light vision proteins in vertebrates. Proc Natl Acad Sci USA,
+105(36):13480–13485, 2008. (Cité à page 159.)
+[216] G Zaccai. How soft is a protein? a protein dynamics force constant measured by neutron
+scattering. Science, 288:1604–1607, 2000. (Cité aux pages 130 et 135.)
+186 bibliography
+[217] P. Závodszky, J. Kardos, A. Svingor, and G. A. Petsko. Adjustment of conformational
+flexibility is a key event in the thermal adaptation of proteins. Proc Natl Acad Sci USA,
+95:7406–7411, 1998. (Cité aux pages xvii et 18.)
+[218] J. Zhang, X. Peng, A. Jonas, and J. Jonas. Nmr study of the cold, heat, and pressure
+unfolding of ribonuclease a. Biochemistry, 34:8631–8641, 1995. (Cité à page 13.)
+[219] J.M. Zhou, L. Zhu, C. Balny, and S. Perret. Pressure denaturation of the yeast prion
+protein ure2. Biochem. Biophys. Res. Comm., 287:147–152, 2001. (Cité à page 8.)
+[220] C.E. ZoBell and F.H. Johnson. The influence of hydrostatic pressure on the growth
+and viability of terrestrial and marine bacteria. J. Bacteriol., 57:179, 1949. (Cité aux
+pages xviii et 19.)
diff --git a/examples/theses/smigaj.pdf b/examples/theses/smigaj.pdf
new file mode 100644
index 00000000..ffc823b1
Binary files /dev/null and b/examples/theses/smigaj.pdf differ
diff --git a/examples/theses/smigaj/fulltext.pdf b/examples/theses/smigaj/fulltext.pdf
new file mode 100644
index 00000000..ffc823b1
Binary files /dev/null and b/examples/theses/smigaj/fulltext.pdf differ
diff --git a/examples/theses/smigaj/fulltext.pdf.txt b/examples/theses/smigaj/fulltext.pdf.txt
new file mode 100644
index 00000000..53effdd9
--- /dev/null
+++ b/examples/theses/smigaj/fulltext.pdf.txt
@@ -0,0 +1,6257 @@
+Design and numerical modelling of integrated optical
+components
+Wojciech Śmigaj
+To cite this version:
+Wojciech Śmigaj. Design and numerical modelling of integrated optical components. Mathe-
+matical Physics. Université Paul Cézanne - Aix-Marseille III, 2010. English. <tel-00567213>
+HAL Id: tel-00567213
+https://tel.archives-ouvertes.fr/tel-00567213
+Submitted on 18 Feb 2011
+HAL is a multi-disciplinary open access archive for the deposit and dissemination of
+scientific research documents, whether they are published or not. The documents may come from
+teaching and research institutions in France or abroad, or from public or private research centers.
+L’archive ouverte pluridisciplinaire HAL, est destinée au dépôt et à la diffusion de documents
+scientifiques de niveau recherche, publiés ou non, émanant des établissements d’enseignement et de
+recherche français ou étrangers, des laboratoires publics ou privés.
+Thèse présentée à l’Université Paul Cézanne (Aix-Marseille III)
+pour obtenir le grade de docteur en sciences
+Conception et modélisation numérique
+de composants optiques en nanophotonique intégrée
+Design and numerical modelling
+of integrated optical components
+Wojciech ŚMIGAJ
+22 septembre 2010
+Laboratoire d’accueil Institut Fresnel, équipe CLARTE
+Formation doctorale physique théorique et mathématique
+Membres du jury
+Philippe LALANNE rapporteur
+Andrey A. FEDYANIN rapporteur
+Didier LIPPENS examinateur
+Maciej KRAWCZYK examinateur
+Mathias VANWOLLEGHEM examinateur
+Stefan ENOCH directeur de thèse
+Boris GRALAK tuteur de thèse
+
+Contents
+Acknowledgements 5
+Résumé en français 7
+1 Preliminaries 15
+1.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 15
+1.2 Outline of the thesis . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 16
+1.3 Notational conventions . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 17
+1.4 Maxwell’s equations . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 18
+2 Effective-medium model of photonic crystals 21
+2.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 21
+2.2 Definition of the effective parameters of photonic crystals . . . . . . . . . . . . . . . . . 22
+2.2.1 Preliminaries: the homogeneous-medium case . . . . . . . . . . . . . . . . . . 22
+2.2.2 Existing definitions . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 23
+2.2.3 Proposed definition . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 24
+2.3 Influence of symmetries on the effective parameters . . . . . . . . . . . . . . . . . . . . 27
+2.3.1 Real-valuedness . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 28
+2.3.2 Continuity and boundedness . . . . . . . . . . . . . . . . . . . . . . . . . . . . 28
+2.4 Examples . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 31
+2.4.1 Hexagonal lattice . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 31
+2.4.2 Square lattice . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 35
+2.4.3 Remarks . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 40
+2.5 Validity of the single-mode approximation . . . . . . . . . . . . . . . . . . . . . . . . . 40
+2.6 Conclusions . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 44
+3 Antireflection gratings for photonic crystals 45
+3.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 45
+3.2 Types of antireflection structures . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 45
+3.2.1 Antireflection structures for homogeneous media . . . . . . . . . . . . . . . . . 45
+3.2.2 Antireflection structures for photonic crystals . . . . . . . . . . . . . . . . . . . 46
+3.3 Design procedure . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 48
+3.4 Examples . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 53
+3.4.1 A photonic-crystal flat lens . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 53
+3.4.2 A supercollimating photonic crystal . . . . . . . . . . . . . . . . . . . . . . . . 59
+3.4.3 A photonic-crystal superprism . . . . . . . . . . . . . . . . . . . . . . . . . . . 62
+3.5 Conclusions . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 63
+3
+4 Contents
+4 Magneto-optical circulators 65
+4.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 65
+4.1.1 Basic characteristics of isolators and circulators . . . . . . . . . . . . . . . . . . 65
+4.1.2 Routes to nonreciprocity . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 66
+4.1.3 Experimental realisations of optical isolators and circulators . . . . . . . . . . . 67
+4.1.4 Outline of this chapter . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 72
+4.2 Extension of the coupled-wave model . . . . . . . . . . . . . . . . . . . . . . . . . . . 72
+4.2.1 Inclusion of direct coupling between waveguides . . . . . . . . . . . . . . . . . 72
+4.2.2 Inclusion of radiation loss . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 77
+4.3 Cavities with circular symmetry . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 79
+4.4 Photonic-crystal-based circulators . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 82
+4.5 Rib-waveguide-based circulators . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 90
+4.5.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 90
+4.5.2 Numerical calculations . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 92
+4.5.3 Geometry optimisation . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 97
+4.5.4 Fabrication . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 101
+4.6 Simulations of three-dimensional axisymmetric cavities . . . . . . . . . . . . . . . . . . 101
+4.6.1 Evaluation of possible three-dimensional geometries . . . . . . . . . . . . . . . 101
+4.6.2 Towards cavities with higher quality factor . . . . . . . . . . . . . . . . . . . . 105
+4.7 Conclusions and perspectives . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 111
+5 Numerical methods 115
+5.1 Multiple-scattering method for systems containing gyrotropic media . . . . . . . . . . . 115
+5.2 Calculation of photonic-crystal band structures with Fourier-Bessel expansions . . . . . 118
+5.2.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 118
+5.2.2 Formulation . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 119
+5.2.3 Numerical examples . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 123
+5.2.4 Conclusions . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 128
+5.3 Finite-element simulations of three-dimensional axisymmetric cavities . . . . . . . . . . 128
+5.3.1 Introduction . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 128
+5.3.2 Formulation . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 129
+5.3.3 Numerical implementation . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 137
+5.3.4 Evaluation of accuracy . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . 138
+6 Conclusions and perspectives 143
+Bibliography 145
+Acknowledgements
+I have been very privileged to have undoubtedly the most supportive, reliable and friendly advisor anyone
+could ask for, namely Boris Gralak. While not hesitating to offer his advice and share his experience, he
+let me enjoy a complete liberty in the pursuit of my scientific interests. I really appreciated his eye for
+detail, his striving for clarity and precision (even as I am writing these words, Boris is still hunting for
+the remaining mistakes in the French summary of this thesis), as well as his inextinguishable optimism.
+In addition to being a mentor, he became a friend. I thank him and Mylène for all the evenings we spent
+together. I am also indebted to Stefan Enoch, who agreed to act as the director of this thesis, in spite of
+his numerous responsibilities as the associate director of Institut Fresnel.
+My gratitude extends towards all the members of the CLARTE team in Institut Fresnel, who gave
+me a warm welcome upon my arrival to Marseille three years ago and have ensured an excellent work-
+ing environment ever since. Four persons deserve a special mention. Gérard Tayeb was always willing
+to share his experience in the development of computational methods. On various occasions, he took
+time to participate in rehearsals of my oral presentations, and his help and advice were invariably much
+appreciated. I was also fortunate to be able to collaborate with Daniel Maystre, whose profound un-
+derstanding of the mathematical foundations of numerical algorithms is unmatched by anyone I know.
+Sébastien Guenneau and Javier Romero-Vivas took active part in the development of magneto-optical
+circulators and performed numerous simulations that helped to optimise the devices. Besides, Javier and
+I shared the joys and sorrows of a foreigner in France (« C’est Marseille. . . »).
+This thesis owes also a lot to collaborations with several research groups from outside Marseille.
+The work on antireflection gratings for photonic crystals was done in collaboration with teams from
+Université de Lille I and Université de Bourgogne in Dijon. Maxence Hofman and Olivier Vanbésien
+from the DOME team in Université de Lille I manufactured samples of photonic-crystal flat lens covered
+with the antireflection gratings we had designed. Geoffroy Scherrer, Benoît Cluzel and Frédérique de
+Fornel from the OCP team in Université de Bourgogne performed the near-field characterisation of these
+samples. I would like to thank all of them for the interesting and fruitful meetings. Special thanks go to
+Olivier for giving us all a taste of the delicious Flemish cuisine. I am also indebted to Didier Lippens,
+director of the DOME team, for having accepted the invitation to act as a member of the examining board.
+I greatly enjoyed the collaboration with the members of the MMS team in Institut d’Électronique
+Fondamentale (IEF) in Orsay on magneto-optical circulators. I am particularly grateful to Mathias Van-
+wolleghem, who introduced me to the fascinating topic of non-reciprocity in optics, infecting me with his
+enthusiasm. Luba Magdenko and Béatrice Dagens devoted a lot of effort to the fabrication of prototypes
+of the circulators, gradually taming the etch-resistant bismuth-iron-garnet substrates. Luba also took part
+in the numerical modelling of the circulators. Always ready to ask inconvenient questions and to point
+out the experimental constraints, she was fun to work with. Thanks are due to the whole team for the
+innumerable discussions and e-mail interchanges we have had, as well as for inviting Boris and me to
+spend a month at IEF.
+I am no less indebted to Maciej Krawczyk from Adam Mickiewicz University in Poznań, the advisor
+for my Master’s thesis, who has also agreed to be a member of the examination board. Thanks to
+5
+6 Acknowledgements
+Maciej I have been able to keep in touch with my alma mater. I am grateful for his continuous support
+and for his genuine interest in the progress of my research. I am also indebted to Henryk Puszkarski,
+director of the Surface Physics Division in Poznań, for his willingness to share his experience and advice.
+I particularly want to thank all the members of Prof. Puszkarski’s group for the warm welcome they gave
+me whenever I came back to Poznań.
+I would like to extend my sincere gratitude to Philippe Lalanne from Institut d’Optique in Palaiseau
+and to Andrey A. Fedyanin from Lomonosov Moscow State University for accepting to write reviews of
+this thesis. I also acknowledge the French Ministry of Higher Education and Research for providing its
+funding.
+Finally, I would like to thank all my friends and my family, whose presence has been absolutely
+invaluable during these three years. I am deeply grateful to my parents and sister for their continuing
+support, kindness and love. My fellow Ph.D. students from the CLARTE and HIPE teams in Institut Fres-
+nel, Alexis, Fabien, Raphaël P., Raphaël L., Mohamed, Xiaoyun, Frédéric, Muamer and Guillaume con-
+tributed to making the lab the great place it was. My special thanks go to all the members of Aumônerie
+Jer’aum,∗ who made me feel at home in Marseille. I will miss you much when I leave! Lastly, I want to
+thank all of my Polish friends, especially Kasia, Małgosia, Milena, Alicja, Marcin, Jacek, Wawrzyniec
+and Karol.
+Wojciech Śmigaj, Marseille, 1 September 2010
+∗ Jean Pol and Jean, Louis and Paul, Jules Hervé and Estelle, Jeannette, Alexandra, Lucie, Marion, Alexis, Frédéric, Césaire,
+Romuald, Matthieu, Descartes, Jean-François and Yen, Rakia, Chinh, Olga, Damien, Jean-Marie, Charles and Yvri, Katell,
+Randy, Thibault, Priscilla, Melissa. . .
+Résumé en français
+Contexte historique
+L’aube de la seconde moitié du XXème siècle a été marquée par l’invention des circuits électroniques
+intégrés fabriqués dans des couches minces semiconductrices. En raison de leur faible coût et de leur
+petite taille, les circuits intégrés ont rapidement presque supplanté les « gros » composants électroniques :
+les bobines, les tubes électroniques etc. Ils ont fourni les moyens de la révolution technologique qui a
+fait des appareils électroniques compacts une partie intégrante de la vie moderne.
+Peu de temps après la première démonstration expérimentale du laser en 1960, le concept des cir-
+cuits optiques intégrés est apparu. Par analogie avec leurs homologues électroniques, ils devaient ouvrir
+la voie à la miniaturisation des dispositifs optiques. Depuis la découverte du laser, des progrès signifi-
+catifs ont été accomplis : de nombreux composants photoniques intégrés, tels que coupleurs, filtres ou
+multiplexeurs, sont couramment utilisés dans les dispositifs disponibles dans le commerce. Toutefois,
+il faut admettre que le développement de la technologie des circuits optiques intégrés a été beaucoup
+plus lent que celui des circuits électroniques. Pour preuve, si les processeurs modernes contiennent des
+millions de transistors sur une seule puce, les circuits intégrés optiques les plus complexes réalisés à ce
+jour se composent d’à peine quelques centaines de composants [1–4].
+Il semble y avoir deux raisons principales à cette différence. Premièrement, la longueur d’onde de
+la lumière aux fréquences de télécommunications, qui est de l’ordre de 0.1–1 µm dans des matériaux
+diélectriques typiques, est beaucoup plus grande que la longueur de l’onde de Broglie d’un électron au
+niveau de Fermi d’un métal classique, 0.1–1 nm [5, p. 120]. Celle-ci est si petite que, jusqu’à récemment,
+les propriétés ondulatoires des électrons pouvaient être quasiment ignorées dans la conception de com-
+posants électroniques, qui pouvaient donc être miniaturisés sans encombre. Au contraire, la longueur
+d’onde de la lumière constitue une vraie limite de la taille des composants optiques.∗ Deuxièmement,
+pour des applications diverses, il est avantageux d’utiliser des substrats avec des propriétés physiques
+particulières, présentant par exemple d’importants effets électro-, magnéto- ou acousto-optiques. Étant
+donné que ces propriétés sont difficiles à obtenir simultanément dans un seul matériau, les premiers
+circuits optiques intégrés ont été construits de la façon dite hybride, où tous les composants sont fabri-
+qués séparément en utilisant des matériaux et technologies différents avant d’être assemblés sur un seul
+substrat [7, p. 9]. Avec cette approche, chaque composant peut être optimisé séparément ; par contre,
+l’alignement et le couplage des différents éléments constituent une difficulté de taille. Ainsi, les circuits
+optiques intégrés hybrides ne comportent pas plus que quelques composants. Les circuits intégrés les
+plus complexes sont donc fabriqués de façon monolithique, où tout le système est gravé dans un seul
+substrat. Actuellement, la technologie de ce type la plus avancée est certainement celle qui est fondée sur
+le phosphure d’indium.
+L’introduction de la notion de cristaux photoniques à la fin des années 1980 [8, 9] a profondément
+influencé la recherche sur les circuits optiques intégrés. Le cristal photonique est défini comme un sys-
+∗ Les composants plasmoniques, qui constituent actuellement le sujet de recherches actives, pourraient néanmoins permettre
+d’aller plus loin dans la miniaturisation des dispositifs optiques [6].
+7
+8 Résumé en français
+tème dans lequel la permittivité et la perméabilité dépendent périodiquement de la variable d’espace :
+ainsi, il peut être considéré comme un analogue électromagnétique d’un solide cristallin. La périodi-
+cité de la permittivité et de la perméabilité peut donner lieu à des « gaps », c’est-à-dire, des bandes de
+fréquences où aucun état propagatif (transportant de l’énergie) n’existe à l’intérieur du cristal. Rapide-
+ment, pour des fréquences situées dans un gap, des défauts linéaires le long desquels des modes localisés
+peuvent se propager ont été imaginés dans des cristaux photoniques ; de tels défauts peuvent donc ser-
+vir de guides d’onde [10]. En même temps, on a démontré que les défauts ponctuels dans les cristaux
+photoniques peuvent se comporter comme des résonateurs avec la valeur du ratio entre le facteur de
+qualité et le volume du mode potentiellement très importante [10]. Toutefois, c’est une autre découverte
+qui va révéler l’énorme intérêt envers les cristaux photoniques en tant que moyen de miniaturiser les
+circuits optiques intégrés : les modes de guides d’onde à cristaux photoniques peuvent se propager le
+long des coudes pratiquement sans pertes d’énergie [11]. En effet, les rayons de courbure des guides
+d’onde standards doivent être de l’ordre de quelques millimètres afin de maintenir les pertes à un niveau
+raisonnable [10]. En revanche, les guides à cristaux photoniques peuvent avoir des coudes avec un rayon
+de courbure d’environ un micromètre. Jusqu’ici, de nombreux dispositifs optiques basés sur les guides
+d’onde et résonateurs à cristaux photoniques ont été proposés, et plusieurs d’entre eux ont été réalisés
+expérimentalement. Pour une revue relativement récente de l’état actuel de la recherche sur les cristaux
+photoniques, le lecteur peut consulter la référence 12.
+Alors que les premières études de cristaux photoniques ont porté principalement sur la recherche de
+structures fournissant le gap le plus large et sur la conception de composants fonctionnant dans le gap,
+la dernière décennie a vu la communauté porter une attention croissante aux propriétés inhabituelles des
+cristaux photoniques en dehors des gaps. Contrairement aux diélectriques homogènes, dont la surface
+d’isofréquence est une ellipsoïde, la forme de la surface d’isofréquence des cristaux photoniques peut
+être très compliquée.∗ En outre, la vitesse de groupe dans un cristal photonique peut être orientée dans
+n’importe quelle direction. Cette richesse de la relation de dispersion donne lieu à des phénomènes
+inhabituels [13], comme la réfraction négative de la lumière [14], l’apparition de faisceaux autocollimatés
+[15] ou l’effet « superprism » [16]. Ainsi, il a été reconnu que même les cristaux photoniques sans défauts
+(la présence de surfaces exceptée) peuvent constituer des dispositifs utiles, par exemple des lentilles
+planes [17, 18] ou des diviseurs de faisceau [19].
+Structure de la thèse
+Cette thèse est consacrée à la conception et l’analyse théorique et numérique de certains composants
+en cristaux photoniques. Dans le chapitre 1, nous donnons une brève introduction à la thématique de la
+thèse, nous définissons les notations utilisées dans la suite, et nous rappelons quelques faits de base sur
+les équations de Maxwell, fondement de tous les développements ultérieurs. L’essence de la thèse, les
+chapitres 2 à 5, se divise naturellement en trois parties distinctes. Dans les chapitres 2 et 3, nous étudions
+les cristaux photoniques bidimensionnels sans défauts, limités par une ou deux surfaces planes parallèles.
+En particulier, nous nous intéressons à la dépendance des propriétés de tels cristaux à l’égard de la
+structure des interfaces les séparant des milieux homogènes. Dans le chapitre 4, qui constitue la deuxième
+partie essentielle de cette thèse, nous tournons notre attention vers un type de composants optiques plus
+traditionnels, puisque basés sur les guides d’onde : les circulateurs magnéto-optiques. La troisième partie
+de la thèse, le chapitre 5, est consacrée à la présentation de quelques méthodes numériques développées
+pour les simulations des dispositifs analysés dans les chapitres précédents. La thèse se termine par le
+chapitre 6, dans lequel nous mettons en évidence les résultats qui nous semblent les plus importants
+∗ On observe la même chose dans la théorie de l’état solide : la surface de Fermi dans un gaz d’électrons libres est sphérique,
+mais dans un solide réel, elle a souvent une forme très complexe, parfois appelée, judicieusement, un monstre.
+Chapitre 2 : Modèle du milieu effectif pour les cristaux photoniques 9
+et nous indiquons les perspectives des futurs travaux sur certains sujets. Ci-dessous nous résumons le
+contenu des chapitres qui constituent le corps de la thèse.
+Chapitre 2 : Modèle du milieu effectif pour les cristaux photoniques
+Comme mentionné ci-dessus, une caractéristique essentielle des cristaux photoniques réside dans la ri-
+chesse de leur relation de dispersion. La forme des surfaces d’isofréquence des cristaux photoniques
+peut être très complexe : elles contiennent parfois des changements de direction brutaux séparant des ré-
+gions planes ou même concaves. Toutefois, à certaines fréquences, elles peuvent également atteindre une
+forme ellipsoïdale, caractéristique pour des milieux homogènes. En conséquence, la question se pose si
+les cristaux peuvent alors être correctement décrits par le modèle du milieu effectif, dans lequel ils sont
+représentés par un matériau homogène avec une certaine permittivité $\varepsilon$ et perméabilité $\mu$. Comme les
+matériaux homogènes sont incomparablement plus faciles à analyser que les matériaux structurés, une
+réponse affirmative simplifierait le développement de dispositifs à cristaux photoniques, en particulier de
+ceux qui utilisent l’effet de la réfraction négative [14]. En effet, la plupart des composants basés sur ce
+phénomène, comme les célèbres superlentilles [17], ont été conçus pour des matériaux à indice négatif
+homogènes imaginés par Veselago [20].
+De nombreux documents traitant de ce sujet ont déjà été publiés [21–32], donnant lieu à plusieurs
+définitions des paramètres effectifs des cristaux photoniques, reportées au paragraphe 2.2.2. Cependant,
+ces définitions sont généralement introduites de façon heuristique et manquent de justification formelle.
+En outre, pour toutes ces définitions, la confrontation du coefficient de réflexion du cristal calculé rigou-
+reusement avec celui du milieu effectif correspondant n’a jusqu’alors été effectuée que pour l’incidence
+normale [24–26] ou quasi-normale [28]. Pourtant, de nombreuses applications, y compris celles utilisant
+la réfraction négative, s’appuient sur le comportement des ondes incidentes aux grands angles, voire des
+ondes évanescentes. Le domaine de validité de l’approximation du milieu effectif est, par conséquent,
+encore mal connu.
+L’objectif du travail présenté dans le chapitre 2 est de remédier à ces lacunes. Dans la section 2.2,
+nous adoptons l’hypothèse de l’approximation monomode pour fournir une justification mathématique
+rigoureuse à une certaine définition des paramètres effectifs des cristaux photoniques bidimensionnels.
+Dans la section 2.3, nous étudions l’influence de la symétrie du plan de troncature du cristal et celle des
+modes propres du cristal sur le comportement de ses paramètres effectifs. En particulier, nous dérivons
+les conditions dans lesquelles les paramètres effectifs sont réels et bornés pour tous les angles d’inci-
+dence. Nous généralisons ainsi le résultat obtenu par Pierre et Gralak [27] dans le cas unidimensionnel.
+Pour évaluer la précision du modèle du milieu effectif, nous comparons dans la section 2.4 les valeurs
+du coefficient de la réflexion spéculaire prévu dans le cadre du modèle avec les résultats des calculs
+numériques rigoureux. Ces tests, effectués pour deux cristaux différents à un nombre de fréquences et
+dans tout le domaine d’angle d’incidence, indiquent que la précision du modèle est limitée par celle de
+l’hypothèse de départ, l’approximation monomode.
+Ces résultats ont imposé d’analyser de façon précise le domaine de validité de l’approximation mo-
+nomode. Dans la section 2.5, nous établissons un lien entre les amplitudes relatives d’excitation des
+modes propres d’un cristal et le spectre de Fourier des champs électrique et magnétique de ces modes sur
+le plan de troncature du cristal. Ce lien est utilisé pour formuler un critère d’estimation de la précision de
+l’approximation monomode : cette hypothèse est d’autant plus pertinente que la courbe d’isofréquence
+du cristal photonique se rapproche de celle du milieu homogène avec l’indice de réfraction égal à la
+moyenne de l’indice de réfraction du cristal. Enfin, nous considérons le cas particulier des modes en-
+gendrant la réfraction négative. Nous observons que leur excitation par une onde plane est accompagnée
+pour la plupart des angles d’incidence par une excitation simultanée d’autres modes (évanescents) avec
+10 Résumé en français
+une amplitude importante. Dans ce cas, l’approximation monomode d’un cristal photonique présentant
+le phénomène de réfraction négative ne peut être considérée comme (relativement) précise que près de
+l’incidence normale. Notre analyse montre qu’il est hasardeux de traiter un tel cristal photonique comme
+un matériau homogène pour des angles d’incidence importants ou dans le régime d’ondes évanescentes.
+Finalement, le comportement de systèmes contenant des matériaux d’indice négatif homogènes peut
+s’avérer considérablement différent lorsque ces matériaux sont remplacés par des cristaux photoniques,
+même si les courbes d’isofréquence (et, par conséquent, les indices de réfraction définis par l’intermé-
+diaire de la vitesse de phase) des deux milieux sont identiques.
+Chapitre 3 : Réseaux antiréfléchissants pour des cristaux photoniques
+Les courbes du coefficient de réflexion des cristaux photoniques étudiés dans le chapitre 2 (figures 2.5,
+2.7, 2.10, 2.12 et 2.13) montrent que des ondes réfléchies d’amplitude importante sont souvent générées
+sur la surface des cristaux photoniques. Dans de nombreuses applications, il est au contraire souhaitable
+d’obtenir un transfert d’énergie parfait entre l’onde plane incidente et le mode propre propagatif du cristal
+photonique (ou, plus rarement, plusieurs modes propagatifs). Les ondes réfléchies de caractère propa-
+gatif doivent donc être éliminées. Le chapitre 3 concerne la conception de structures antiréfléchissantes
+qui, placées sur la surface d’un cristal photonique, diminuent significativement la fraction d’énergie per-
+due dans les ondes réfléchies. Après avoir examiné les classes de telles structures proposées à ce jour
+(section 3.2), dans la section 3.3, nous proposons une nouvelle méthode de conception de réseaux anti-
+réfléchissants avec une tolérance angulaire importante.
+L’algorithme de conception que nous proposons consiste en trois étapes. Premièrement, les para-
+mètres d’une couche homogène antiréfléchissante sont calculés à partir d’un modèle du milieu effectif
+du cristal photonique en question. Deuxièmement, une théorie analytique du milieu effectif des réseaux
+lamellaires binaires est utilisée pour trouver les paramètres d’un réseau composé des seuls matériaux
+constitutifs du cristal, et dont les propriétés sont proches de celles de la couche obtenue à l’étape pré-
+cédente. Troisièmement, la forme de la grille est raffinée à l’aide d’une routine numérique de recherche
+locale qui vise à minimiser la réflectance moyenne de la structure dans la gamme désirée d’angle ou de
+la fréquence. Cette dernière étape est nécessaire en raison des approximations faites dans les dérivations
+analytiques utilisées dans les deux premières étapes de la procédure.
+Dans la section 3.4, nous appliquons la méthode proposée à trois cristaux dont les courbes d’iso-
+fréquence sont de courbure différente : un cristal présentant le phénomène d’autocollimation, avec une
+courbe isofréquence très plate ; un cristal présentant l’effet de réfraction négative, avec une courbe d’iso-
+fréquence presque circulaire ; et un cristal photonique du type « superprism », dont la courbe isofréquence
+a des cornes. Dans les deux premiers cas, nous réussissons à concevoir des réseaux antiréfléchissants ga-
+rantissant une réflectance très faible dans une vaste gamme angulaire. Les structures obtenues sont très
+compactes et paraissent simples à fabriquer ; en fait, l’amélioration apportée par ces réseaux antiréflé-
+chissants à la transmission à travers une lentille plate de cristal photonique (basée sur l’effet de réfrac-
+tion négative) a déjà été confirmée expérimentalement [33]. Cependant, dans le cas du cristal du type
+« superprism », la procédure de conception échoue à cause de la violation de certaines contraintes sur
+l’impédance effective du cristal, qui doivent être remplies pour que la couche antiréfléchissante géné-
+rée dans la première étape puisse être approchée par un réseau binaire constitué de matériaux réalistes.
+L’existence de ces contraintes est la limitation principale de la procédure présentée.
+Chapitre 4 : Circulateurs magnéto-optiques 11
+Chapitre 4 : Circulateurs magnéto-optiques
+Dans le chapitre 4, nous étudions le problème de la miniaturisation des circulateurs optiques, qui ap-
+partiennent aux derniers composants optiques intégrés importants dont la version intégrée ne soit pas
+encore disponible dans le commerce. Le circulateur est un dispositif reliant $n \geq 3$ guides d’onde de telle
+sorte que l’énergie entrant par le guide $W_i$ ($1 \leq i < n$) est entièrement transférée au guide $W_{i+1}$ et
+l’énergie entrant par le guide $W_n$ est transférée au guide $W_1$. Un dispositif apparenté, l’isolateur, relie
+deux guides d’onde de telle sorte que le transfert d’énergie soit interdit dans un sens, mais autorisé dans l’autre.
+Manifestement, le circulateur peut également faire fonction d’isolateur.
+Ces deux composants ont plusieurs applications importantes. Ils peuvent servir à éliminer les ondes
+réfléchies des composants d’impédance mal adaptée dans des circuits complexes ; la présence de telles
+ondes peut donner lieu à des interférences indésirables et couplages parasites [34]. Les composants en
+question sont également employés dans l’acheminement des signaux dans des dispositifs tels que les
+multiplexeurs [35]. Dans le domaine optique, l’application la plus importante des isolateurs est sans
+doute la protection des lasers de la lumière réfléchie, qui perturbe la configuration des ondes stationnaires
+dans une cavité laser et peut entraîner le laser à devenir instable [36].
+Les circulateurs et les isolateurs sont dits des dispositifs non-réciproques. Cela signifie, en particu-
+lier, qu’ils ne peuvent pas être réalisés en utilisant uniquement des matériaux linéaires, invariants dans le
+temps et dont la permittivité et la perméabilité s’expriment par des tenseurs symétriques. La façon la plus
+commune d’obtenir un système non-réciproque est d’y inclure un matériau présentant l’effet magnéto-
+optique : par exemple, un grenat synthétique tel que le grenat de fer et bismuth. Traditionnellement, les
+isolateurs sont constitués d’une plaque d’un matériau magnéto-optique placée entre deux polariseurs, P1
+et P2, tournés de 45° l’un par rapport à l’autre. Le fonctionnement d’un tel isolateur s’appuie sur l’effet
+de Faraday, qui consiste en une rotation non-réciproque du plan de polarisation des ondes électromagné-
+tiques traversant un matériau magnéto-optique dans la direction parallèle à celle d’un champ magnétique
+statique externe. Grâce à cet effet, le plan de polarisation des ondes qui entrent dans l’isolateur par le
+polariseur P1 (par exemple) s’aligne progressivement avec l’axe du polariseur P2 ; par conséquent, ces
+ondes sont transmises à travers le dispositif. En revanche, le plan de polarisation des ondes entrant par le
+polariseur P2 devient perpendiculaire à l’axe du polariseur P1, par lequel elles sont donc absorbées.
+Malheureusement, en raison de leur structure non plane, les isolateurs décrits ci-dessus ne peuvent
+être produits comme éléments d’un circuit optique intégré. En conséquence, dans les deux dernières
+décennies, beaucoup d’efforts ont été faits pour concevoir des isolateurs et des circulateurs adaptés à la
+fabrication sur puce (voir la référence 35 pour une revue de la littérature). Le fonctionnement de la plupart
+des dispositifs proposés jusqu’à présent est basé sur la conversion non-réciproque des modes propres d’un
+guide d’onde (un phénomène analogue à l’effet de Faraday) ou sur l’interférence des ondes se propageant
+dans deux ou plusieurs guides d’onde placés dans un champ magnétique statique externe. Cependant,
+l’effet magnéto-optique est généralement faible : il ne peut influencer sensiblement le comportement
+de la lumière que si celle-ci interagit avec un matériau magnéto-optique sur un chemin optique très
+long, typiquement $\sim 1000\lambda$, où $\lambda$ est la longueur d’onde de la lumière. En conséquence, les isolateurs et
+circulateurs basés sur des guides d’onde sont très longs ($\sim 1$ mm), ce qui rend difficile leur intégration
+avec d’autres composants optiques fondamentaux, beaucoup plus petits.
+Une stratégie de miniaturisation potentielle consiste à employer des résonateurs optiques pour allon-
+ger le temps de l’interaction de la lumière avec le matériau magnéto-optique, au prix d’une réduction de la
+bande passante du composant. En 2005, Wang et Fan [34, 37] ont proposé un circulateur magnéto-optique
+inspiré d’une classe de dispositifs couramment utilisés dans le domaine micro-ondes, où, cependant, les
+effets induits par un champ magnétique statique externe sont beaucoup plus importants. Le circulateur
+de Wang et Fan se compose de trois guides d’onde à cristal photonique couplés à une cavité à cristal
+12 Résumé en français
+photonique dans laquelle deux modes propres bien localisés peuvent être excités. Leurs fréquences sont
+décalées l’une par rapport à l’autre en présence d’un champ magnétique statique externe, la matrice du
+cristal photonique étant d’un matériau magnéto-optique. En utilisant le formalisme du couplage faible,
+on peut montrer qu’un tel système fonctionne comme un circulateur.
+Il faut noter, cependant, que la séparation des fréquences des deux modes de la cavité originale pré-
+sentée dans les références 34 et 37 est négligeable dans un champ magnétique statique externe uniforme.
+Elle ne devient acceptable que si le matériau magnéto-optique dans la cavité est divisé dans de nombreux
+domaines magnétiques polarisés dans les sens contraires, chacun d’une superficie d’une fraction de µm².
+La réalisation de tels domaines est, en pratique, très difficile technologiquement, car elle nécessite un
+contrôle précis – à l’échelle nanométrique – du champ magnétique statique externe appliqué. Pour cette
+raison, le dispositif conçu par Wang et Fan n’a jamais été fabriqué. L’objectif de la recherche présentée
+dans le chapitre 4 était d’élaborer la conception d’un circulateur s’appuyant sur un résonateur magnéto-
+optique et capable de fonctionner dans un champ magnétique statique externe uniforme, c’est-à-dire,
+avec tout le matériau magnéto-optique aimanté uniformément.
+Nous commençons par étudier comment la géométrie d’une cavité magnéto-optique bidimension-
+nelle placée dans un champ magnétique statique externe influence le décalage des fréquences de ses
+deux modes propres (section 4.3). Afin de mieux comprendre le problème, nous nous concentrons sur
+le modèle simplifié d’une cavité axisymétrique, c’est-à-dire composée d’une série d’anneaux concen-
+triques. De telles structures peuvent être traitées analytiquement ; en particulier, nous sommes en mesure
+de montrer que le décalage maximal des fréquences dans un champ magnétique statique externe uni-
+forme est obtenu pour des cavités ayant la forme d’un miroir de Bragg annulaire. Nous obtenons ainsi
+une procédure explicite pour la conception de cavités axisymétriques optimisées pour le fonctionnement
+dans un champ magnétique statique externe uniforme, ce qui constitue le fondement de cette étude.
+L’étape suivante de la conception du circulateur est de coupler efficacement la cavité avec les guides
+d’onde d’entrée et de sortie. Dans les sections 4.4 et 4.5, deux classes de structures sont examinées :
+les circulateurs à base de cristaux photoniques, semblables à ceux étudiés dans les références 34 et 37,
+et les circulateurs dans lesquels le revêtement à cristal photonique est supprimé et la cavité est couplée
+directement à des guides d’onde standards. Cette élimination du cristal photonique conduit à une simpli-
+fication importante de la géométrie du dispositif. Néanmoins, l’analyse théorique de son fonctionnement
+devient un peu plus compliquée, car on doit tenir compte des effets du couplage direct entre les guides
+d’onde et des pertes d’énergie par le rayonnement dans le plan du dispositif, comme il est décrit dans la
+section 4.2. Les performances des deux catégories de circulateurs sont évaluées à l’aide de simulations
+numériques rigoureuses. Nous concluons que la simplification de géométrie résultant de l’élimination du
+cristal photonique ne doit pas être accompagnée d’une détérioration de la performance du composant.
+Par conséquent, dans la suite du chapitre 4 nous nous concentrons sur les circulateurs avec des guides
+standards, c’est-à-dire sans cristaux photoniques.
+A ce stade, il convient de résumer les résultats des tests expérimentaux de nos circulateurs, fabriqués
+et caractérisés par L. Magdenko et B. Dagens (Institut d’Electronique Fondamentale, Orsay, France) dans
+des hétérostructures composées des grenats de bismuth et fer et de gadolinium et gallium. Ces résultats
+révèlent un problème significatif dans la conception originale des cavités : des pertes d’énergie impor-
+tantes par rayonnement hors plan du dispositif. Elles sont une conséquence du fait que la conception
+n’était originellement basée que sur des simulations bidimensionnelles (l’approximation d’indice effec-
+tif utilisée dans certaines des simulations s’est avérée ne pas avoir été assez précise). C’est pourquoi, dans
+la dernière partie du chapitre 4, nous présentons les premiers résultats des simulations tridimensionnelles
+des cavités, obtenus avec la méthode des éléments finis décrite dans la section 5.3. Nous démontrons
+que le problème des pertes hors-plan peut être surmonté par un ajustement approprié de la géométrie de
+la cavité. Plus précisément, le facteur de qualité des modes propres peut être sensiblement amélioré en
+Chapitre 5 : Méthodes numériques 13
+recouvrant la cavité avec un matériau ayant un indice de réfraction proche de celui du substrat et par
+l’optimisation numérique des positions et des largeurs des anneaux constitutifs de la cavité. A ce jour,
+ce raffinement de la conception basé sur des simulations tridimensionnelles demande à être confirmé
+expérimentalement.
+Chapitre 5 : Méthodes numériques
+Dans le chapitre 5, nous présentons les méthodes de calcul développées au cours de cette thèse et utilisées
+pour obtenir une partie des résultats présentés dans l’ensemble des chapitres.
+La section 5.1 est consacrée à la méthode de diffusion multiple [38–40] pour la solution du problème
+de la diffusion de lumière par des cristaux photoniques bidimensionnels composés de cylindres circu-
+laires. Cette technique est reconnue depuis longtemps comme l’une des méthodes les plus efficaces pour
+traiter ce type de problèmes. La raison en est double. D’une part, les fonctions de base utilisées pour
+développer le champ électromagnétique (à savoir les séries de Fourier-Bessel) sont des solutions exactes
+des équations de Maxwell, et donc elles sont bien adaptées pour représenter le champ électromagnétique
+en présence de ces domaines. Deuxièmement, comme les fonctions de base sont séparables en coordon-
+nées polaires, les conditions de continuité satisfaites par le champ électromagnétique sur les surfaces
+des cylindres sont simples à exprimer et imposer. Dans la section 5.1, nous montrons que la méthode
+en question peut être généralisée aisément au cas des cristaux photoniques contenant des milieux gyro-
+tropiques qui respectent la même symétrie axiale que les tiges circulaires [les tenseurs de permittivité et
+perméabilité ont alors la forme donnée par l’équation (5.5)]. Nous notons, toutefois, qu’une extension
+similaire pour le cas des matériaux avec une anisotropie plus générale n’est pas possible, car la réduction
+des équations de Maxwell à l’équation de Helmholtz n’est alors possible qu’au prix d’un changement de
+coordonnées transformant des cercles en des ellipses, ce qui engendre des effets secondaires indésirables.
+Compte tenu de l’efficacité et la simplicité de la méthode de diffusion multiple, cette méthode a été
+également appliquée au calcul de la relation de dispersion des cristaux photoniques infinis composés
+de cylindres ou de sphères [41–47]. Elle nécessite, pourtant, de calculer explicitement le champ produit
+par un nombre infini de diffuseurs disposés sur un réseau périodique. Ce champ peut être exprimé par
+une série dite « lattice sum ». Malheureusement, de telles séries sont lentement convergentes, et les
+techniques particulières nécessaires pour l’accélération de leur calcul compliquent considérablement la
+mise en œuvre de la méthode par rapport au cas d’un système fini.
+Dans la section 5.2, nous proposons une technique élégante de calcul de la relation de dispersion des
+cristaux photoniques composés de cylindres circulaires. Comme la méthode de diffusion multiple, elle
+s’appuie sur le développement du champ électromagnétique sur des solutions exactes des équations de
+Maxwell (les séries de Fourier-Bessel), avec l’avantage d’éviter le calcul des « lattice sums ». L’idée de
+base est très simple : le champ dans une maille d’un cristal photonique est développé sur des solutions
+particulières de l’équation de Helmholtz, et les conditions de Bloch sur les limites de la maille sont im-
+posées par collocation. Cette approche est en fait similaire à la technique utilisée dans les simulations
+de réseaux avec la méthode de sources fictives afin d’éviter le calcul des fonctions de Green périodiques
+[48]. La méthode proposée ici partage également de nombreuses caractéristiques avec la technique des
+opérateurs de Dirichlet-Neumann, mise au point dans le groupe de Lu [49, 50]. Par rapport à cette tech-
+nique, la présente méthode est plus directe et plus efficace, mais aussi moins générale (spécialement
+adaptée aux calculs de la relation de dispersion).
+La principale vertu de la méthode que nous proposons est sa grande efficacité : en raison de la
+convergence exponentielle des résultats, il est possible d’atteindre une précision relative meilleure que
+$10^{-10}$ avec un coût de calcul modeste, comme il est démontré dans plusieurs exemples étudiés dans le
+paragraphe 5.2.3. Par conséquent, la technique en question peut fournir des valeurs de référence extrê-
+14 Résumé en français
+mement précises aux fins des tests d’autres méthodes numériques. La haute précision est aussi précieuse
+dans les études avec des effets faibles, tels que la non-réciprocité entraînée par l’influence d’un champ
+magnétique statique sur la propagation des ondes aux fréquences optiques.
+Pour les cristaux photoniques dont la maille ne contient qu’une seule inclusion circulaire, la mise
+en œuvre de cette méthode est directe. Cependant, si plusieurs inclusions sont présentes, la maille doit
+être décomposée en sous-mailles englobant les inclusions individuelles, ce qui complique à un certain
+degré la mise en œuvre de la méthode. Les inconvénients principaux de la technique en question sont
+(1) sa restriction à des systèmes contenant des inclusions circulaires et (2) la dégradation visible de sa
+précision en présence de sous-mailles dont la forme diffère nettement de celle d’un cercle centré sur
+l’inclusion.
+Dans la section 5.3, nous décrivons une variante de la méthode des éléments finis utilisée pour cal-
+culer les modes propres de cavités axisymétriques tridimensionnelles ouvertes, contenant des matériaux
+gyrotropiques. Cette technique a été employée pour obtenir les résultats présentés dans la section 4.6.
+Elle combine des éléments de plusieurs approches décrites dans la littérature, en particulier celles pré-
+sentées dans les références 51 et 52. L’apport original de ce travail consiste en l’extension de la méthode
+au cas des systèmes contenant des milieux gyrotropiques. Jusqu’à présent, elle n’avait été formulée que
+pour des matériaux avec des permittivité et perméabilité représentées par des tenseurs diagonaux, ce qui
+est le niveau de généralité nécessaire pour la modélisation des couches absorbantes parfaitement adaptées
+(PMLs) [51, 53, 54].
+Nous donnons ici une caractérisation concise de la méthode décrite dans la section 5.3. Nous pro-
+fitons d’abord de la symétrie axiale du domaine tridimensionnel en réduisant le problème original à
+un système dénombrable des problèmes propres découplés, posés sur un seul plan méridien (bidimen-
+sionnel). Nous utilisons des éléments finis nodaux scalaires pour développer la composante azimutale
+du champ électrique, et des éléments finis vectoriels pour développer une superposition particulière des
+composantes azimutale et méridienne de ce champ. Ce choix d’inconnues permet d’exprimer simple-
+ment les conditions de continuité sur l’axe de la cavité. Afin de supprimer les réflexions parasites sur les
+limites du domaine de calcul, nous les revêtons de PMLs. La mise en œuvre de la méthode est facilitée
+par la disponibilité de plusieurs outils d’open source, en particulier les bibliothèques Hermes (éléments
+finis) [55, 56] et SLEPc [57–59] (solution des problèmes aux valeurs propres avec des matrices creuses).
+Les tests de convergence présentés dans le paragraphe 5.3.4 montrent que la fréquence propre des
+modes localisés d’une cavité magnéto-optique typique conçue de la manière décrite dans la section 4.6
+peut être déterminée avec une précision relative de $10^{-5}$ dans un délai raisonnable sur un ordinateur de
+bureau. Nous montrons également que les résultats sont très peu sensibles aux changements des para-
+mètres qui contrôlent la troncature du domaine.
+Chapter 1
+Preliminaries
+1.1 Introduction
+The dawn of the second half of the 20th century was marked by the invention of electronic integrated cir-
+cuits (ICs) fabricated in semiconductor thin films. Owing to their low cost and small size, ICs quickly all
+but displaced older “bulk” electronic components: coils, glass tubes and so on. They provided the means
+for the technological revolution that made compact electronic devices an integral part of modern life.
+Shortly after the first experimental demonstration of the laser in 1960, the concept of optical ICs
+appeared. In analogy to their electronic counterparts, they were to pave the way to the miniaturisation
+of optical devices. Significant progress has been made from that time: numerous integrated photonic
+components, such as splitters, couplers or multiplexers, are routinely used in commercially available
+devices. However, it must be admitted that the development of the optical IC technology has been
+incomparably slower than that of electronic ICs. Suffice it to say that while state-of-the-art processors
+contain millions of transistors on a single chip, the most complex optical ICs realised to date consist of
+barely several hundred components [1–4].
+There seem to be two principal reasons for this difference. First, the wavelength of light at telecom-
+munication frequencies, which is on the order of 0.1–1 µm in typical dielectric materials, is much larger
+than the de Broglie wavelength of an electron at the Fermi level of a typical metal, 0.1–1 nm [5, p. 120].
+The latter is so small that until recently the wave-like properties of electrons could be essentially ignored
+in the design of electronic components, which could therefore be rather straightforwardly miniaturised.
+In contrast, the wavelength of light is a real limit on the size of optical components.* Second, for specific
+applications it is advantageous to use substrates having particular physical properties, for example ex-
+hibiting strong electro-, magneto- or acousto-optical effects. Since these properties are difficult to obtain
+simultaneously in a single material, the first optical ICs were built with the so-called hybrid approach:
+their individual components were fabricated separately, possibly using different materials and technolo-
+gies, and then bonded together to a single substrate [7, p. 9]. The advantage of this approach is that each
+component can be optimised separately; the disadvantage lies in the inherent difficulty of aligning and
+coupling the various elements. Thus, hybrid optical ICs hardly ever consist of more than a few compo-
+nents. ICs of larger complexity can only be fabricated using the monolithic approach, where the whole
+system is etched in a single substrate. Currently, the most advanced technology of this type seems to be
+that based on indium phosphide.
+A boost to the research on optical ICs was given by the introduction of the concept of photonic
+crystals (PCs) in the late 1980s [8, 9]. A PC is defined as a system in which the permittivity and permeability
+are periodically dependent on the position; thus, it can be viewed as an electromagnetic analogue of a
+* Plasmonic components, which are currently an area of active research, might enable further miniaturisation of optical
+devices [6].
+15
+16 Chapter 1. Preliminaries
+crystalline solid. The periodicity of the material properties can give rise to the appearance of band gaps,
+i.e., frequency ranges in which no propagative (energy-carrying) states can exist in the crystal. It was
+quickly recognised that linear defects in PCs can support localised eigenmodes with frequencies lying
+in the band gaps, and thus they can serve as waveguides [10]. Simultaneously, point defects in PCs
+were shown to act as resonant cavities with potentially very large quality factor–mode volume ratios
+[10]. However, it was the discovery that modes in PC waveguides can propagate around extremely sharp
+bends essentially without scattering losses [11] that led to an enormous increase of the interest in PCs as
+a possible means for further miniaturisation of optical ICs. Indeed, the bending radii of standard rib or
+ridge waveguides need be on the order of millimetres in order to keep the losses at a reasonable level [10].
+Since then, an overwhelming number of optical components made of interconnected PC waveguides and
+cavities have been proposed, and several of them have seen experimental realisation. For a relatively
+recent review of the current state of research on PCs, see ref. 12.
+While the early studies of PCs were focused primarily on the quest for structures providing the
+widest band gap and on the design of components operating within band gaps, in the last decade more
+and more attention has been devoted to the unusual properties of PCs outside band gaps. In contrast
+to homogeneous dielectrics, in which the equifrequency surfaces (EFSs) have the form of ellipsoids,
+the shape of the EFSs of PCs can be very complicated.* They can contain flat or even concave areas
+separated by sharp corners or edges. In addition, the group velocity need not point away from the origin
+of the reciprocal space. This richness of the dispersion relation gives rise to unusual phenomena [13],
+such as negative refraction of light [14], appearance of supercollimated beams [15] and the superprism
+effect [16]. Thus, it has been recognised that even defect-free (except for the presence of surfaces) PCs
+can constitute useful devices, for instance flat lenses [17, 18] or beam splitters [19].
+1.2 Outline of the thesis
+This thesis naturally splits into three parts. In chapters 2 and 3 we study defect-free two-dimensional
+(2D) PCs limited by one or two parallel surfaces. In particular, we are interested in the dependence of
+their properties on the structure of the interfaces separating them from the adjacent homogeneous media.
+In chapter 2 we introduce the single-mode approximation and use it as a mathematical foundation
+for an effective-medium model of 2D PCs. In contrast to most previous work, we do not restrict our
+considerations to the case of waves impinging perpendicularly to the PC surface. We show that our
+model allows us to reproduce the strong dependence of the effective material properties of a PC on the
+position of its truncation plane, observed by previous authors [21]. In particular, we demonstrate that
+the effective permittivity and permeability derived in the framework of the model are guaranteed to be
+real and continuous only if the truncation plane is chosen in certain particular ways. We test the validity
+of the model by comparing the values of the specular reflection coefficient it predicts for some specific
+PCs against results of rigorous numerical calculations. Since there has been a lot of interest in using
+PCs exhibiting the negative-refraction effect as lossless replacements of metamaterials, we pay particular
+attention to the accuracy of the effective-index description of bands with negative group velocity. We find,
+however, that it leaves much to be desired, especially for large incidence angles and in the evanescent-
+wave region. By means of a qualitative theoretical analysis, we argue that this behaviour is not restricted
+to the particular PC under study; instead, the low accuracy of the effective-index approximation is due to
+the inherent structure of the field of PC modes responsible for negative refraction.
+In chapter 3 we consider the problem of reducing the reflection losses occurring at an interface
+between a semi-infinite PC and a homogeneous medium. This is an important issue, severely limiting
+* This is analogous to what happens in solid-state theory: the Fermi surface in a free electron gas is spherical, but in a real
+solid it can have a very complex form, sometimes called, fittingly, a monster.
+1.3. Notational conventions 17
+the performance of practical PC devices, especially those using “bulk” PCs (as opposed to components
+based on PC waveguides). We propose to minimise these losses by superposing an additional structure—
+antireflection (AR) grating—on the PC surface, and present in detail an algorithm for the design of
+compact, wide-angle AR gratings for general 2D PCs. To assess its strengths and limitations, we apply
+it to three specific PCs, exhibiting the negative refraction, beam supercollimation, and superprism effect,
+respectively. In the first two cases, we obtain gratings ensuring a very significant decrease of the reflection
+loss; in the last case, however, the design procedure fails due to the violation of certain assumptions
+made in the derivation of our algorithm. The improvement brought by the proposed AR gratings to
+the transmission through a PC flat lens (based on the negative-refraction effect) has been confirmed
+experimentally [33].
+In chapter 4, which constitutes the second major part of this thesis, we shift our attention to more
+traditional, waveguide-based optical devices. We study the problem of miniaturisation of optical circula-
+tors, one of the last important components whose integrated versions are not yet commercially available.
+We build on the design of a magneto-optical PC-based circulator proposed in 2005 by Wang and Fan
+[34, 37]. It consists of three PC waveguides coupled to a special PC cavity supporting a pair of modes
+whose frequencies are split in the presence of a static external magnetic field (SEMF). The mode fre-
+quency splitting of the original cavity from refs. 34 and 37 is negligible in a uniform SEMF; it can only be
+augmented if the magneto-optical material in the cavity is divided into many oppositely polarised mag-
+netic domains, each having the area of a fraction of µm². Fabrication of such domains presents serious
+experimental difficulties, as it requires a precise control of the applied SEMF on the nanometre scale.
+Here, using an analytical model of an axisymmetric resonant cavity, we show how to design cavities
+exhibiting maximum frequency splitting in a uniform SEMF. We present 2D numerical simulations of
+two classes of circulators containing the proposed cavities: PC-based circulators, similar to those studied
+in refs. 34 and 37, and circulators in which the PC coating is dispensed with and the cavity is coupled
+directly to rib waveguides. This elimination of the PC lattice leads to a significant simplification of the
+device geometry, without any deterioration of its performance. Subsequently, we comment briefly on the
+results of the experimental tests of the proposed devices that have been done in Institut d’Electronique
+Fondamentale (Orsay, France). They reveal a significant problem with the original design of the resonant
+cavities: large out-of-plane radiation losses. In the final part of chapter 4 we report on the initial results
+of full three-dimensional (3D) simulations of the cavities, which show that the above problem may be
+overcome by an appropriate adjustment of the geometry of the cavity.
+In the last part of this thesis, chapter 5, we present several numerical methods developed for the sake
+of simulating some of the devices analysed in the earlier chapters. We start by discussing the extension
+of the multiple-scattering method, widely used to handle the problem of light scattering by finite PCs,
+to the case of 2D PCs containing gyrotropic materials. Next, we show how the band structures of 2D
+PCs composed of circular cylinders can be calculated to great accuracy using Fourier-Bessel expansions;
+remarkably, no lattice sum computations are necessary. Finally, we describe the implementation of the
+finite-element method for the calculation of eigenmodes of open, axisymmetric, 3D cavities containing
+gyrotropic materials.
+1.3 Notational conventions
+Throughout this thesis, symbols embellished with arrows (e.g., $\vec a$) will denote column vectors; with
+bars ($\bar a$), row vectors; and with hats ($\hat a$), matrices, tensors or operators. Complex conjugation will be
+indicated by an asterisk ($^*$), transposition by the symbol $^T$, and Hermitian conjugation by a dagger ($^\dagger$).
+A unit vector in a given direction $\xi$ will be written as $\vec e_\xi$. In particular, the unit vectors directed along the
+axes of a Cartesian coordinate system will be denoted by $\vec e_x$, $\vec e_y$ and $\vec e_z$, and of a cylindrical coordinate
+18 Chapter 1. Preliminaries
+system, by $\vec e_\rho$, $\vec e_\phi$ and $\vec e_z$. Vector operators will be written using the nabla symbol; thus, $\vec\nabla a$, $\vec\nabla \cdot \vec a$
+and $\vec\nabla \times \vec a$ will denote the gradient, divergence and curl of $a$ or $\vec a$. Finally, unless otherwise noted, the
+terms permittivity, permeability, impedance, admittance and immittance will refer to relative permittivity,
+permeability etc.
+1.4 Maxwell’s equations
+The electromagnetic fields in PCs and other optical systems are governed by Maxwell’s equations [60,
+61]. For convenience, we shall gather here the forms of these equations that will be most often refer-
+enced in later chapters of this manuscript. Since we shall only be concerned with the propagation of
+electromagnetic waves with wavelength much larger than the atomic dimensions (typically $\lambda > 1$ µm),
+we shall be using the macroscopic (phenomenological) Maxwell’s equations, in which the effects of
+light-matter interaction are taken into account by help of so-called material parameters.
+The most general differential form of macroscopic Maxwell’s equations is [61, eq. (I.1a)]
+rE  E  @B
+E
+E = E ; (1.1a)@t
+rE  E @D
+E
+H = E C J
+E; (1.1b)
+@t
+rE DE = ; (1.1c)
+rE  BE = 0; (1.1d)
+where $\vec E$ denotes the electric field, $\vec H$ the magnetic field, $\vec D$ the electric displacement field, $\vec B$ the mag-
+netic induction, $\rho$ the free charge density and $\vec J$ the free current density. All quantities are, in general,
+functions of the position $\vec r$ and time $t$; for conciseness, this dependence has not been written explicitly.
+Throughout this thesis we shall assume all fields to be time-harmonic, i.e., to depend on time as $e^{-i\omega t}$,
+where $i$ is the imaginary unit and $\omega$ the (angular) frequency. In this case, differentiation over $t$ reduces
+to multiplication by $(-i\omega)$ and hence eqs. (1.1) become
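+$$\vec\nabla \times \vec E = i\omega \vec B, \tag{1.2a}$$
+$$\vec\nabla \times \vec H = -i\omega \vec D + \vec J, \tag{1.2b}$$
+$$\vec\nabla \cdot \vec D = \rho, \tag{1.2c}$$
+$$\vec\nabla \cdot \vec B = 0. \tag{1.2d}$$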
+The fields $\vec D$ and $\vec B$ are related to $\vec E$ and $\vec H$ by so-called constitutive relations. We shall be dealing only
+with linear media, in which these relations take the form
+$$\vec D = \epsilon_0 \hat\epsilon \vec E + \sqrt{\epsilon_0 \mu_0}\, \hat\alpha \vec H \quad\text{and}\quad \vec B = \sqrt{\epsilon_0 \mu_0}\, \hat\beta \vec E + \mu_0 \hat\mu \vec H, \tag{1.3}$$
+where $\epsilon_0$ and $\mu_0$ denote the (absolute) permittivity and permeability of free space, $\hat\epsilon$ and $\hat\mu$ are the
+dimensionless (relative) position-dependent permittivity and permeability tensors of the system under
+study, and $\hat\alpha$ and $\hat\beta$ describe the strength of the magneto-electric coupling in this system. In the vast
+majority of materials used in practice, the elements of the two latter tensors are very small and can be
+neglected, as we shall do in the following. We shall also usually consider situations in which no free
+1.4. Maxwell’s equations 19
+charges or currents are present. Using all the above assumptions, eqs. (1.1) can be brought into the form
+rE EE = i!0O HE; (1.4a)
+rE HE =  i!0O EE; (1.4b)
+rE  .O EE/ = 0; (1.4c)
+rE  .O HE / = 0: (1.4d)
+It should be noted that owing to the identityrE .rE FE/ = 0, valid for any vector field FE [60, eq. (A1.17)],
+eqs. (1.4c)–(1.4d) follow automatically from eqs. (1.4a)–(1.4b) as soon as the field is not static (! ¤ 0),
+and therefore can be omitted.
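+In a large part of this manuscript we shall analyse 2D systems, in which the material properties $\hat\epsilon$
+and $\hat\mu$ are invariant with respect to translations along a privileged axis, called $\zeta$ in the following. Under
+the additional conditions that (i) the fields $\vec E$ and $\vec H$ are also independent of $\zeta$ (the case of in-plane
+propagation) and (ii) the tensors $\hat\epsilon$ and $\hat\mu$ have the block form
+$$\hat\epsilon = \begin{bmatrix} \hat\epsilon_t & \vec 0 \\ \bar 0 & \epsilon_\zeta \end{bmatrix} \quad\text{and}\quad \hat\mu = \begin{bmatrix} \hat\mu_t & \vec 0 \\ \bar 0 & \mu_\zeta \end{bmatrix}, \tag{1.5}$$
+eqs. (1.4a)–(1.4b) split into a pair of uncoupled systems of equations. Specifically, denoting by $\vec E_t$, $\vec H_t$
+and $\vec\nabla_t$ the components of the vectors $\vec E$, $\vec H$ and $\vec\nabla$ perpendicular to the $\zeta$ axis, we obtain
+$$\vec\nabla_t \times \vec H_t = -i\omega \epsilon_0 \epsilon_\zeta E_\zeta \vec e_\zeta, \tag{1.6a}$$
+$$\vec\nabla_t \times (E_\zeta \vec e_\zeta) = i\omega \mu_0 \hat\mu_t \vec H_t \tag{1.6b}$$
+and
+$$\vec\nabla_t \times \vec E_t = i\omega \mu_0 \mu_\zeta H_\zeta \vec e_\zeta, \tag{1.7a}$$
+$$\vec\nabla_t \times (H_\zeta \vec e_\zeta) = -i\omega \epsilon_0 \hat\epsilon_t \vec E_t. \tag{1.7b}$$
+It can be easily seen that eqs. (1.6) contain only the $E_\zeta$ and $\vec H_t$ field components, whereas eqs. (1.7)
+contain solely $\vec E_t$ and $H_\zeta$. A field satisfying eqs. (1.6) and having $\vec E_t = 0$ and $H_\zeta = 0$ will be called
+s-polarised. Conversely, a field satisfying eqs. (1.7) and having $E_\zeta = 0$ and $\vec H_t = 0$ will be called
+p-polarised.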
+
+Chapter 2
+Effective-medium model of photonic crystals
+2.1 Introduction
+As mentioned in section 1.1, a crucial feature of photonic crystals (PCs) is the richness of their disper-
+sion relation. The shape of PC equifrequency surfaces can be very complex: they can contain sharp
+corners or edges separating flat or even concave areas. However, at specific frequencies, they can also
+attain ellipsoidal shape, characteristic for homogeneous media. In consequence, the question arises if
+the crystals can then be successfully described by the effective-medium model, in which they are ap-
+proximated by a homogeneous material with specific values of permittivity $\epsilon$ and permeability $\mu$—or,
+equivalently, refractive index $n = (\epsilon\mu)^{1/2}$ and impedance $\eta = (\mu/\epsilon)^{1/2}$. Since homogeneous materials
+are incomparably easier to analyse than structured ones, an answer in the affirmative would facilitate the
+development of PC devices, especially those using the negative-refraction effect [14]. Indeed, most com-
+ponents employing this phenomenon, like the famous superlenses [17], have been designed essentially
+with homogeneous negative-index materials, first analysed by Veselago [20], in mind.
+Numerous papers dealing with this subject have already been published [21–32], giving rise to sev-
+eral competing definitions of the effective parameters of PCs, which will be reviewed in subsection 2.2.2.
+Unfortunately, as a rule, these definitions have been only heuristically motivated and lack a formal justifi-
+cation. Moreover, the ultimate verification of each such definition, the comparison of the true reflection
+coefficient of the crystal with that of the corresponding effective medium, has so far been performed only
+for normal [24–26] or near-normal [28] incidence. Yet many applications, including those involving neg-
+ative refraction, rely on waves incident at large angles, as well as evanescent ones. The range of validity
+of the effective-medium approximation is, therefore, still poorly known.
+The aim of the work presented in this chapter is to address these shortcomings. In section 2.2 the
+concept of the single-mode approximation is used to provide a mathematical justification for a particular
+definition of the effective parameters of two-dimensional (2D) PCs. In section 2.3 we study the influence
+of the symmetry of the crystal’s truncation plane and of the electromagnetic fields of its eigenmodes on
+the behaviour of its effective parameters, generalising the theorems obtained by Pierre and Gralak [27]
+in the one-dimensional (1D) case. To assess the accuracy of the effective-medium model, in section 2.4
+we compare the values of the specular reflection coefficient predicted within the model’s framework with
+the results of rigorous numerical calculations. These tests are done for two different crystals at a number
+of frequencies and in the full range of incidence angles. This leads to a detailed discussion of the appli-
+cability conditions of the single-mode approximation itself (section 2.5). We conclude that as far as the
+bands responsible for negative refraction are concerned, the single-mode approximation is (moderately)
+accurate only close to normal incidence. Thus, it does not make much sense to treat a PC exhibiting neg-
+ative refraction as a homogeneous material for large incidence angles or in the evanescent-wave regime.
+In consequence, the behaviour of systems containing homogeneous negative-index materials can change
+21
+22 Chapter 2. Effective-medium model of photonic crystals
+z z
+refracted excited
+wave eigenmodes
+O2; O 2
+z0 z0
+1; 1
+diffracted
+incident reflected incident waves
+wave wave wave
+x x
+(a) (b)
+Figure 2.1 Schematic diagrams of the fields generated by an s- or p-polarised plane wave incident from an
+isotropic homogeneous medium on the surface of (a) another homogeneous medium and (b) a photonic crystal.
+significantly if these materials are replaced with PCs, even if the equifrequency surfaces (and so the
+phase refractive indices) of both media are the same.
+A substantial part of the results presented in this chapter has previously been published in refs. 62
+and 63.
+2.2 Definition of the effective parameters of photonic crystals
+2.2.1 Preliminaries: the homogeneous-medium case
+In the effective-medium approximation, a lossless 2D PC is modelled by a lossless, homogeneous, pos-
+sibly anisotropic medium with one optical axis oriented along the invariant direction of the PC, hereafter
+taken to lie along the y axis. We shall begin with a brief analysis of the refraction of a plane wave inci-
+dent on the interface between an isotropic medium, labelled 1, with permittivity $\epsilon_1$ and permeability $\mu_1$,
+occupying the $z < z_0$ half-space, and this anisotropic material, labelled 2, characterised by tensorial $\hat\epsilon_2$
+and $\hat\mu_2$, lying in the $z > z_0$ half-space [fig. 2.1(a)]. The wave is taken to propagate in the $xz$ plane.
+For the sake of simplicity, we shall restrict our attention to PCs whose point group includes a mirror
+plane perpendicular to the x or z axis or a three-fold rotation axis parallel to the y axis. In these cases,
+by Neumann’s principle (“the symmetry elements of a physical property of a crystal must include the
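+symmetry elements of the crystal point group” [64, p. 14]), the tensors $\hat\epsilon_2$ and $\hat\mu_2$ become diagonal in the
+chosen coordinate system,
+$$\hat\epsilon_2 = \begin{bmatrix} \epsilon_{2x} & 0 & 0 \\ 0 & \epsilon_{2y} & 0 \\ 0 & 0 & \epsilon_{2z} \end{bmatrix}, \qquad \hat\mu_2 = \begin{bmatrix} \mu_{2x} & 0 & 0 \\ 0 & \mu_{2y} & 0 \\ 0 & 0 & \mu_{2z} \end{bmatrix}. \tag{2.1}$$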
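+Maxwell’s equations (1.6) can then be used to derive the dispersion relation of, say, s-polarised plane
+waves (with electric field perpendicular to the propagation plane) with wave vector $\vec k = k_x \vec e_x + k_z \vec e_z$
+propagating in medium 2,
+$$\frac{k_x^2}{K_x^2} + \frac{k_z^2}{K_z^2} = 1 \quad\text{with}\quad K_x^2 \equiv \frac{\omega^2}{c^2}\, \epsilon_{2y} \mu_{2z} \quad\text{and}\quad K_z^2 \equiv \frac{\omega^2}{c^2}\, \epsilon_{2y} \mu_{2x}, \tag{2.2}$$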
+2.2. Definition of the effective parameters of photonic crystals 23
+where $\omega$ denotes the frequency and $c \equiv 1/\sqrt{\epsilon_0 \mu_0}$ the speed of light defined in terms of the (absolute)
+permittivity $\epsilon_0$ and permeability $\mu_0$ of free space. Thus, the equifrequency curve (EFC) of material 2 is
+an ellipse with principal axes of length $2K_x$ and $2K_z$.
+When a plane wave with wave vector $\vec k_1 = k_x \vec e_x + k_{1z} \vec e_z$ falls on the interface separating media 1
+and 2, reflected and refracted waves, with wave vectors $\vec k_1' = k_x \vec e_x - k_{1z} \vec e_z$ and $\vec k_2 = k_x \vec e_x + k_{2z} \vec e_z$,
+respectively, are generated. By imposing the continuity conditions at $z = z_0$ on the field components par-
+allel to the interface, the well-known Fresnel formulas for the amplitude of the reflected and refracted
+waves can be derived:
+$$r = \frac{\mu_{2x}/k_{2z} - \mu_1/k_{1z}}{\mu_{2x}/k_{2z} + \mu_1/k_{1z}}, \tag{2.3a}$$
+$$t = \frac{2\mu_{2x}/k_{2z}}{\mu_{2x}/k_{2z} + \mu_1/k_{1z}}. \tag{2.3b}$$
+These formulas can be written in a concise way by introducing the notion of transverse impedance of a
+material, defined as
+$$Z_j \equiv \frac{E_{jt}}{Z_0 H_{jt}} \quad (j = 1, 2), \tag{2.4}$$
+where $Z_0 \equiv \sqrt{\mu_0/\epsilon_0}$ denotes the (absolute) impedance of free space, and $E_{jt}$ ($H_{jt}$) is the amplitude of
+the transverse, i.e., parallel to the interface, component of the electric (magnetic) field of a plane wave
+propagating in the $j$th material in the given direction $\vec k_j$. Since in our case $E_{jt} = E_{jy} = E_{jy}^0 e^{i \vec k_j \cdot \vec r}$,
+$H_{1t} = -H_{1x} = (i\omega \mu_0 \mu_1)^{-1}\, \partial E_{1y}/\partial z = (k_{1z}/\omega \mu_0 \mu_1) E_{1y}$, and $H_{2t} = (k_{2z}/\omega \mu_0 \mu_{2x}) E_{2y}$, we obtain
+$$Z_j = \frac{\omega}{c} \frac{\mu_{jx}}{k_{jz}} \tag{2.5}$$
+and
+$$r = \frac{Z_2 - Z_1}{Z_2 + Z_1}, \qquad t = \frac{2 Z_2}{Z_2 + Z_1}. \tag{2.6}$$
+By the duality theorem [65, p. 72–73], analogous results for p-polarised waves can be obtained by
+substituting $-\vec H$, $\vec E$, $\hat\mu$ and $\hat\epsilon$ for $\vec E$, $\vec H$, $\hat\epsilon$ and $\hat\mu$, respectively. Equations (2.6) must then be replaced by
+$$r = \frac{Y_2 - Y_1}{Y_2 + Y_1}, \qquad t = \frac{2 Y_2}{Y_2 + Y_1}, \tag{2.7}$$
+where
+$$Y_j = \frac{\omega}{c} \frac{\epsilon_{jx}}{k_{jz}} \tag{2.8}$$
+is the transverse admittance of the $j$th material. Introduction of the notion of transverse immittance $\Xi$ of a
+medium, defined as its transverse impedance $Z$ in the s-polarisation case and its transverse admittance $Y$
+in the p-polarisation case, lets us write Fresnel’s formulas (2.6) and (2.7) in a unified way:
+$$r = \frac{\Xi_2 - \Xi_1}{\Xi_2 + \Xi_1}, \qquad t = \frac{2 \Xi_2}{\Xi_2 + \Xi_1}. \tag{2.9}$$
+2.2.2 Existing definitions
+Several authors [24–26, 28, 66] have attempted to generalise the concept of transverse immittance to non-
+homogeneous media, the main obstacle being, obviously, that in such media the ratio $E_t/H_t$ is spatially
+dependent. The most straightforward approach is to define the immittance $\Xi$ as the ratio of the spatial field averages over the
+24 Chapter 2. Effective-medium model of photonic crystals
+surface unit cell, as proposed by Lu and Prather [26]; while this might seem an oversimplification, in
+subsection 2.2.3 we shall show that this approach is in fact rigorous if the single-mode approximation,
+defined in the same subsection, is valid. In an attempt to preserve more information from the detailed
+field structure, other authors [24, 25, 28, 66] suggested empirical definitions of the transverse impedance,
+expressed in terms of the average electromagnetic energy and Poynting vector of the dominant crystal
+eigenmode. However, no mathematical justification of these definitions has been given.
+Efros and Pokrovsky [23] and later Decoopman et al. [21] proposed an entirely different procedure.
+They considered the perturbation of the incident electromagnetic field caused by a PC slab embedded in
+a homogeneous medium whose permittivity $\epsilon$ and permeability $\mu$ were varied. The values of $\epsilon$ and $\mu$
+corresponding to minimum perturbation were taken as the effective parameters of the crystal. Contrary
+to the approaches cited in the previous paragraph, this method is based on a full rigorous solution of
+Maxwell’s equations. On the other hand, it requires a significant computational effort since, for each
+value of the frequency and angle of incidence, simulations need to be performed for multiple, possibly
+complex, values of $\epsilon$ and $\mu$ of the homogeneous medium. Therefore, it is not well-suited to the analysis
+of the general behaviour of the effective parameters, for which an—even approximate—semianalytical
+approach would be useful.
+Finally, some authors [29–32] proposed definitions of effective parameters based on the extended
+Maxwell-Garnett theory, where the crystal unit cell is replaced by a coated cylinder (or sphere) embed-
+ded in a homogeneous host medium whose parameters are determined from the condition of vanishing
+scattering, calculated by the Mie theory. This approach enabled them to reproduce the band structure
+of PCs, usually composed of dispersive (e.g., polaritonic) materials, with good accuracy. Nevertheless,
+the effective parameters they obtained are independent of the choice of the crystal truncation plane,
+whereas one of the key observations of Decoopman et al. [21] was the strong variability of effective $\epsilon$
+and $\mu$ with the position of the crystal surface. Thus, the parameters introduced in refs. 29–32 could not
+be used to determine accurately the reflection coefficient of a truncated PC.
+2.2.3 Proposed definition
+To arrive at the proper definition of the effective parameters of PCs, let us consider a semi-infinite 2D
+PC invariant along the $y$ axis, on whose surface, $z = z_0$, an s- or p-polarised plane wave with wave
+vector $\vec{k} = k_x\vec{e}_x + k_z\vec{e}_z$ is incident [fig. 2.1(b)]. Owing to the system’s periodicity in the $x$ direction,
+the reflected field will comprise infinitely many diffraction orders. Similarly, the transmitted field will
+be a superposition of infinitely many crystal eigenmodes (propagative and evanescent) characterised by
+different wave vectors. In contrast, as we have seen in subsection 2.2.1, if the crystal were replaced
+by a homogeneous material, only one transmitted plane wave would be excited. The effective-medium
+approximation can therefore be reasonably expected to give a good picture of reality only when some
+crystal eigenmode is excited with an amplitude significantly greater than the others. In other words, the
+validity of the effective-medium approximation is constrained by that of the single-mode approximation,
+which consists in neglecting all crystal eigenstates but the dominant one. We shall now show how this
+approximation leads to a natural definition of the crystal’s effective parameters.
+In the remaining part of this chapter we shall focus on s-polarised waves; formulas corresponding to
+p polarisation can be derived using the duality theorem and will be omitted for brevity. For the chosen
+polarisation, the electric field reduces to its component along the y axis, and Maxwell’s equations (1.6)
+take the form
+@Ey = i!0Hz; (2.10a)
+@x
+@Ey =  i!0Hx; (2.10b)
+@z
+2.2. Definition of the effective parameters of photonic crystals 25
+$$\frac{\partial H_z}{\partial x} - \frac{\partial H_x}{\partial z}
+  = i\omega\epsilon_0\epsilon E_y. \tag{2.10c}$$
+We shall solve these equations separately in the homogeneous region and in the PC, and then match the
+solutions at the crystal surface by imposing the continuity of the $E_y$ and $H_x$ components, in accordance
+with Maxwell’s boundary conditions.
+We assume the PC to be oriented so that a (not necessarily primitive) rectangular unit cell $(a_x, a_z)$
+can be defined. The whole system is periodic with respect to the variable $x$, so it is possible to perform
+a Floquet-Bloch transform [13, 67] of Maxwell’s equations (2.10). After this transform, as is well
+known from grating theory, the solution of Maxwell’s equations in the homogeneous region is given
+by the Rayleigh expansion [68, 69]
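+$$
+E^h_y(x, z) = e^{i[k_x x + \beta_0 (z - z_0)]}
+  + \sum_{n\in\mathbb{Z}} r_n\, e^{i[(k_x + G_{xn})x - \beta_n (z - z_0)]}, \tag{2.11}
+$$
+where $G_{xn} \equiv 2\pi n/a_x$ and $\beta_n \equiv [\epsilon_1\mu_1(\omega/c)^2 - (k_x + G_{xn})^2]^{1/2}$ with the sign of the square root chosen
+so that $\operatorname{Re}\beta_n + \operatorname{Im}\beta_n \ge 0$. In the crystal, we can expand the field in terms of the PC eigenmodes with the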
+$x$ component of the Bloch vector equal to $k_x$, taking into account (i) propagative modes carrying energy
+in the $+z$ direction and (ii) evanescent modes decaying in the same direction [13, 41–43, 70–72]. These
+modes can be determined by several methods, most of which utilise some variant of the scattering-matrix
+algorithm [73]; in the numerical calculations presented later in this chapter we have used the differential
+method [69, 74–76]. The electric field of the $m$th eigenmode with Bloch vector $\vec{\kappa}_m = k_x\vec{e}_x + \kappa_{mz}\vec{e}_z$ can
+be written as a 2D Fourier expansion with coefficients $(u_m^{np})_{n,p\in\mathbb{Z}}$:
+$$E_{my}(x, z) = \sum_{n\in\mathbb{Z}}\sum_{p\in\mathbb{Z}} u_m^{np}\, e^{i[(k_x + G_{xn})x + (\kappa_{mz} + G_{zp})z]}, \tag{2.12}$$
+where $G_{zp} \equiv 2\pi p/a_z$.$^\star$ Thus, the total electric field in the crystal will be
+$$
+E^c_y(x, z) = \sum_{m\in\mathbb{N}} t_m E_{my}(x, z) \tag{2.13}
+$$
+with “transmission coefficients” $t_m$ denoting the amplitudes of individual modes.
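+The requirement of continuity of $E_y$ and $H_x = -(i\omega\mu_0\mu)^{-1}\,\partial E_y/\partial z$ at $z = z_0$ leads to
+
+$$
+e^{ik_x x} + \sum_n r_n\, e^{i(k_x + G_{xn})x}
+  = \sum_m t_m \sum_n \sum_p u_m^{np}\, e^{i[(k_x + G_{xn})x + (\kappa_{mz} + G_{zp})z_0]}, \tag{2.14a}
+$$
+
+$$
+\frac{i\beta_0}{\mu_1}\, e^{ik_x x} - \sum_n \frac{i\beta_n}{\mu_1}\, r_n\, e^{i(k_x + G_{xn})x}
+  = \sum_m t_m \sum_n \sum_p i(\kappa_{mz} + G_{zp})\, u_m^{np}
+    \, e^{i[(k_x + G_{xn})x + (\kappa_{mz} + G_{zp})z_0]}. \tag{2.14b}
+$$
+
+Using the identity $\int_0^1 e^{2\pi i n x}\,dx = \delta_{n0}$, where $\delta_{nm}$ equals 1 if $n = m$
+and 0 otherwise, we arrive at the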
+$^\star$ Since we shall be studying the influence of shifting the surface of the crystal with respect to the origin of its unit cell, it is
+convenient to expand the field in the PC [eq. (2.12)] about the fixed point $(0, 0)$ rather than the point $(0, z_0)$ anchored on
+the surface.
+26 Chapter 2. Effective-medium model of photonic crystals
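+following inhomogeneous system of linear equations with unknowns $(r_n)_{n\in\mathbb{Z}}$ and $(t_m)_{m\in\mathbb{N}}$:
+$$\delta_{n0} + r_n = \sum_m u^n_m t_m, \tag{2.15a}$$
+$$\frac{i\beta_n}{\mu_1}(\delta_{n0} - r_n) = \sum_m v^n_m t_m, \qquad n \in \mathbb{Z}, \tag{2.15b}$$
+with the coefficients $u^n_m$ and $v^n_m$ defined as
+$$
+u^n_m \equiv \sum_p u_m^{np}\, e^{i(\kappa_{mz} + G_{zp})z_0}, \qquad v^n_m \equiv \sum_p i(\kappa_{mz} + G_{zp})\, u_m^{np}\, e^{i(\kappa_{mz} + G_{zp})z_0}. \tag{2.16}
+$$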
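+This system can be written in the matrix form
+$$
+\begin{bmatrix} -\hat{I} & \hat{u} \\ i\hat{\beta}/\mu_1 & \hat{v} \end{bmatrix} \begin{bmatrix} \vec{r} \\ \vec{t} \end{bmatrix}
+  = \begin{bmatrix} \vec{a} \\ \vec{a}' \end{bmatrix}, \tag{2.17}
+$$
+where $\hat{I}$ denotes the identity matrix, $\hat{u}$ and $\hat{v}$ are matrices with elements $u^n_m$ and $v^n_m$ (the row and column
+indices being denoted by super- and subscripts, respectively), $\hat{\beta}$ is the diagonal matrix of the coeffi-
+cients $\beta_n$, $\vec{r}$ and $\vec{t}$ are column vectors of the coefficients $r_n$ and $t_m$, and the vectors $\vec{a}$ and $\vec{a}'$, whose
+elements are given by
+$$a_n \equiv \delta_{n0}, \qquad a'_n \equiv i\beta_0\delta_{n0}/\mu_1, \tag{2.18}$$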
+represent the incident field.
+If the crystal were replaced by a homogeneous medium, the only nonzero reflection coefficient would
+be the specular one, $r_0$. Using eqs. (2.15) corresponding to $n = 0$, the following relation between $r_0$ and
+the transmission coefficients of individual modes can be derived:
+
+$$
+r_0 = \frac{\sum_m [u^0_m - (\mu_1/i\beta_0)\,v^0_m]\,t_m}
+           {\sum_m [u^0_m + (\mu_1/i\beta_0)\,v^0_m]\,t_m}. \tag{2.19}
+$$
+As we have already seen, the effective-medium approximation relies on the assumption that the trans-
+mission coefficient of a particular (dominant) mode is much larger than those of all others; without loss of
+generality, we can denote this mode with the index 1, so that our assumption reads $|t_1| \gg |t_2|, |t_3|, \ldots$
+If it holds, expression (2.19) reduces to
+
+$$
+r_0 \approx \frac{i u^0_1/v^0_1 - \mu_1/\beta_0}
+                 {i u^0_1/v^0_1 + \mu_1/\beta_0}. \tag{2.20}
+$$
+Comparing eq. (2.20) to the Fresnel’s formula (2.3a) and noting that $\beta_0$ and $k_{1z}$ denote the same
+physical quantity—the $z$ component of the wave vector of the incident plane wave—we conclude that
+$i u^0_1/v^0_1$ in eq. (2.20) corresponds to $\mu_{2x}/k_{2z}$ in eq. (2.3a). In the homogeneous-medium case, $k_{2z}$
+is the $z$ component of the wave vector of the refracted wave. Assuming that the EFC of the crystal
+at the considered frequency can be approximated by an ellipse with semiaxes $K_x$ and $K_z$ and centre
+$\vec{K}_0 \equiv (K_{0x}, K_{0z})$, as shown in fig. 2.2, it is natural to identify $k_{2z}$ in the PC case with the $z$ component
+of the Bloch vector of mode 1 measured from the centre of this ellipse, i.e., $\kappa'_{1z} \equiv \kappa_{1z} - K_{0z}$. In this
+way, we arrive at the following definition of the effective $\mu_x$ of the crystal:
+$$\mu_x \equiv i\kappa'_{1z}\,
+  \frac{u^0_1}{v^0_1}. \tag{2.21}$$
+2.3. Influence of symmetries on the effective parameters 27
+kz
+E0
+1
+Kx
+E1
+Kz
+KE0
+kx
+Figure 2.2 Relationship between the vectors $\vec{K}_0$, $\vec{\kappa}_1$ and $\vec{\kappa}'_1$.
+The dispersion relation (2.2) provides then the formulas for the effective $\mu_z$ and $\epsilon_y$,
+
+$$
+\mu_z = \frac{K_x^2}{K_z^2}\,\mu_x, \qquad
+\epsilon_y = \frac{1}{\mu_x}\,\frac{K_z^2}{\omega^2/c^2}, \tag{2.22}
+$$
+
+and eq. (2.5), for the effective transverse impedance,
+$$
+Z = \frac{\omega}{c}\,\frac{i u^0_1}{v^0_1}. \tag{2.23}
+$$
+Thus, within the framework of the single-mode approximation the PC produces the same reflected wave
+as the homogeneous medium with material parameters given by eqs. (2.21) and (2.22).
+Finally, we note that the definition (2.23) of the effective transverse impedance agrees with that
+given by Lu and Prather [26, section 3], since from eqs. (2.10b), (2.12) and (2.16) it follows that $u^0_1$
+and $-v^0_1/(i\omega\mu_0)$ are the average periodic parts of the $E_y$ and $H_x$ fields of mode 1 on the PC surface;
+substituting these values into eq. (2.4), we arrive at the expression (2.23).
+2.3 Influence of symmetries on the effective parameters
+“Standard” lossless homogeneous materials are characterised by purely real $\epsilon$, $\mu$ and $Z$. From the
+Fresnel’s formula (2.3a) it follows that the reflection coefficient of a plane wave incident on the interface
+separating two such materials will also be purely real provided that both the incident and the transmitted
+wave are propagative, i.e., k1z and k2z are real. These properties do not always carry over to the PC case.
+Indeed, Pierre and Gralak [27] proved that for 1D PCs they are guaranteed to hold only if the crystal is
+truncated along one of its mirror symmetry planes; otherwise, the effective material properties and the
+reflection coefficient may take complex values.
+Since the effective-medium description of PCs is an approximation, one might expect their effective
+material properties to have some kx-dependence. This does no harm as long as the variation with kx is
+fairly small. However, ref. 27 demonstrates that the effective parameters of a 1D PC cut elsewhere than
+along a mirror symmetry plane may diverge at the value of kx where the crystal eigenmode turns from
+propagative to evanescent. In consequence, the usefulness of the effective-medium model in this case is
+rather limited.
+In this section we shall extend the results from ref. 27 to the 2D case. It should be noted that in 1D
+systems mirror planes are in fact identical with inversion centres and two-fold rotation axes, so that a
+priori it is not obvious which of them turn out to be crucial in 2D.
+28 Chapter 2. Effective-medium model of photonic crystals
+2.3.1 Real-valuedness
+We shall now prove the following sufficient condition for the real-valuedness of the effective parameters
+and the specular reflection coefficient of 2D PCs.
+The reflection coefficient $r_0$ and the effective parameters $\mu_x$, $\mu_z$, $\epsilon_y$, and $Z$ of a 2D PC are real if:
+(i) both the incident wave and the dominant eigenmode are propagative, i.e., $\beta_0$ and $\kappa_{1z}$ are real,
+(ii) the truncation plane $z = z_0$ contains an inversion centre of the infinite crystal,
+(iii) the single-mode approximation is valid.
+Simple inspection of eqs. (2.20)–(2.23) shows that if the assumptions (i) and (iii) are fulfilled, the
+proposition is true provided the ratio $i u^0_1/v^0_1$ is real. This expression involves the Fourier coefficients $u_1^{np}$
+of the electric field of the dominant PC mode. By assumption (i), this mode is propagative, and therefore
+the coefficients in question can be obtained with the standard plane-wave method as described in ref. 77.
+Now, if the crystal is centrosymmetric with respect to a point $(x_0, z_0)$, the electric field of the mode can
+be written as
+$$E_{1y}(x, z) = \sum_n \sum_p \tilde{u}_1^{np}\, e^{i[(k_x + G_{xn})(x - x_0) + (\kappa_{1z} + G_{zp})(z - z_0)]}, \tag{2.24}$$
+
+where $\tilde{u}_1^{np}$ are the elements of a vector equal to the product of a real diagonal matrix and an eigenvector
+of a real symmetric matrix [77]; hence, they can be taken to be real. Comparing eq. (2.24) with the
+general formula (2.12), we obtain
+$$u_1^{np} = \tilde{u}_1^{np}\, e^{-i[(k_x + G_{xn})x_0 + (\kappa_{1z} + G_{zp})z_0]}, \tag{2.25}$$
+and, using eqs. (2.16), we arrive at
+$$
+\frac{i u^0_1}{v^0_1} = \frac{\sum_p \tilde{u}_1^{0p}}{\sum_p (\kappa_{1z} + G_{zp})\,\tilde{u}_1^{0p}}. \tag{2.26}
+$$
+Owing to the real-valuedness of $\tilde{u}_1^{np}$ and $\kappa_{1z}$, the above expression is real, and the proposition follows.
+On the contrary, if the interface contains no symmetry centres, a complex Hermitian eigenvalue
+problem is solved in the plane-wave method, so that the eigenvector elements $\tilde{u}_1^{np}$ need not be real, and
+neither does $i u^0_1/v^0_1$.
+2.3.2 Continuity and boundedness
+Preliminaries. We proceed to the investigation of the behaviour of the effective permittivity and per-
+meability of a 2D PC near a value of $k_x$ at which its dominant eigenmode turns from propagative to
+evanescent, i.e., near a vertex $\vec{K}_{v\pm} \equiv (K_{0x} \pm K_x, K_{0z})$ of the elliptical EFC. At such a point, $\kappa'_{1z}$ is
+zero; according to eqs. (2.21) and (2.22), this implies $\mu_x = \mu_z = 0$ and $|\epsilon_y| \to \infty$ unless $v^0_1$ is zero at
+the same time. In this subsection we shall study the circumstances in which this necessary condition for
+the continuity and boundedness of $\epsilon_y$ at the transition point is guaranteed to be met. The considerations
+are necessarily somewhat technical; the reader not interested in mathematical details can skip to the last
+paragraph of this subsection, where the obtained results are summarised.
+We shall limit the discussion to PCs whose geometry is described by one of the symmorphic space
+groups.$^\star$ Eigenmodes with a given Bloch vector $\vec{k}$ can then be classified in terms of the irreducible
+$^\star$ A symmorphic space group is a space group that contains all elements of its point group [78, p. 18]. This means, in
+particular, that the set of its generators must consist solely of pure rotations and mirror reflections (no screw rotation axes
+or glide planes are allowed).
+2.3. Influence of symmetries on the effective parameters 29
+representations of the largest common subgroup of the PC’s point group and the group of $\vec{k}$, i.e., the
+group of symmetry operations leaving $\vec{k}$ invariant or transforming it to a Bloch vector $\vec{k}'$ differing from
+$\vec{k}$ by a reciprocal-lattice vector [79, chap. 3; 80, chap. 8].
+If a vertex $\vec{K}_{v\pm}$ is located at a general reciprocal-space point, whose group consists solely of the
+identity operation $I$, no constraints on the symmetry of the corresponding eigenmode can be obtained.
+However, if $K_{0z} = 0$ or $K_{0z} = \pi/a_z$—as, in practice, is very often the case—the group of $\vec{K}_{v\pm}$ contains
+additionally the operation of mirror reflection with respect to the $x$ axis, $\sigma_x$.$^\star$ It follows that if the crystal
+itself has mirror planes parallel to $x$, the electric field of an eigenmode with Bloch vector $\vec{K}_{v\pm}$ is either
+symmetric or antisymmetric with respect to reflection about each of these planes. We shall assume the
+origin of the coordinate system to be chosen so that the mirror planes lie at $z = \tfrac{1}{2}qa_z$ for all $q \in \mathbb{Z}$ (it
+is easy to see that there are always two parallel planes per rectangular unit cell). Let us now consider
+separately the cases of $K_{0z} = 0$ and $K_{0z} = \pi/a_z$.
+The case of $K_{0z} = 0$. Setting $\kappa_{1z}$ to $K_{0z} = 0$ in the definition (2.16) of $v^0_1$ and using the definition of
+$G_{zp}$, we get
+$$
+v^0_1 = \frac{2\pi i}{a_z} \sum_{p\in\mathbb{Z}} p\,u_1^{0p}\, e^{2\pi i p z_0/a_z}. \tag{2.27}
+$$
+Consider first the case of an eigenmode whose electric field $E_{1y}(x, z)$ is symmetric with respect to
+reflection about the plane $z = 0$, i.e., $E_{1y}(x, z) = E_{1y}(x, -z)$. Expression (2.12) for $E_{1y}(x, z)$ and the
+orthogonality of the Fourier basis yield
+$$u_1^{n,-p} = u_1^{np} \quad \text{for all } n, p \in \mathbb{Z}. \tag{2.28}$$
+It is easy to check that the above condition guarantees also the symmetry of $E_{1y}(x, z)$ with respect to all
+the other mirror planes $z = \tfrac{1}{2}qa_z$. Substituting eq. (2.28) into eq. (2.27), we obtain
+0  4 
+X
+= 0p
+2 pz
+v1 pu1 sin
+0
+: (2.29)
+az az
+p>0
+Without further constraints on 0pu , the coefficient v01 1 is guaranteed to be null only if 2 z0=az is an
+integral multiple of  , so that all the sine factors vanish. With z0 restricted to the first unit cell (0  z0 <
+a ), this is equivalent to z = 0 or z = 1z 0 0 az . Thus, the crystal should be truncated along one of its mirror2
+planes.
+If the PC is based on a hexagonal or centred rectangular Bravais lattice, its primitive cell is two times
+smaller than the rectangular unit cell $(a_x, a_z)$ we are using. It can then be shown that half of the Fourier
+coefficients $u_1^{np}$, namely those with $n + p$ odd, vanish. As a result, eq. (2.29) becomes
+$$v^0_1 = -\frac{8\pi}{a_z} \sum_{p>0} p\,u_1^{0,2p}
+  \sin\frac{4\pi p z_0}{a_z}. \tag{2.30}$$
+It follows that all the sine factors, and hence the total sum too, will vanish on two more planes per unit
+cell: $z_0 = \tfrac{1}{4}a_z$ and $z_0 = \tfrac{3}{4}a_z$.
+Let us now proceed to the case of electric field antisymmetric with respect to the plane $z = 0$. Instead
+of eq. (2.28) we have then
+$$u_1^{n,-p} = -u_1^{np} \quad \text{for all } n, p \in \mathbb{Z}, \tag{2.31}$$
+$^\star$ Note in particular that the vector $\sigma_x(K_{0x} \pm K_x, \pi/a_z) = (K_{0x} \pm K_x, -\pi/a_z)$ is equivalent to $(K_{0x} \pm K_x, \pi/a_z)$, since
+they differ by the reciprocal-lattice vector $(2\pi/a_z)\vec{e}_z$.
+30 Chapter 2. Effective-medium model of photonic crystals
+and the sines in eq. (2.29) are replaced by cosines. To ensure that $v^0_1$ vanishes for all sequences $(u_1^{0p})_{p\in\mathbb{N}}$,
+to each $p$ must correspond a $q \in \mathbb{Z}$ such that $2\pi p z_0/a_z = (q + \tfrac{1}{2})\pi$. It is easy to see that this condition
+cannot be fulfilled for any value of $z_0$. For a PC based on a hexagonal or centred rectangular Bravais
+lattice, the condition becomes $4\pi p z_0/a_z = (q + \tfrac{1}{2})\pi$, which has no solutions, either.
+The case of $K_{0z} = \pi/a_z$. Instead of eq. (2.27), we have
+$$v^0_1 = \frac{\pi i}{a_z} \sum_{p\in\mathbb{Z}} (2p + 1)\,u_1^{0p}\,
+  e^{\pi i(2p+1)z_0/a_z}. \tag{2.32}$$
+Substitution of the expression (2.12) for $E_{1y}(x, z)$ into the condition of symmetry/antisymmetry with
+respect to the plane $z = 0$, $E_{1y}(x, z) = \pm E_{1y}(x, -z)$, yields
+$$
+\sum_n \sum_p u_1^{np}\, e^{i[(k_x + 2n\pi/a_x)x + (2p+1)\pi z/a_z]}
+  = \pm \sum_n \sum_p u_1^{np}\, e^{i[(k_x + 2n\pi/a_x)x - (2p+1)\pi z/a_z]}, \tag{2.33}
+$$
+so that from the orthogonality of the Fourier basis we obtain
+$$u_1^{np} = \pm u_1^{n,-p-1} \quad \text{for all } n, p \in \mathbb{Z}. \tag{2.34}$$
+It can also be shown that a mode with $k_z = \pi/a_z$ that is symmetric with respect to the plane $z = 0$ must
+be antisymmetric with respect to the plane $z = \tfrac{1}{2}a_z$ and vice versa; thus, without loss of generality, we
+can take the plus sign in the above equation. Substituting it into eq. (2.32), we get
+$$
+v^0_1 = \frac{\pi i}{a_z} \sum_{p\ge 0} (2p + 1)\,u_1^{0p}\,[e^{i(2p+1)\pi z_0/a_z} - e^{-i(2p+1)\pi z_0/a_z}]
+  = -\frac{2\pi}{a_z} \sum_{p\ge 0} (2p + 1)\,u_1^{0p} \sin\frac{(2p+1)\pi z_0}{a_z}. \tag{2.35}$$
+Vanishing of $v^0_1$ is thus ensured if $\sin[(2p + 1)\pi z_0/a_z] = 0$ for all integer $p \ge 0$, which is equivalent
+to $z_0 = qa_z$ with $q \in \mathbb{Z}$. This corresponds to placing the truncation plane along a symmetry plane of
+the electric field of the crystal’s dominant eigenmode. The situation is the same if the PC is based on
+a hexagonal or centred rectangular Bravais lattice: the condition for vanishing $v^0_1$ takes then the form
+$\sin[(4p + 1)\pi z_0/a_z] = 0$ for all integer $p \ge 0$, which is again equivalent to $z_0 = qa_z$ with $q \in \mathbb{Z}$.
+Conclusions. From the above considerations we can establish the following rule:
+The effective parameters $\mu_x$, $\mu_z$ and $\epsilon_y$ are continuous and bounded at the point of the propagative-to-
+evanescent transition of the dominant PC eigenmode in the two following cases:
+(i) • the transition occurs at $\vec{k} = k_x\vec{e}_x$,
+• the crystal has mirror planes parallel to $x$,
+• the electric field of the dominant mode is symmetric with respect to these planes, and
+• the crystal is truncated along one of these planes or, provided it is based on a hexagonal or
+centred rectangular Bravais lattice, midway between these planes;
+(ii) • the transition occurs at $\vec{k} = k_x\vec{e}_x + (\pi/a_z)\vec{e}_z$,
+• the crystal has mirror planes parallel to $x$, and
+• the crystal is truncated along a symmetry plane of the electric field of its dominant eigen-
+mode.
+2.4. Examples 31
+a
+0:5
+0:4
+0:3
+plane 3 p
+3a 3=8 0:2
+plane 2 p
+a 3=4
+plane 1 0:1
+0
+  M K  
+(a) (b)
+Figure 2.3 (a) Geometry of the hexagonal-lattice PC analysed in the text. Horizontal lines mark the position of
+truncation planes 1, 2, and 3; inversion centres of the PC located at these planes are marked with crosses. (b) Band
+structure of the crystal shown in part (a). Horizontal lines mark the frequency values $\omega = 0.14 \times 2\pi c/a$ and
+$0.259 \times 2\pi c/a$.
+This rule is not a rigorous theorem. First, the sufficiency of the above conditions has not been proved.
+Assuming that the Taylor expansions of $u^0_1(\kappa'_{1z})$ and $v^0_1(\kappa'_{1z})$ about $\kappa'_{1z} = 0$ exist, the formula (2.21)
+for $\mu_x$ can be written as
+
+$$
+\mu_x(\kappa'_{1z}) = i\,
+\frac{
+  \kappa'_{1z}\,u^0_1(0)
+  + (\kappa'_{1z})^2\,(du^0_1/d\kappa'_{1z})|_{\kappa'_{1z}=0} + \cdots
+}{
+  v^0_1(0)
+  + \kappa'_{1z}\,(dv^0_1/d\kappa'_{1z})|_{\kappa'_{1z}=0} + \cdots
+}. \tag{2.36}
+$$
+The effective permeability $\mu_x$ is then finite and different from zero if and only if
+exactly $q - 1$ lowest derivatives of $u^0_1$ and $q$ lowest derivatives of $v^0_1$,
+where $q \in \mathbb{N}$, vanish at $\kappa'_{1z} = 0$.
+We have proved that in the two cases listed above $v^0_1(0)$ vanishes;
+it can also be shown that in these cases $u^0_1(0)$ is in general
+non-zero.
+However, the proof that $(dv^0_1/d\kappa'_{1z})|_{\kappa'_{1z}=0}$ does not vanish
+is missing.
+Second, the above conditions have not been proved to be strictly necessary. Indeed, the coefficients
+$u_1^{0p}$ can accidentally take such values that
+$v^0_1$ will vanish for some “random” truncation.
+This does not seem to be a major problem, though,
+and one should probably
+treat these situations like, for instance,
+accidental degeneracies in group theory.
+These reservations notwithstanding, in the following section it will be shown that the effective pa-
+rameters of two typical PCs at several distinct frequencies behave exactly as predicted by the above rule.
+So far, the author has not found any counterexample to it.
+2.4 Examples
+In this section we shall apply the theory presented above to the cases of two specific PCs, one with a
+hexagonal and one with a square lattice. In particular, the predictions of the effective-medium model will
+be compared with the results of numerical calculations made with the differential method [69, 74–76].
+2.4.1 Hexagonal lattice
+To begin with, we consider the crystal shown in fig. 2.3(a): the hexagonal lattice of air holes of radius
+$0.35a$, $a$ being the lattice constant, embedded in a dielectric matrix with $\epsilon = 16$. Figure 2.3(b) presents
+its Brillouin diagram. At the frequency $\omega = 0.14 \times 2\pi c/a$, the EFC of the single s-polarised propagative
+crystal eigenmode has the shape of a circle centred at the $\Gamma = (0, 0)$ point [fig. 2.4(a), middle diagram,
+solid line]. In figs. 2.5(a), (d) and (g) the specular reflection coefficient of this crystal at the quoted
+!a=2 c
+32 Chapter 2. Effective-medium model of photonic crystals
+1:50
+(a) (b)
+1:25 n D  2
+n D  2
+1:00
+0:75
+n D  1
+0:50 n D  1
+0:25  D 4
+ D 2
+ D 1
+0:50 n D 0
+nD 1
+0:25
+n D 0
+0:00
+0:25
+0:00 0:25 0:50 0:00 0:25 0:50
+kxa=2  kxa=2 
+Figure 2.4 The EFCs at frequency (a) $\omega = 0.14 \times 2\pi c/a$ and (b) $\omega = 0.259 \times 2\pi c/a$ of three PCs of the
+type shown in fig. 2.3(a) with the same average refractive index $\langle\sqrt{\epsilon}\rangle = 2.67$, but different values of the index
+contrast $\eta \equiv \sqrt{\epsilon_b}/\sqrt{\epsilon_h}$ between the background and the holes: $\epsilon_b = 16$, $\epsilon_h = 1$, $\eta = 4$ (solid lines), $\epsilon_b = 11.76$,
+$\epsilon_h = 2.94$, $\eta = 2$ (dotted lines), and $\epsilon_b = \epsilon_h = 7.11$, $\eta = 1$ (dashed lines). The middle part of the graphs shows
+the EFCs of the real bands ($\operatorname{Re} k_z \ne 0$, $\operatorname{Im} k_z = 0$), the bottom one, of the imaginary bands of the first kind [81]
+($\operatorname{Re} k_z = 0$, $\operatorname{Im} k_z \ne 0$), and the top one, of the imaginary bands of the second kind ($\operatorname{Re} k_z = 2\pi/a\sqrt{3}$, $\operatorname{Im} k_z \ne 0$,
+i.e., lying on the edge of the first Brillouin zone). Only the three bands with lowest values of $\operatorname{Im} k_z$ are shown in
+each case. The bands of the empty lattice ($\eta = 1$) are labelled with the index $n$ of the harmonic $G_{xn}$ to which they
+correspond. For each mode with wave vector $\vec{k}$ visible in the graph, the crystal supports three additional modes
+with wave vectors $\vec{k}^*$, $-\vec{k}$, and $-\vec{k}^*$ [81].
+Im kza=2  Re kza=2  Im kza=2 
+2.4. Examples 33
+1 0:06 1 0:10
+(a) Im r0 (g)
+0:04
+0 ! 0 0:05
+rel. error
+Re 0:02 r0
+ 1 0:00  1 0:00
+4 4
+(b) (h)
+2 2
+0 0
+1:0 14 20  =2
+(c) (i)
+0:9 y ! 13
+10 0
+0:8  12 10jx j jy jx
+argx arg y
+0:7 11 0   =2
+0:0 0:1 0:2 0:3 0:4 0:5 0:0 0:1 0:2 0:3 0:4 0:5
+kxa=2  kxa=2 
+1 0:15
+(d)
+0:10
+0
+0:05
+ 1 0:00
+4
+(e)
+2
+0
+1:5 10
+(f)
+1:4
+9
+1:3
+8
+1:2
+1:1 7
+0:0 0:1 0:2 0:3 0:4 0:5
+kxa=2 
+Figure 2.5 (a) The $k_x$-dependence of the specular reflection coefficient $r_0$ of the crystal from fig. 2.3(a) trun-
+cated along plane 1, at $\omega = 0.14 \times 2\pi c/a$. Solid lines: results of rigorous calculations, $r_0^{\mathrm{n}}$; circles: results of
+calculations made in the single-mode approximation, $r_0^{\mathrm{sm}}$; dashed line: relative error $\delta$ of the single-mode approx-
+imation. The vertical lines at $k_x = 0.14 \times 2\pi/a$ and $0.447 \times 2\pi/a$ mark where the incident wave and the single
+propagating crystal eigenmode, respectively, turn from propagating to evanescent. (b) Amplitudes of the three
+most slowly decaying crystal eigenmodes excited in the above conditions (solid, dashed, and dotted line, in order
+of increasing $\operatorname{Im} k_z$). (c) Effective $\mu_x$ (dark lines) and $\epsilon_y$ (light lines) of the crystal. (d)–(f) and (g)–(i) The same
+for planes 2 and 3.
+x j j Re r0, Im r0, xtm j j Re r0, Im r0,tm
+10jx j, jy j j j Re r0, Im r0,tm
+argx , arg y
+Relative error
+Relative error Relative error
+y y
+34 Chapter 2. Effective-medium model of photonic crystals
+1
+0
+ 1
+(a) (b)
+Figure 2.6 Real part of the electric field $E_y$ of the modes of the crystal shown in fig. 2.3(a) with (a)
+$\omega = 0.14 \times 2\pi c/a$, $k_x = 0.447 \times 2\pi/a$, and $k_z = 0$, (b) $\omega = 0.259 \times 2\pi c/a$, $k_x = 0.259 \times 2\pi/a$, and $k_z = 0$. A mirror
+plane of the crystal parallel to its surface is marked with a horizontal line.
+1 1:5 2 2
+(a) rel.!error
+(d)
+1:0
+ Im r0
+0 0 1
+ Re r 0:50
+ 1 0:0  2 0
+4 10
+(b) (e)
+2 5
+0 0
+0:2 50 0:1 50
+(c) (f)
+0:0
+0:0
+y ! 0  0:1 0
+ 0:2  x  0:2
+ 0:4  50  0:3  50
+0:0 0:1 0:2 0:3 0:4 0:5 0:0 0:1 0:2 0:3 0:4 0:5
+kxa=2  kxa=2 
+Figure 2.7 Same as fig. 2.5, at frequency $\omega = 0.259 \times 2\pi c/a$ and for truncation planes (a)–(c) 1 and (d)–(f) 2.
+Discontinuities in the plots of $r_0^{\mathrm{sm}}$ appear at $k_x = 0.33 \times 2\pi/a$, because at this value of $k_x$ the two most slowly
+decaying crystal eigenstates “swap places”, and the calculations of $r_0^{\mathrm{sm}}$ are always done assuming the mode with
+the smallest $\operatorname{Im} k_z$ to be dominant. The domain of the plots of effective parameters has been restricted to the range
+of $k_x$ in which the relative error of the single-mode approximation is less than 25%.
+frequency is plotted against the $x$ component of the wave vector of the incident plane wave for three
+different positions, marked with horizontal lines in fig. 2.3(a), of the interface between the crystal and
+the homogeneous medium, taken to be vacuum ($\epsilon_1 = \mu_1 = 1$). In these graphs, the results of rigorous
+numerical calculations ($r_0^{\mathrm{n}}$, solid lines) are juxtaposed with the values obtained from eq. (2.20) derived
+in the framework of the single-mode approximation ($r_0^{\mathrm{sm}}$, circles). Evidently, for surfaces containing
+inversion centres $\operatorname{Im} r_0^{\mathrm{n}}$ is very small in the whole range $k_x < 0.14 \times 2\pi/a$, in which the incident wave
+is propagative [figs. 2.5(a) and (d)]. On the contrary, when the termination is chosen in an arbitrary way,
+$r_0$ acquires an appreciable imaginary part [fig. 2.5(g)]. This is in agreement with the rule formulated in
+subsection 2.3.1.
+x
+j j Re r0, Im r0,tm
+x jtmj Re r0, Im r0,
+y
+Relative error
+
+Relati yve error
+2.4. Examples 35
+In all the three graphs, the relative error of the single-mode approximation, defined as
+$\delta \equiv |r_0^{\mathrm{sm}} - r_0^{\mathrm{n}}|/|r_0^{\mathrm{n}}|$, is plotted with a dashed line. It is clear that at the chosen frequency (corresponding to the mid-
+dle of the first band of the crystal) the single-mode approximation is very accurate for $k_x$ corresponding
+to propagative incoming waves ($k_x < \omega/c$); for larger $k_x$, the accuracy degrades slightly, but the relative
+error seldom exceeds 10%.
+Figures 2.5(c), (f) and (i) present the $k_x$-dependence of the effective $\mu_x$ and $\epsilon_y$ at $\omega = 0.14 \times 2\pi c/a$
+for the three different termination planes of the crystal. As shown in fig. 2.6(a), at the chosen frequency
+(and in the whole first band) the electric field of the mode with $k_x = 0.447 \times 2\pi/a$ and $k_z = 0$ is
+symmetric with respect to the horizontal mirror planes of the crystal. Thus, the conditions enumerated
+in point (i) of the rule from subsection 2.3.2 are satisfied for truncation planes 1 and 2, and indeed, as
+shown in figs. 2.5(c) and (f), the effective permittivity $\epsilon_y$ is continuous and bounded for these truncation
+planes. In contrast, $\epsilon_y$ diverges at $k_x = 0.447 \times 2\pi/a$ when the crystal is truncated along the arbitrarily
+chosen plane 3 [fig. 2.5(i)].
+It should be noted that shifting the truncation plane has a large influence on the numerical values
+of the effective parameters. For instance, at normal incidence, the crystal truncated along plane 1 has
+$\epsilon_y = 14.0$ and $\mu_x = 0.73$, whereas for the truncation plane 2 these values are $\epsilon_y = 7.1$ and $\mu_x = 1.43$—a
+difference of a factor of two. This corroborates the earlier observations of Decoopman et al. [21].
+As demonstrated above, at a frequency lying in the first band of the crystal under study the single-
+mode approximation works well, and so the effective-medium model is well-founded. In the second
+band, however, this approximation becomes much less accurate. We shall consider specifically the fre-
+quency $\omega = 0.259 \times 2\pi c/a$, at which the EFC of the crystal is, again, centred at $\Gamma$, approximately
+circular, and its radius corresponds to the effective index $n \approx -1$ [fig. 2.4(b), middle diagram, solid
+line]. In figs. 2.7(a) and (d) the rigorous value of the specular reflection coefficient of the crystal at this
+frequency is juxtaposed with that calculated from eq. (2.20). The relative error grows with $k_x$ and is
+usually greater than 20% (plane 1) and 10% (plane 2). In the evanescent region, the single-mode ap-
+proximation is clearly irrelevant. The graphs of the amplitudes of the three most slowly decaying crystal
+eigenmodes [figs. 2.7(b) and (e)] clearly show that the influence of the second mode is nonnegligible
+in the whole range of $k_x$, and for the first truncation plane even the third mode plays a significant part.
+Close inspection reveals that the ratios $|t_2/t_1|$ and $|t_3/t_1|$ tend to grow with the incidence angle; thus,
+the effective-medium model is a better approximation at near-normal than at grazing incidence (except
+for the immediate neighbourhood of $k_x = \omega/c$, where $r_0$ becomes exactly $-1$).
+In addition, as shown in fig. 2.6(b), the electric field of the mode with $\omega = 0.259 \times 2\pi c/a$,
+$k_x = 0.259 \times 2\pi/a$ and $k_z = 0$ is antisymmetric with respect to the mirror planes of the crystal. Thus, $\epsilon_y$ is
+divergent at $k_x = 0.259 \times 2\pi/a$ regardless of the choice of the truncation plane [figs. 2.7(c) and (f)].
+2.4.2 Square lattice
+The second structure to be studied is the square lattice of air holes of radius $0.35a$, where $a$ is the lattice
+constant, drilled in a dielectric matrix with $\varepsilon = 11.56$ [fig. 2.8(a)]. Its Brillouin diagram is plotted in fig.
+2.8(b). The analysis will be conducted at three discrete frequencies, $\omega = 0.13 \times 2\pi c/a$, $0.22 \times 2\pi c/a$
+and $0.31 \times 2\pi c/a$, at which the EFCs of the crystal have an approximately circular or elliptical shape,
+as demonstrated in fig. 2.9.
+Figures 2.10(a), (d) and (g) show the $k_x$-dependence of the reflection coefficient $r_0$ at the frequency
+$\omega = 0.13 \times 2\pi c/a$ for the three positions of the truncation plane marked in fig. 2.8(a). Planes 1 and 2
+contain inversion centres of the PC, while plane 3 does not. According to the theorem from subsec-
+tion 2.3.1, for the former planes $r_0$ should be real as long as both the incident wave and the dom-
+inant crystal eigenstate are propagative, which is the case for $k_x < \omega/c = 0.13 \times 2\pi/a$. Figures
+36 Chapter 2. Effective-medium model of photonic crystals
+a
+0:5
+0:4
+plane 3 0:3
+3a=4
+plane 2 0:2
+a=2
+plane 1 0:1
+0
+  X M  
+(a) (b)
+Figure 2.8 (a) Geometry of the square-lattice PC analysed in the text. Horizontal lines mark the position of
+truncation planes 1, 2 and 3; inversion centres of the infinite PC located at these planes are marked with crosses.
+(b) Band structure of the crystal shown in part (a). Horizontal lines mark the frequency values $\omega = 0.13 \times 2\pi c/a$,
+$0.22 \times 2\pi c/a$ and $0.31 \times 2\pi c/a$.
+0:50
+(a) (b) (c)
+0:25
+0:00
+ 0:25
+ 0:50
+ 0:5 0:0 0:5  0:5 0:0 0:5  0:5 0:0 0:5
+kxa=2  kxa=2  kxa=2 
+Figure 2.9 The EFCs at frequency (a) $\omega = 0.13 \times 2\pi c/a$, (b) $0.22 \times 2\pi c/a$, and (c) $0.31 \times 2\pi c/a$ of the PC
+shown in fig. 2.8(a) (solid lines) and the corresponding “empty lattice”, i.e., the homogeneous medium of refractive
+index $2.476$ (dashed and dotted lines). The empty-lattice bands corresponding to the $n = 0$ harmonics are plotted
+with dashed lines, the rest with dotted lines.
+2.10(a) and (d) confirm that this is fulfilled with a very good accuracy. In fact, $\operatorname{Im} r_0^{\mathrm{n}}$ does not exceed
+0.002, that is, 0.3% of the magnitude of $r_0^{\mathrm{n}}$; this tiny imaginary part stems from the excitation of sec-
+ondary crystal eigenmodes, which are neglected in the single-mode approximation. In turn, when the
+PC is truncated along plane 3, $r_0$ retains a large imaginary part also in the propagative-wave region
+[fig. 2.10(g)].
+The plots of the relative error show that when the incident wave is propagative, the single-mode
+approximation is extremely accurate at the frequency in question (the relative error is less than 0.3%).
+For larger kx , the error slowly grows, reaching   0:6–0:8 (planes 1 and 3) and   0:2 (plane 2)
+at the Brillouin zone edge. However, it does not exceed 10% until kx = 0:43  2 =a for planes
+1 and 3 and kx = 0:475  2 =a for plane 2, so that the single-mode approximation is still rele-
+vant at kx = 0:39  2 =a, where 1z vanishes and the dominant eigenmode becomes evanescent.
+We may then proceed to the analysis of the behaviour of the effective parameters at this value of kx .
+The EFC of the dominant eigenmode is centred at   , and its electric field at kx = 0:39  2 =a
+and kz = 0 is symmetric with respect to the horizontal mirror planes of the crystal, as evidenced by
+fig. 2.11(a). In consequence, the effective parameters x = z and y are continuous and bounded
+kza=2 
+!a=2 c
+2.4. Examples 37
+1 0:75 1 1:0
+(a) (g)
+ 0:50
+Im r0
+0 0 0:5
+R e r0 0:25
+!
+rel. error
+ 1 0:00  1 0:0
+4 4
+(b) (h)
+2 2
+0 0
+0:95 11 20  =2
+(c) (i)
+0:90
+y ! 10 arg y
+0:85 10 jy j 0
+9 arg
+ x0:80 x jx j
+0:75 8 0   =2
+0:0 0:1 0:2 0:3 0:4 0:5 0:0 0:1 0:2 0:3 0:4 0:5
+kxa=2  kxa=2 
+1 0:3
+(d)
+0:2
+0
+0:1
+ 1 0:0
+4
+(e)
+2
+0
+1:4 7:5
+(f) 7:0
+1:2 6:5
+6:0
+1:0 5:5
+0:0 0:1 0:2 0:3 0:4 0:5
+kxa=2 
+Figure 2.10 (a) The $k_x$-dependence of the specular reflection coefficient $r_0$ of the crystal from fig. 2.8(a) trun-
+cated along plane 1, at $\omega = 0.13 \times 2\pi c/a$. Solid lines: results of rigorous calculations, $r_0^{\mathrm{n}}$; circles: results of
+calculations made in the single-mode approximation, $r_0^{\mathrm{sm}}$; dashed line: relative error of the single-mode approx-
+imation. The vertical lines at $k_x = 0.13 \times 2\pi/a$ and $0.367 \times 2\pi/a$ mark where the incident wave and the single
+propagating crystal eigenmode, respectively, turn from propagating to evanescent. (b) Amplitudes of the three
+most slowly decaying crystal eigenmodes excited in the above conditions (solid, dashed and dotted line, in order
+of increasing $\operatorname{Im} k_z$). (c) Effective $\mu_x$ (dark lines) and $\varepsilon_y$ (light lines) of the crystal. (d)–(f) and (g)–(i) The same
+for planes 2 and 3.
+
+ xx j j Re r0, Im r0, j j Re r0, Im r0,tm tm
+jx j, jy j j Re r0, Im r0,tmj
+argx , arg y
+Relative error
+Relative error
+y Relative error y
+38 Chapter 2. Effective-medium model of photonic crystals
+1
+0
+ 1
+(a) (b) (c)
+Figure 2.11 Real part of the electric field $E_y$ of the modes of the crystal shown in fig. 2.8(a) with
+(a) $\omega = 0.13 \times 2\pi c/a$, $k_x = 0.367 \times 2\pi/a$ and $k_z = 0$, (b) $\omega = 0.22 \times 2\pi c/a$, $k_x = 0.264 \times 2\pi/a$ and $k_z = \pi/a$,
+(c) $\omega = 0.31 \times 2\pi c/a$, $k_x = 0.078 \times 2\pi/a$ and $k_z = 0$. Two nonequivalent mirror planes of the crystal parallel to
+its surface are marked with horizontal lines.
+1 1:0 1 0:2
+(a) (d)
+ 0
+Im r0
+0 0:5  1 0:1
+ Re r0  2
+  rel. error!1 0:0  3 0:0
+4 2
+(b) (e)
+2 1
+0 0
+3 1 50
+(c) (f)
+z
+2
+0 0
+1 y
+x
+0  1  50
+0:0 0:1 0:2 0:3 0:0 0:1 0:2 0:3
+kxa=2  kxa=2 
+Figure 2.12 Same as fig. 2.10, at frequency $\omega = 0.22 \times 2\pi c/a$ and for truncation planes (a)–(c) 1 and (d)–(f) 2.
+The vertical lines at $k_x = 0.22 \times 2\pi/a$ and $0.264 \times 2\pi/a$ mark where the incident wave and the single propagating
+crystal eigenmode, respectively, turn from propagating to evanescent.
+in the whole range of $k_x$ for the cuts 1 and 2, which coincide with mirror planes of the PC [figs.
+2.10(c) and (f)]. In contrast, truncating the crystal along plane 3 leads to divergence of $\varepsilon_y$ at
+$k_x = 0.39 \times 2\pi/a$.
+We turn now to the study of the system at the frequency $\omega = 0.22 \times 2\pi c/a$. The EFC, shown in fig.
+2.9(b), consists of two elliptical “branches” encircling the points $X = (0, \pi/a)$ and $X' = (\pi/a, 0)$. In the
+effective-medium model, we focus on the neighbourhood of the first EFC branch ($|k_x| < 0.39 \times 2\pi/a$)
+and use the dimensions of the ellipse encircling the $X$ point to calculate the effective parameters. The
+electric field of the mode corresponding to the right vertex of this ellipse is plotted in fig. 2.11(b). It is
+symmetric with respect to plane 1, which passes through the cylinder centres, and antisymmetric with
+respect to plane 2, passing midway between the cylinders.
+j j Re r0, Im r0,x , z , y tm
+x , z j j Re r0, Im r0,tm
+
+Relati yve error
+Relative error
+2.4. Examples 39
+1 2 1 2
+(a) (d)
+ 
+Im r0
+0 1 0 1
+ Re r0
+rel. error!
+ 1 0  1 0
+20
+(b) 20 (e)
+10
+0 0
+ 0:08  0:5  0:100  0:4
+(c)  ! (f)y
+   0:60:10  0:125  0:5
+ 0:7
+ 0:12     0:150  0:6x 0:8
+ 0:14  0:9  0:175  0:7
+0:00 0:02 0:04 0:06 0:08 0:00 0:02 0:04 0:06 0:08
+kxa=2  kxa=2 
+Figure 2.13 Same as fig. 2.10, at frequency $\omega = 0.31 \times 2\pi c/a$ and for truncation planes (a)–(c) 1 and (d)–
+(f) 2. The vertical line at $k_x = 0.078 \times 2\pi/a$ marks where the propagating crystal eigenmode turns evanescent (the
+incident wave is propagating throughout the kx range presented on the plot).
+Figures 2.12(a) and (d) show the $k_x$-dependence of the reflection coefficient $r_0$ for these two crystal
+terminations. As for $\omega = 0.13 \times 2\pi c/a$, the approximation accuracy is visibly better for plane 2 than for plane 1:
+in the former case, r0 is rendered faithfully well beyond the propagative-wave region. The superior
+performance achieved for plane 2 is probably due to the uniformity of the crystal permittivity on this
+plane, which leads to smaller spatial field variations, making fewer Fourier harmonics necessary to match
+the field in the crystal with that in free space. However, the antisymmetry of the eigenmode’s electric
+field with respect to plane 2 implies that the effective permittivity $\varepsilon_y$ diverges at $k_x = 0.26 \times 2\pi/a$ [fig.
+2.12(f)]. In contrast, if the other truncation plane is chosen, all effective parameters are continuous and
+bounded [fig. 2.12(c)], but at the cost of a significant single-mode approximation error:   17% close
+to normal incidence. (This time, the relative error is not very meaningful in the evanescent-wave region,
+since the rigorous reflection coefficient passes through zero at kx = 0:29  2 =a, so that  blows up.)
+Finally, we move on to the case of $\omega = 0.31 \times 2\pi c/a$. The EFC diagram shown in fig. 2.9(c)
+comprises an approximately circular part located at the centre of the Brillouin zone and four curves
+of irregular shape, together forming a closed path encircling the point $M = (\pi/a, \pi/a)$. The circular
+EFC represents a negative-refraction band. As seen from fig. 2.11(c), the electric field of the mode
+with $k_x = 0.078 \times 2\pi/a$ and $k_z = 0$ is symmetric with respect to planes 1 and 2, which assures the
+continuity of the effective parameters at $k_x = 0.078 \times 2\pi/a$, where the mode turns from propagating to
+evanescent. This is in contrast to the negative-refraction band of the hexagonal crystal analysed in the
+previous subsection, whose symmetry properties made $\varepsilon_y$ diverge at the transition point. However, there
+is no improvement in the accuracy of the single-mode approximation: the comparison of the values of $r_0$
+calculated rigorously and from eq. (2.20) [figs. 2.13(a) and (d)] reveals that the approximation introduces
+a significant error (above 33% for plane 1 and 11% for plane 2) due to the large excitation amplitude of
+secondary crystal eigenmodes [figs. 2.13(b) and (e)].
+x
+jtmj Re r0, Im r0,
+x
+jtmj Re r0, Im r0,
+y
+Relative error
+y
+Relative error
+40 Chapter 2. Effective-medium model of photonic crystals
+2.4.3 Remarks
+In the context of metamaterials containing resonant components, such as metallic split rings, it has been
+observed that inside band gaps, the effective permittivity and permeability of these structures (defined at
+normal incidence) have large imaginary parts of opposite sign, regardless of the location of the truncation
+plane [82–85]. This is not in contradiction with our theory, since one of the assumptions of the condition
+for real-valuedness of $\varepsilon$ and $\mu$ formulated in subsection 2.3.1 is the propagative nature of the fundamental
+crystal eigenstate (real 1z). Of course, inside band gaps all modes are evanescent, and so the condition
+in question is not applicable.
+On the other hand, our results show that in general the effective parameters of a lossless PC can attain
+complex values even outside band gaps, if the truncation plane does not exhibit certain symmetries. In
+this case, the product $\varepsilon\mu$ is real (due to the absence of losses), and either $\varepsilon$ or $\mu$ has a negative imaginary
+part. This is visible, for example, in fig. 2.5(i) showing the $k_x$-dependence of the effective parameters
+for the low-symmetry truncation plane 3 of the PC from fig. 2.3(a): it is clear that $\arg\mu_x \in [-\pi/2, 0]$, so
+that $\operatorname{Im}\mu_x < 0$. Only at specific truncation planes are effective $\varepsilon$ and $\mu$ real. (It must be noted, though,
+that precisely these special truncation planes have usually been chosen in previous calculations of the
+effective parameters of PCs and metamaterials.)
+2.5 Validity of the single-mode approximation
+We have seen that the accuracy of the single-mode approximation for a given PC varies strongly with
+frequency and incidence angle. In some cases, one of the crystal modes is clearly dominant; in others,
+several eigenstates are excited with similar magnitude. In the following, we offer a qualitative argument
+relating the ratios $|t_m/t_1|$ of the excitation coefficients of the individual modes to the Fourier spectrum of
+their electromagnetic fields on the crystal surface. This leads us to conclusions regarding, in particular,
+the viability of the effective-medium description of negative-refraction bands.
+Let us begin by writing the system (2.17) in a partitioned form, emphasising the rows corresponding
+to the nonzero elements of the vectors representing the incident field, a and a00 0, as well as the columns
+corresponding to the unknowns r0 and tk:
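+$$
+\begin{bmatrix}
+-\hat I & \vec 0 & \hat 0 & \hat u^{<0}_{<k} & \vec u^{<0}_{k} & \hat u^{<0}_{>k} \\
+\bar 0 & -1 & \bar 0 & \bar u^{0}_{<k} & u^{0}_{k} & \bar u^{0}_{>k} \\
+\hat 0 & \vec 0 & -\hat I & \hat u^{>0}_{<k} & \vec u^{>0}_{k} & \hat u^{>0}_{>k} \\
+i\hat\beta_{<0}/\mu_1 & \vec 0 & \hat 0 & \hat v^{<0}_{<k} & \vec v^{<0}_{k} & \hat v^{<0}_{>k} \\
+\bar 0 & i\beta_0/\mu_1 & \bar 0 & \bar v^{0}_{<k} & v^{0}_{k} & \bar v^{0}_{>k} \\
+\hat 0 & \vec 0 & i\hat\beta_{>0}/\mu_1 & \hat v^{>0}_{<k} & \vec v^{>0}_{k} & \hat v^{>0}_{>k}
+\end{bmatrix}
+\begin{bmatrix} \vec r_{<0} \\ r_0 \\ \vec r_{>0} \\ \vec t_{<k} \\ t_k \\ \vec t_{>k} \end{bmatrix}
+=
+\begin{bmatrix} \vec 0 \\ 1 \\ \vec 0 \\ \vec 0 \\ i\beta_0/\mu_1 \\ \vec 0 \end{bmatrix}.
+\tag{2.37}
+$$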
+We remind the reader that the symbols embellished with arrows, bars and hats are column vectors, row
+vectors and matrices, respectively, while those without any embellishment are scalars (see section 1.3).
+The meaning of the indices should be clear; for example, $\hat u^{<0}_{<k}$ stands for the submatrix of the $\hat u$ matrix
+corresponding to rows with negative indices and columns with indices less than $k$. From Cramer’s
+rule [86, p. 299], we have $t_l/t_k = D_l/D_k$, where $D_j$ stands for the determinant of the matrix created
+by replacing the $j$th column in the right half of the matrix of the system from eq. (2.37) by the right-
+hand side of the system. After some algebra, where elementary properties of determinants are utilised,
+2.5. Validity of the single-mode approximation 41
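+we arrive at
+$$
+\frac{t_l}{t_k} = (-1)^{l-k}\,
+\frac{
+\begin{vmatrix}
+-\hat I & \hat 0 & \hat u^{<0}_{<l} & \hat u^{<0}_{>l} \\
+\hat 0 & -\hat I & \hat u^{>0}_{<l} & \hat u^{>0}_{>l} \\
+i\hat\beta_{<0}/\mu_1 & \hat 0 & \hat v^{<0}_{<l} & \hat v^{<0}_{>l} \\
+\hat 0 & i\hat\beta_{>0}/\mu_1 & \hat v^{>0}_{<l} & \hat v^{>0}_{>l}
+\end{vmatrix}
+}{
+\begin{vmatrix}
+-\hat I & \hat 0 & \hat u^{<0}_{<k} & \hat u^{<0}_{>k} \\
+\hat 0 & -\hat I & \hat u^{>0}_{<k} & \hat u^{>0}_{>k} \\
+i\hat\beta_{<0}/\mu_1 & \hat 0 & \hat v^{<0}_{<k} & \hat v^{<0}_{>k} \\
+\hat 0 & i\hat\beta_{>0}/\mu_1 & \hat v^{>0}_{<k} & \hat v^{>0}_{>k}
+\end{vmatrix}
+}.
+\tag{2.38}
+$$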
+By means of the Laplace expansion [86, p. 259] of the determinants in the numerator and denominator
+along the columns containing $\vec u_k$ and $\vec u_l$, respectively, the ratio $t_l/t_k$ can be written as the ratio of two
+sums of terms proportional to the components of the Fourier expansion of the electric and magnetic fields
+at the crystal surface of, respectively, the $k$th and $l$th eigenmode:
+$$
+\frac{t_l}{t_k} = \frac{\sum_{n \ne 0} (a_n u^n_k + b_n v^n_k)}{\sum_{n \ne 0} (a_n u^n_l + b_n v^n_l)},
+\tag{2.39}
+$$
+where $a_n$ and $b_n$ denote the appropriate coefficients resulting from the Laplace expansion. It is crucial
+to observe that these sums do not contain the zeroth Fourier component of either field.
+The PC bands can be treated as mixtures of the eigenstates of the empty lattice with “average” $\varepsilon$
+and $\mu$; for a fixed $k_x$, these eigenstates are the plane waves $E_{yn}(x, z) = \exp[i(k_x + G_{xn})x + i k_{zn} z]$,
+where $k_{zn} = \sqrt{\varepsilon\mu(\omega/c)^2 - (k_x + G_{xn})^2}$. When the index contrast of the PC is low enough, in some
+regions of the $(\omega, k_x)$ space each of the PC eigenstates comprises a single dominant plane wave, the
+perturbative components having low amplitude. This means that each of the sets of coefficients $(u^n_m)_{n \in \mathbb{Z}}$
+corresponding to different modes $m$ contains a single dominant component. From eq. (2.39) it follows
+that, in general, the mode whose dominant component is the zeroth one ($n = 0$) is then excited the
+most strongly. Indeed, labelling this mode with index $m = 1$, we see that in the expression (2.39) for
+the ratio $t_l/t_1$ ($l \ne 1$) the sum in the numerator does not contain terms proportional to $u^0_1$ and $v^0_1$,
+which, by assumption, are the largest ones. On the contrary, the sum in the denominator contains two
+terms proportional to the dominant components of the $l$th mode, say, $u^{n_l}_l$ and $v^{n_l}_l$, since $n_l$ is necessarily
+different from zero. Thus, we see that the fraction $t_l/t_1$ is a ratio of a “small” and a “large” quantity—and
+so $|t_l| \ll |t_1|$ for all $l \ne 1$, that is, the defining assumption of the single-mode approximation is fulfilled.
+Conversely, if there is strong coupling between the zeroth harmonic and plane waves corresponding
+to different values of n, so that no mode with highly dominant zeroth component exists, the numerator in
+(2.39) for k = 1 is no longer a small quantity, and multiple eigenmodes can be excited with comparable
+amplitude.
+We conclude that the single-mode approximation should work best at those values of $\omega$ and $k_x$ for
+which the mode originating from the $n = 0$ harmonic—the plane wave $\exp(i k_x x + i k_{z0} z)$—does not
+contain significant contributions of other plane waves. In practice, this usually means that when we
+consider the transition from the empty lattice to the final PC, the fragment of the EFC of the PC around
+a given value of $k_x$ should form mainly from the circle corresponding to the $n = 0$ harmonic of the
+empty lattice. For example, as can be seen in fig. 2.4(a), the EFC of the single propagating mode of
+the hexagonal-lattice PC at frequency $\omega = 0.14 \times 2\pi c/a$ (solid line, middle diagram) is very similar to
+the original EFC of the $n = 0$ harmonic of the empty lattice (dashed line). In addition, the imaginary
+bands corresponding to $n = -1$ and $n = -2$ are very weakly perturbed (top diagram). We infer that the
+42 Chapter 2. Effective-medium model of photonic crystals
+1:0
+(a) (b)
+0:5
+0:0
+ 0:5
+1
+(c) (d)
+0
+  u
+n
+1=u
+0
+1 1
+vn=v0
+  1 12
+ 2  1 0 1 2  2  1 0 1 2
+n n
+Figure 2.14 Values of the harmonics $(u^n_1)_{n=-2}^{2}$ and $(v^n_1)_{n=-2}^{2}$ of the propagative eigenmode of the crystal from
+fig. 2.3(a) on the truncation plane 1 and at (a) $\omega = 0.14 \times 2\pi c/a$, $k_x = 0.10 \times 2\pi/a$, (b) $\omega = 0.14 \times 2\pi c/a$,
+$k_x = 0.40 \times 2\pi/a$, (c) $\omega = 0.259 \times 2\pi c/a$, $k_x = 0.05 \times 2\pi/a$, (d) $\omega = 0.259 \times 2\pi c/a$, $k_x = 0.20 \times 2\pi/a$.
+individual plane waves couple weakly, so that the zeroth harmonic of the field of the propagating crystal
+eigenmode should be dominant, and the eigenmode itself should be strongly excited. These claims are
+corroborated by figs. 2.14(a)–(b), where the amplitudes of several harmonics $u^n_1$ and $v^n_1$ of this mode
+at the truncation plane 1 are shown for two values of $k_x$, and fig. 2.5(b), where the amplitudes $|t_m|$ of
+individual eigenstates are juxtaposed.
+Now let us turn our attention to fig. 2.4(b), where the evolution of the EFCs at the frequency
+$\omega = 0.259 \times 2\pi c/a$ is shown; this frequency lies in the second band, which exhibits negative group velocity.
+We can see that in this case the plotted quarter of the circular EFC of the single propagating crystal
+eigenstate is formed by merging of the $n = 0$ and $n = -1$ harmonics of the empty lattice. Their strong
+coupling is further indicated by the substantial alteration of the shape of the imaginary bands. We can
+expect the contribution of the zeroth harmonic to be strongest at small values of $k_x$, and so the accuracy
+of the single-mode approximation to be highest near normal incidence and deteriorate with increasing $k_x$.
+This is again confirmed by figs. 2.14(c)–(d) and 2.7(b).
+To help establish a broader picture of the single-mode approximation’s performance for the hexagonal-
+lattice PC, in fig. 2.15(b) the relative error of the reflection coefficient r0 calculated in this approximation
+is plotted for a mesh of $101 \times 100$ points of the $(k_x, \omega)$ space. In turn, figs. 2.15(c) and (d) present the
+amplitude variations of the zeroth harmonic of the electric and magnetic field, respectively, of the most
+slowly decaying crystal mode (on the truncation plane 1). It can be seen that, although there is no one-to-
+one correspondence, the areas of significant error generally match those in which the n = 0 component
+of either the electric or magnetic field, or both, of the least-evanescent eigenmode has small amplitude.
+(In fact, the dependence of the approximation’s accuracy on the Fourier spectrum of the magnetic field
+seems more pronounced than that on the electric field.)
+Finally, it should be noted that the EFC from fig. 2.4(b) is in fact typical for negative-refraction
+bands. Indeed, the EFCs of the empty lattice are circular, with group velocity directed outwards, and the
+negative bands arise from convex figures formed by arcs of three, four or six such intersecting circles,
+necessarily including those corresponding to harmonics with nonzero Gxn (see fig. 2.16). Thus, the
+resulting bands do not fulfil the validity condition of the single-mode approximation, or do it only in the
+restricted range of kx close to zero. Consequently, attribution of effective permittivity and permeability
+to negative-refraction bands makes sense at most for near-normal incidence, while in the evanescent
+regime the effective-medium description is definitely inappropriate.
+Normalized value
+Normalized value
+2.5. Validity of the single-mode approximation 43
+0:5
+0:4
+0:3
+0:2
+0:1
+(a)
+0:0
+0:5 1:00
+0:4
+0:75
+0:3
+0:50
+0:2
+0:25
+0:1
+(b)
+0:0 0:00
+0:5 1:00
+0:4
+0:75
+0:3
+0:50
+0:2
+0:25
+0:1
+(c)
+0:0 0:00
+0:5 1:00
+0:4
+0:75
+0:3
+0:50
+0:2
+0:25
+0:1
+(d)
+0:0 0:00
+0:0 0:2 0:4
+kxa=2 
+Figure 2.15 (a) Projection of the band structure of the PC shown in fig. 2.3(a) on the $(k_x, \omega)$ plane. Grey and
+white areas denote photonic bands and gaps, respectively. The arrows mark the frequency values $\omega = 0.14 \times 2\pi c/a$
+and $0.259 \times 2\pi c/a$. (b) The dependence of the relative error of the single-mode approximation of this
+crystal’s reflection coefficient on $k_x$ and $\omega$ for the truncation plane 1. (c) The corresponding dependence of
+$|u^0_1| / \bigl(\sum_n |u^n_1|^2\bigr)^{1/2}$. (d) Same for $|v^0_1| / \bigl(\sum_n |v^n_1|^2\bigr)^{1/2}$.
+!a=2 c !a=2 c !a=2 c !a=2 c
+0 0
+Relative error Normalized ju1j Normalized jv1 j
+44 Chapter 2. Effective-medium model of photonic crystals
+(a) (b)
+(c) (d)
+Figure 2.16 Typical configurations of empty-lattice EFCs leading to formation of negative-refraction bands
+after introducing sufficient lattice modulation. In each case, the direction of normal incidence is from the bottom;
+circles corresponding to harmonics with $G_{xn} = 0$ are drawn in darker blue. Thin lines mark the boundaries of
+the first Brillouin zone of each lattice, and black dots denote reciprocal lattice points. Top row: square lattice,
+bands encircling (a) the $M$ point of the first Brillouin zone, (b) the $\Gamma$ point; bottom row: hexagonal lattice, bands
+encircling (c) the $K$ point, (d) the $\Gamma$ point.
+2.6 Conclusions
+In this chapter, we have analysed in detail the effective-medium description of 2D PCs. Its validity has
+been shown to be restricted by the accuracy of the single-mode approximation, and a definition of the
+effective permittivity, permeability and transverse impedance, rigorous under this approximation, has
+been given. In the framework of the single-mode approximation, we have studied the dependence of
+the specular reflection coefficient r0 of the crystal on the position of the truncation plane, deriving the
+conditions assuring r0, and consequently the effective parameters, to be real-valued. Continuity and
+boundedness of the latter have been shown to depend on the symmetry of the dominant eigenmode of the
+crystal.
+Subsequently, the conditions of validity of the single-mode approximation have been studied. We
+have established a link between the relative excitation amplitudes of individual crystal eigenmodes and
+the Fourier spectrum of the electric and magnetic fields of these modes on the crystal truncation plane.
+This link has been employed to formulate a criterion for estimating the accuracy of the single-mode
+approximation by comparing the equifrequency diagrams of the PC and of the homogeneous medium
+with refractive index equal to the average refractive index of the PC. Finally, we discussed the special
+case of negative-refraction bands; we concluded that the effective-medium description of these bands is,
+quite generally, inaccurate, since their Fourier-space structure entails simultaneous excitation of other
+bands by plane waves incident at most angles, and so attributing a definite effective permittivity and
+permeability to these bands is not physically meaningful.
+Chapter 3
+Antireflection gratings for photonic crystals
+3.1 Introduction
+As can be seen from the plots of the reflection coefficient of PCs presented in chapter 2 (figs. 2.5, 2.7,
+2.10, 2.12, and 2.13), reflected waves of significant amplitude are often generated at PC surfaces. In
+many applications, one strives for a perfect energy transfer between the incident plane wave and the
+propagative PC eigenmode (or, more rarely, several such modes). Propagative reflected waves should
+then be eliminated. This chapter concerns the design of antireflection (AR) structures that, placed on
+a PC surface, significantly diminish the fraction of energy lost to reflected waves. After reviewing the
+classes of these structures proposed to date (section 3.2), in section 3.3 we put forward a new method of
+designing AR gratings operating in a wide range of angles of incidence. This algorithm is illustrated in
+section 3.4 by means of several examples. We summarise the advantages and limitations of the proposed
+approach in section 3.5.
+3.2 Types of antireflection structures
+3.2.1 Antireflection structures for homogeneous media
+Since the design of AR structures for PCs is often guided by the experience gained from the long-
+standing study of methods for eliminating reflections from interfaces separating homogeneous media,
+we shall begin with a brief review of the AR structures employed in this simpler case.
+They can be divided into two broad classes: AR coatings and AR gratings. The refractive index $n$ of AR coatings depends only on
+the coordinate $z$ perpendicular to the interface; depending on whether $n(z)$ is piecewise-constant or not,
+we speak of homogeneous-layer or inhomogeneous-layer AR coatings [87]. In turn, the refractive index
+of AR gratings is also a function of the coordinates parallel to the interface. Figure 3.1 shows example
+AR structures of these three kinds (homogeneous-layer coatings, inhomogeneous-layer coatings and gratings).
+The simplest homogeneous-layer AR coating consists of a single thin film with refractive index $n$ and
+thickness $d$ chosen so as to ensure destructive interference of waves reflected from its top and bottom
+surfaces, excited by a plane wave with a certain frequency $\omega$ and angle of incidence $\theta$. The values of
+$n$ and $d$ can be obtained analytically. In order to improve the angular and frequency tolerance of the
+coating, one can increase the number of layers to make the transition between the refractive index of the
+super- and substrate more gradual [87], thus reducing the amplitude of waves reflected at the individual
+discontinuities of $n(z)$. In the limit of an infinite number of layers, one arrives at an inhomogeneous-
+layer coating with a continuous monotonic profile $n(z)$. Several specific profiles have been proposed in
+the literature (see ref. 88 for a review). Unfortunately, these “ideal” AR coatings, even the single-layer
+one, cannot usually be realised because of the lack of suitable materials with the required values of n.
+This is the case, in particular, for air-solid interfaces, where thin films with refractive index close to unity
+45
+46 Chapter 3. Antireflection gratings for photonic crystals
+z z z
+medium 2 medium 2 medium 2
+AR
+AR coating AR coating grat-
+ing
+medium 1 medium 1 medium 1
+x x x
+(a) (b) (c)
+Figure 3.1 Example AR structures belonging to the three principal classes described in the text. Darker areas
+denote regions with higher refractive index. (a) A homogeneous-layer AR coating. (b) An inhomogeneous-layer
+AR coating. (c) A (binary lamellar) AR grating.
+are needed. Short of using special ultra-low-index media, such as so-called Reststrahlen materials [87],
+there are two basic ways of circumventing this problem.
+One of them consists in abandoning completely the structures based on a “continuous transition”
+between the super- and substrate refractive indices in favour of interference-based coatings [87]. In
+these systems, the total reflected wave vanishes thanks to the destructive interference of partial waves
+generated at interfaces between layers with contrasting values of $n$. For instance, so-called v-coatings
+consist of two layers with prescribed refractive indices $n_1$ and $n_2$ (corresponding to realistic materials)
+and thicknesses $d_1$ and $d_2$ adjusted so as to eliminate reflection at the desired values of $\omega$ and $\theta$. Note
+that $n_1$ and $n_2$ must satisfy certain conditions in order that appropriate $d_1$ and $d_2$ can be found [89,
+p. 96]. A disadvantage of v-type AR coatings is that their angular and frequency tolerance are usually
+inferior even to those of the corresponding ideal single-layer coatings [89, p. 97; 90, p. 188].
+The other solution consists in using subwavelength gratings to simulate AR coatings with arbitrary
+$n(z)$ profiles. In many cases, the effective-medium theory of gratings can be employed to calculate
+the grating profile mimicking the desired $n(z)$ dependence [88]. Several types of gratings, such as the
+lamellar, trapezoidal, sinusoidal, triangular and pyramidal ones, have been studied in the literature and
+shown to have good AR properties [88, 91–93]. A review of the experimental methods used to fabricate
+such AR structures can be found in ref. 94.
+3.2.2 Antireflection structures for photonic crystals
+As pointed out in chapter 2, a distinguishing feature of PCs is the dependence of their reflection coeffi-
+cient on the position of their truncation plane. One could hope then that a significant reduction of a PC’s
+reflectance could be achieved without adding any AR structure, but simply by choosing an appropriate
+cut. For some crystals, this has indeed proved to be possible [95, 96]. In particular, Botten et al. [96] have
+shown that very low reflectance is a rather general feature of rod-type PCs truncated midway between
+successive layers of rods. For many crystals, however, no truncation plane provides a sufficiently small
+value of reflectance (see fig. 3.2). This method of reducing reflection is therefore not general enough,
+and one often has to resort to introducing some AR structure. Several types of them have been proposed
+in the literature. More often than not, they have much in common with one of the solutions developed
+with homogeneous materials in mind, reviewed in the previous subsection.
+3.2. Types of antireflection structures 47
+0:4
+z a
+0:3
+p
+a 3
+0:2
+2
+0
+0:1
+0:0 0:1 0:2 0:3 0:4 0:5
+p
+z0=.a 3/
+(a) (b)
+Figure 3.2 (a) The dependence of the reflectance $|r_0|^2$ of the PC shown in part (b), placed in air, on the location
+of the truncation plane $z = z_0$. The impinging wave is normally incident, s-polarised and has frequency
+$\omega = 0.311 \times 2\pi c/a$. It can be seen that $|r_0|^2$ does not fall under 0.13 for any truncation plane. (b) Geometry of the
+PC under study: a hexagonal lattice of air holes with radius $0.365a$, where $a$ is the lattice constant, etched in a
+dielectric matrix with permittivity $\varepsilon = 10.6$.
+The simplest approach has been proposed by Li et al. [97]. It consists in placing in front of the
+crystal a v-type AR coating composed of two layers made of constituent materials of the crystal, usually
+air and a dielectric. Their thicknesses can be determined analytically or graphically as soon as the
+reflection coefficient of the semi-infinite uncoated PC at the selected operation frequency is known. This
+frequency is assumed to be low enough that only the zeroth diffraction order is propagative in the layer
+closest to the PC surface, so that all higher orders reflected by the crystal decay before reaching the
+boundary between the two layers. If it is not the case, the structure may still work, but the optimum layer
+thicknesses will not in general be given by the analytical formulas derived from the thin-film theory. The
+basic disadvantage of this otherwise very attractive approach is the relatively low angular and frequency
+tolerance of v-type AR coatings.
+Another group has studied a similar approach, in which one of the homogeneous layers is replaced
+by a grating of rods or holes [98, 99]. The performance of the resulting AR gratings was shown to be
+similar to that of v-type coatings [99]. Related structures, albeit with only a single degree of freedom
+(the radius of the outermost rods of a rod-type PC), were also analysed by Jin and He [100]. In turn,
+Zhang and Li [101] proposed a more complex wide-angle AR grating for the interface between air and
+a PC flat lens, whose fabrication would be seriously hindered, though, by the presence of extremely thin
+air slits and dielectric veins.
+In contrast to the above works, which concentrated on the low-frequency regime, the authors of refs.
+102–104 endeavoured to eliminate the reflection from an interface between a PC and a semiconductor at
+a frequency where multiple propagative diffraction orders existed in the latter medium. They proposed
+an AR grating consisting of elongated drop-shaped air holes, this nonstandard form being motivated
+by the desire of ensuring a gradual transition between the two media. In fact, the shape of the resulting
+structure resembles closely the classical trapezoidal AR gratings studied, e.g., by Raguin and Morris [92].
+The improvement brought about by these gratings has subsequently been demonstrated experimentally
+[105]. Unfortunately, Baba et al. did not provide any analytical guidelines regarding the choice of the
+geometrical parameters of the gratings, resorting instead to a time-consuming scan of the parameter space
+in order to find the optimum structure [102, 103].
+A very important contribution was made by Lawrence et al. [106, 107], who introduced the concept
+of generalised matrix-valued effective immittance $\hat{\xi}$ of gratings and showed that their effective-medium
+jr j20
+48 Chapter 3. Antireflection gratings for photonic crystals
+description can be made arbitrarily accurate by allowing $\hat{\xi}$ to have sufficiently large dimensions. Such
+matrix-valued immittance cannot serve as a drop-in replacement of the corresponding scalar quantity in
+standard formulas derived for homogeneous media [107]. Therefore, for instance, analytical determi-
+nation of the optimum parameters of an AR structure for a given PC composed of layers described by
+a matrix $\hat{\xi}$ is not possible. However, Lawrence et al. derived equations corresponding to the Fresnel
+formulas (2.9) involving the generalised immittances of two adjacent gratings, and showed that the im-
+mittance matrix of typical gratings can be truncated to $5 \times 5$ elements or less without a substantial loss in
+accuracy. Since numerical calculations involving such small matrices are very fast, it becomes feasible
+to design optimum AR gratings by performing a full scan of the available parameter space. Example AR
+structures presented in ref. 107 include, for instance, a relatively wide-band AR coating of a superprism-
+type PC at a frequency where multiple propagative diffraction orders exist in the adjacent dielectric. A
+slight limitation of the approach of Lawrence et al. is that the generalised immittance has only been
+defined for 2D gratings symmetrical with respect to a two-fold rotation axis parallel to the direction of
+invariance. Therefore, it does not cover, for instance, triangular or trapezoidal gratings.
+All the AR structures discussed so far are relatively compact, with thickness rarely exceeding one
+or two lattice constants of the underlying PC. Some authors have advocated sacrificing compactness in
+favour of potentially larger frequency and angular tolerance offered by thick stacks of gratings, whose
+geometry changes gradually so as to ensure a smooth transition of the electromagnetic field of the in-
+cident plane wave towards the Bloch mode of the semi-infinite PC. Several design principles for such
+gratings have been proposed [108, 109]. In this work, we shall focus on compact AR structures, and
+therefore we do not consider adiabatic AR gratings in detail.
+3.3 Design procedure
+We shall now present an alternative method of designing AR gratings for PCs. Compared to the ap-
+proaches reviewed in subsection 3.2.2, it has the following distinguishing features:
+1. Instead of performing a potentially time-consuming global scan of possible geometries, we use an
+effective-medium model of PCs to calculate analytically the geometrical parameters of a “tenta-
+tive” AR grating; then, if necessary, these parameters are refined with a numerical local-minimisa-
+tion procedure. The end result of our procedure is a trapezoidal AR grating.
+2. The resulting AR structures have good angular tolerance, which in some important applications
+of PCs is more significant than the frequency tolerance. For instance, the quality of the image
+produced by a PC flat lens with effective refractive index $n \approx -1$ depends in the first place on
+the angular range of incident propagative plane waves which are transmitted through the lens with
+little or no energy loss. On the other hand, frequency tolerance is not vital since $n$ can be close
+to $-1$ only in a narrow frequency band.
+We draw on the results of Raguin and Morris [92], who demonstrated that triangular and trapezoidal
+gratings allow a significant reduction of reflectance at interfaces between homogeneous media in a wide
+range of incidence angles. Let us now proceed to detailing the three constituent steps of the algorithm.
+Step 1 We begin by using the classical theory of AR coatings to calculate the refractive index and
+thickness of a single-layer coating that should minimise the reflection from the PC surface at a fixed
+angle of incidence $\theta$ and frequency $\omega$. The value of $\theta$ should lie approximately midway in the desired
+angular operation range of the final AR structure.
+Consider the system shown in fig. 3.3, in which a propagative plane wave with frequency $\omega = ck_0$
+and wave vector $\vec{k}_1 = (k_x, k_{z1}) = (n_1 k_0 \sin\theta, n_1 k_0 \cos\theta)$ impinges from the dielectric 1 with refractive
+3.3. Design procedure 49
+z
+medium 3
+d2 medium 2
+n2
+E 
+medium 1
+k1
+n1
+x
+Figure 3.3 System considered in step 1 of the AR grating design procedure.
+index n1 on the surface of the homogeneous film 2 with thickness d2 and refractive index n2 coating the
+PC 3. Let us assume that medium 2 supports exactly one propagative diffraction order and is sufficiently
+thick for all the evanescent orders reflected from the PC surface to vanish at the interface between media
+1 and 2. We can calculate the total amplitude of the reflected plane wave, $r$, by summing up all the
+multiple reflections occurring in the system:
+$$
+r = r_{12} + t_{12}\Phi r_{23}\Phi \Bigl[\sum_{n=0}^{\infty} (r_{21}\Phi r_{23}\Phi)^n\Bigr] t_{21} = \frac{r_{12} + (t_{12}t_{21} - r_{12}r_{21})\, r_{23}\Phi^2}{1 - r_{21}r_{23}\Phi^2}, \tag{3.1}
+$$
+where $r_{ij}$ and $t_{ij}$ denote the amplitudes of the waves reflected from the interface between media $i$ and $j$
+and transmitted through it, respectively, and $\Phi \equiv e^{i k_{z2} d_2}$ with $k_{z2} \equiv (n_2^2 k_0^2 - k_x^2)^{1/2}$. From Fresnel’s
+formulas [cf. (2.9)]
+j  i 2
+rij =
+j
+C ; tij = C (3.2)j i j i
+it immediately follows that $r_{21} = -r_{12}$ and $t_{12}t_{21} - r_{12}r_{21} = 1$, hence
+$$
+r = \frac{r_{12} + r_{23}\Phi^2}{1 + r_{12}r_{23}\Phi^2}. \tag{3.3} $$
+The parameters of the antireflection coating, $n_2$ and $d_2$, can now be obtained by requiring the numerator
+of the fraction in the above equation to vanish. If the coating is lossless, so that $|\Phi| = 1$, the numerator
+vanishes if and only if (i) the moduli of $r_{12}$ and $r_{23}$ are equal and (ii) the thickness $d_2$ is such that
+$$\arg r_{23} + 2k_{z2}d_2 = \arg r_{12} + (2m + 1)\pi, \tag{3.4}$$
+where $m \in \mathbb{Z}$ and $\arg z$ stands for the argument of the complex number $z$. Solving for $d_2$, we get
+$$
+d_2 = \frac{\arg r_{12} - \arg r_{23} + (2m + 1)\pi}{2k_{z2}}. \tag{3.5}
+$$
+It is usually best to choose the value of m corresponding to the smallest positive admissible value of d2;
+otherwise, internal resonances in the coating layer can spoil its antireflective properties for some angles
+of incidence.
+50 Chapter 3. Antireflection gratings for photonic crystals
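+We shall now use condition (i) to determine the refractive index $n_2$ of the AR coating. Substituting
+Fresnel’s formulas (3.2) into the condition $|r_{12}|^2 = |r_{23}|^2$, we obtain
+$$
+\frac{(\xi_2 - \xi_1)^2}{(\xi_2 + \xi_1)^2} =
+\frac{(\xi_3 - \xi_2)(\xi_3^* - \xi_2)}{(\xi_3 + \xi_2)(\xi_3^* + \xi_2)}. \tag{3.6}
+$$
+Straightforward algebra leads to
+$$\xi_2^2 = \xi_1^2\, \frac{-\operatorname{Re}\xi_3 + |\xi_3|^2/\xi_1}{\operatorname{Re}\xi_3 - \xi_1}. \tag{3.7}$$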
+The s- and p-polarisation cases now need to be considered separately. Assuming materials 1 and 2 to be
+nonmagnetic ($\mu_1 = \mu_2 = 1$), in the s-polarisation case we have $\xi_2 = Z_2$ and eq. (2.5) gives
+$$
+Z_2 = \frac{k_0}{k_{z2}} = \frac{k_0}{\sqrt{n_2^2 k_0^2 - n_1^2 k_0^2 \sin^2\theta}}, \tag{3.8}
+$$
+hence
+$$
+n_2^2 = n_1^2 \sin^2\theta + \frac{1}{Z_2^2}. \tag{3.9} $$
+It can be seen that $Z_2^2$ must be non-negative in order that $k_{z2}$ be real, as we have assumed.
+For p polarisation, $\xi_2 = Y_2$ and eq. (2.8) yields
+$$
+Y_2 = \frac{n_2^2 k_0}{k_{z2}} =
+\frac{n_2^2 k_0}{\sqrt{n_2^2 k_0^2 - n_1^2 k_0^2 \sin^2\theta}}.
+\tag{3.10}
+$$
+This leads to the quadratic equation for $n_2^2$,
+$$n_2^4 - Y_2^2 n_2^2 + Y_2^2 n_1^2 \sin^2\theta = 0, \tag{3.11}$$
+which has real solutions
+$$
+n_2^2 = \frac{1}{2} \Bigl( Y_2^2 \pm \sqrt{Y_2^4 - 4Y_2^2 n_1^2 \sin^2\theta} \Bigr) \tag{3.12} $$
+provided that $Y_2^4 - 4Y_2^2 n_1^2 \sin^2\theta \ge 0$. It can be shown that this condition, together with the condition of
+real-valuedness of $k_{z2}$ [for both solutions of eq. (3.12)], is fulfilled if and only if
+$$Y_2^2 \ge 4n_1^2 \sin^2\theta. \tag{3.13}$$
+In practice, there are further constraints on the choice of the constituent material of the coating. Other
+experimental issues aside, $n_2$ is bounded from below by the refractive index of air, and from above, by
+the index at which a second propagative diffraction order appears at the given value of $k_x$. We shall now
+show how such constraints of the general form
+$$n_{\min}^2 \le n_2^2 \le n_{\max}^2 \tag{3.14}$$
+can be transformed into equivalent constraints on the immittance of the PC, $\xi_3$.
+We begin by noting that the conditions (3.14) can always be rewritten in the form
+$$\xi_{\min}^2 \le \xi_2^2 \le \xi_{\max}^2 \tag{3.15}$$
+3.3. Design procedure 51
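+$$
+\begin{array}{lcc}
+\hline
+\text{Range of } n_{\min}^2,\ n_{\max}^2 \text{ and } n_x^2 & Y_{\min}^2 & Y_{\max}^2 \\
+\hline
+0 < n_x^2 \le \tfrac{1}{2} n_{\min}^2
+  & \dfrac{n_{\min}^4}{n_{\min}^2 - n_x^2}
+  & \dfrac{n_{\max}^4}{n_{\max}^2 - n_x^2} \\
+\tfrac{1}{2} n_{\min}^2 < n_x^2 < n_{\min}^2,\quad n_{\max}^2 \le 2n_x^2
+  & \dfrac{n_{\max}^4}{n_{\max}^2 - n_x^2}
+  & \dfrac{n_{\min}^4}{n_{\min}^2 - n_x^2} \\
+\tfrac{1}{2} n_{\min}^2 < n_x^2 < n_{\min}^2,\quad 2n_x^2 < n_{\max}^2 \le \dfrac{n_{\min}^2 n_x^2}{n_{\min}^2 - n_x^2}
+  & 4n_x^2
+  & \dfrac{n_{\min}^4}{n_{\min}^2 - n_x^2} \\
+\tfrac{1}{2} n_{\min}^2 < n_x^2 < n_{\min}^2,\quad \dfrac{n_{\min}^2 n_x^2}{n_{\min}^2 - n_x^2} < n_{\max}^2
+  & 4n_x^2
+  & \dfrac{n_{\max}^4}{n_{\max}^2 - n_x^2} \\
+n_{\min}^2 \le n_x^2 < n_{\max}^2 \le 2n_x^2
+  & \dfrac{n_{\max}^4}{n_{\max}^2 - n_x^2}
+  & \infty \\
+n_{\min}^2 \le n_x^2,\quad 2n_x^2 < n_{\max}^2
+  & 4n_x^2
+  & \infty \\
+\hline
+\end{array}
+$$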
+Table 3.1 Minimum and maximum bounds on $Y_2^2$ sufficient and necessary for fulfilment of the condition (3.14)
+together with the constraint (3.13) for at least one of the solutions (3.12) of eq. (3.11). The symbol $n_x^2$ denotes
+$n_1^2 \sin^2\theta$.
+with appropriate $\xi_{\min}$ and $\xi_{\max}$. Specifically, for s polarisation, the formulas for $Z_{\min}^2$ and $Z_{\max}^2$
+follow readily from eq. (3.9):
+$$
+Z_{\min}^2 = \frac{1}{n_{\max}^2 - n_1^2 \sin^2\theta}, \qquad Z_{\max}^2 = \frac{1}{n_{\min}^2 - n_1^2 \sin^2\theta}. \tag{3.16}
+$$
+For p polarisation, due to the more complex form of eq. (3.12) and the presence of the supplementary
+condition (3.13), several cases must be considered. The final formulas for $Y_{\min}^2$ and $Y_{\max}^2$ are given in
+table 3.1.
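+To arrive at the form of the constraints on $\xi_3$, we substitute eq. (3.7) into inequality (3.15) and
+introduce reduced immittances $\tilde{\xi}_i \equiv \xi_i/\xi_1$ ($i = 3$, min, max), obtaining
+$$
+\tilde{\xi}_{\min}^2 \le \frac{-\operatorname{Re}\tilde{\xi}_3 + |\tilde{\xi}_3|^2}{\operatorname{Re}\tilde{\xi}_3 - 1} \le \tilde{\xi}_{\max}^2. \tag{3.17}
+$$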
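+This expression can be rewritten as
+$$
+\biggl\{ \biggl[ \operatorname{Re}\tilde{\xi}_3 - \frac{1 + \tilde{\xi}_{\min}^2}{2} \biggr]^2 + (\operatorname{Im}\tilde{\xi}_3)^2 - \biggl( \frac{1 - \tilde{\xi}_{\min}^2}{2} \biggr)^2 \biggr\} (\operatorname{Re}\tilde{\xi}_3 - 1) \ge 0, \tag{3.18a}
+$$
+$$
+\biggl\{ \biggl[ \operatorname{Re}\tilde{\xi}_3 - \frac{1 + \tilde{\xi}_{\max}^2}{2} \biggr]^2 + (\operatorname{Im}\tilde{\xi}_3)^2 - \biggl( \frac{1 - \tilde{\xi}_{\max}^2}{2} \biggr)^2 \biggr\} (\operatorname{Re}\tilde{\xi}_3 - 1) \le 0. \tag{3.18b}
+$$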
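+It follows that the constraints (3.14) are equivalent to the following conditions on $\tilde{\xi}_3$:
+$$\begin{aligned} &(\tilde{\xi}_3 \in \operatorname{ext} P \text{ and } \tilde{\xi}_3 \in \overline{\operatorname{ext}}\, C_{\min} \text{ and } \tilde{\xi}_3 \in \overline{\operatorname{int}}\, C_{\max}) \\
+&\text{or } (\tilde{\xi}_3 \in \operatorname{int} P \text{ and } \tilde{\xi}_3 \in \overline{\operatorname{int}}\, C_{\min} \text{ and } \tilde{\xi}_3 \in \overline{\operatorname{ext}}\, C_{\max}), \end{aligned} \tag{3.19}$$
+where $P$ stands for the half-plane $\operatorname{Re}\tilde{\xi}_3 < 1$;
+$C_{\min}$, the circle of radius $\frac{1}{2} |1 - \tilde{\xi}_{\min}^2|$
+centred at $\bigl( \frac{1}{2} (1 + \tilde{\xi}_{\min}^2), 0 \bigr)$; and $C_{\max}$, the circle of radius
+$\frac{1}{2} |1 - \tilde{\xi}_{\max}^2|$ centred at $\bigl( \frac{1}{2} (1 + \tilde{\xi}_{\max}^2), 0 \bigr)$.
+The symbols $\operatorname{int} A$
+and $\operatorname{ext} A$ denote the interior and exterior of a region $A$, and the overbar denotes set closure. Thus, for
+instance, $\overline{\operatorname{int}}\, A$ stands for the interior of the set $A$ together with its boundary.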
+To illustrate various possible geometries of the region of the complex $\tilde{\xi}_3$ plane determined by the
+constraints (3.14) transformed into the form (3.19), fig. 3.4 shows the shape of this region for s polarisa-
+tion and three distinct choices of the parameters $n_{\min}$, $n_{\max}$, $n_1$ and $\theta$.
+52 Chapter 3. Antireflection gratings for photonic crystals
+1
+(a) (b) (c)
+Cmax
+Cmin Cmin Cmin
+Cmax
+0 Cmax
+ 1
+0 1 2 0 1 2 0 1 2 3
+ReZQ Q3 ReZ3 ReZQ 3
+Figure 3.4 Regions of the complex $\tilde{Z}_3$ plane determined by the condition (3.19) equivalent to the constraint
+(3.14) for s polarisation and (a) $n_1 = 1$, $n_{\min} = 1.5$, $n_{\max} = 3$, $\theta = 0$, (b) $n_1 = 1$, $n_{\min} = 1$, $n_{\max} = 3$, $\theta = 30^\circ$, (c)
+$n_1 = 1.5$, $n_{\min} = 1$, $n_{\max} = 3$, $\theta = 0$. The circles $C_{\min}$ and $C_{\max}$ are defined in the text after eq. (3.19); note that
+in the case (b) $C_{\max}$ degenerates into the point $(1, 0)$.
+Step 2 The coating obtained in step 1 is not practical, since its fabrication would call for integration
+of the PC with a completely different solid; moreover, a suitable material with the required value of
+refractive index might not be easily available. However, as noted in subsection 3.2.1, a homogeneous
+thin film can often be replaced without adverse effects by a subwavelength grating. Such a grating could
+be easily etched in the same process as the underlying PC; it would then naturally be composed of the
+same materials as the PC, with permittivities, say, $\epsilon_l$ and $\epsilon_h$ ($\epsilon_l < \epsilon_h$).
+In order to calculate the fill factor of a binary lamellar grating mimicking a layer with refractive
+index $n_2$ obtained in the previous step, one can resort to the classical second-order effective-medium
+theory of gratings due to Rytov, described in ref. 92. According to this theory, the effective permittivity $\tilde{\epsilon}_s$
+of a binary grating with period $a$ and fill factor $f$ ($0 \le f \le 1$), composed of materials with permittivities
+$\epsilon_l$ and $\epsilon_h$, and operating in the s polarisation is
+$$
+\tilde{\epsilon}_s = \bar{\epsilon}_s \biggl[ 1 + \frac{\pi^2}{3}
+  \biggl( \frac{k_0 a}{2\pi} \biggr)^2
+  f^2 (1 - f)^2
+  \frac{(\epsilon_h - \epsilon_l)^2}{\bar{\epsilon}_s}
+\biggr], \tag{3.20}
+$$
+where
+$$\bar{\epsilon}_s = f\epsilon_h + (1 - f)\epsilon_l. \tag{3.21}$$
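+For p polarisation, the effective permittivity $\tilde{\epsilon}_p$ is
+$$
+\tilde{\epsilon}_p = \bar{\epsilon}_p \biggl[ 1 + \frac{\pi^2}{3} \biggl( \frac{k_0 a}{2\pi} \biggr)^2 f^2 (1 - f)^2 (\epsilon_h - \epsilon_l)^2\, \bar{\epsilon}_s \biggl( \frac{\bar{\epsilon}_p}{\epsilon_h \epsilon_l} \biggr)^2 \biggr], \tag{3.22}
+$$
+where
+$$
+\bar{\epsilon}_p = \biggl( \frac{f}{\epsilon_h} + \frac{1 - f}{\epsilon_l} \biggr)^{-1}
+\tag{3.23}
+$$
+and $\bar{\epsilon}_s$ is given by eq. (3.21). Thus, the required fill factor can be obtained by setting $\tilde{\epsilon}_s$ or $\tilde{\epsilon}_p$ to $n_2^2$ in eq.
+(3.20) or (3.22) and solving it numerically for $f$.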
+It should be noted that in the domain of validity of Rytov’s theory (small $k_0 a/2\pi$) the functions $\tilde{\epsilon}_s(f)$
+and $\tilde{\epsilon}_p(f)$ are monotonically increasing from $\epsilon_l$ to $\epsilon_h$. Thus, a binary grating cannot simulate a material
+with permittivity outside the range delimited by the permittivities of the grating’s constituent materials.
+As a result, the bounds $n_{\min}^2$ and $n_{\max}^2$ mentioned in step 1 must fulfil
+$n_{\min}^2 \ge \epsilon_l$ and $n_{\max}^2 \le \epsilon_h$,
+respectively.
+ImZQ 3
+3.4. Examples 53
+0:50
+PC
+air
+0:25
+0:00
+ 0:25
+ 0:50
+ 0:5 0:0 0:5
+kxa=2 
+Figure 3.5 Solid line: EFC of the PC considered in subsection 3.4.1 at frequency $\omega = 0.311 \times 2\pi c/a$ and for
+s polarisation. Dashed line: EFC of air at the same frequency.
+Step 3 The structure obtained at this stage should, in principle, ensure low reflectance for incidence
+angles close to $\theta$. Nevertheless, owing to the applied approximations—neglect of higher diffraction
+orders excited by the PC and the AR grating—its geometrical parameters might not be precisely optimal.
+In addition, it is well known [91, 92] that trapezoidal and triangular AR gratings have larger angular
+and frequency tolerance than lamellar ones. Therefore, it is advisable to apply a numerical optimisation
+procedure to adjust the geometry of the grating, described by some small number of parameters, so as
+to minimise a given objective function $\eta$. The geometry obtained in step 2 can be expected to provide a
+good starting point for a local search algorithm, such as the Nelder-Mead simplex method [110, section
+10.4].
+3.4 Examples
+3.4.1 A photonic-crystal flat lens
+Preliminaries The first PC we shall consider is a hexagonal lattice of air holes of radius $r = 0.365a$,
+where $a$ is the lattice constant, etched in a dielectric matrix of permittivity $\epsilon = 10.6$. These parameters
+correspond to the structure whose fabrication was reported in ref. 18. For s polarisation, at frequency
+$\omega = 0.311 \times 2\pi c/a$, the effective refractive index $n = -1$ can be attributed to the crystal, since its
+EFC takes an approximately circular shape (fig. 3.5) with radius $K \approx \omega/c$ and group velocity directed
+inwards. (Unless otherwise noted, all calculations whose results are presented in this subsection have
+been made with the differential method [69, 74–76].)
+Veselago [20] predicted that a slab of material with $n = -1$ should act as a flat lens: an image of
+an object placed near one of the surfaces of the slab should be produced on the other side of the slab.
+Figure 3.6 shows the map of the modulus of the electric field generated by a wire source with current
+1 A (ampere) located above a slab of the PC in question.† The parts (a) and (b) refer to slabs truncated
+in the ways shown in figs. 3.7(a) and (b), respectively; from now on, these two structures will be referred
+to as S1 and S2. In accordance with the theoretical predictions, images are formed below the slabs.
+† The field maps shown in figs. 3.6 and 3.12 have been produced with the finite-element method using the RF module of
+the COMSOL program. The computational domains were rectangles of width $55a$ and height $30a$ surrounded by perfectly
+matched layers of thickness $3a$. The meshes consisted of about 225,000 second-order triangular Lagrangian elements
+of maximum size $0.2a$ (refined further in the neighbourhood of the point source). Numerical convergence was tested by
+comparing the results of a representative calculation against those obtained after refining the mesh by dividing each element
+into four. This produced no visible changes in the field map and the maximum amplitude of the image produced by the
+lens changed by less than 1%.
+kza=2 
+54 Chapter 3. Antireflection gratings for photonic crystals
+200
+(a)
+10
+150
+0 100
+50
+ 10
+0
+200
+(b)
+10
+150
+0 100
+50
+ 10
+0
+ 20  10 0 10 20
+x=a
+Figure 3.6 Modulus of the electric field generated by an s-polarised wire source with current 1 A located above
+a slab of the PC studied in subsection 3.4.1 truncated along a plane (a) lying midway between two neighbouring
+rows of holes, (b) crossing the centres of holes.
+However, their amplitude is low (67 and 79 V/m for structures S1 and S2, respectively) and intense
+beams reflected from the top of the lenses are visible in the upper part of the plots. This suggests that
+only a small fraction of energy is transmitted through the lenses. Indeed, as shown in fig. 3.7(c), the
+reflectance of structure S1, $|r_0(\theta)|^2$, where $r_0$ is the specular reflection coefficient, exceeds 29% for all
+angles of incidence. Structure S2 performs better for low incidence angles, but degrades quickly with
+increasing $\theta$. We shall now apply the algorithm presented in section 3.3 to design an AR grating for
+this PC.
+Step 1 We have seen in section 2.4 that the effective-medium model of PCs tends to be more accurate
+for crystals truncated along a plane with constant permittivity profile, as is the case, for instance, for
+structure S1. Therefore in the first step of the design procedure we shall calculate the effective transverse
+impedance $Z_3$ of this structure. We consider two ways of obtaining this quantity. First, we calculate it
+from eq. (2.23), derived in the framework of the model presented in chapter 2. At frequency $\omega = 0.311 \times 2\pi c/a$
+and angle of incidence $\theta = 45^\circ$ (corresponding to $k_x = 0.220 \times 2\pi/a$) we get $Z_1 = 1.414$ and
+$Z_3 = 0.319$. We should now check whether $\tilde{Z}_3 \equiv Z_3/Z_1 = 0.225$ lies within the region determined by
+the conditions (3.19) equivalent to the constraints (3.14) with $n_{\min} = 1$ and $n_{\max} = 2.51$ (the maximum
+index of a medium in which only a single propagative diffraction order exists). Figure 3.8, in which
+z=a z=a
+jEy j (V=m) jEy j (V=m)
+3.4. Examples 55
+1:00
+S1
+0:75 S2
+0:50
+(a) S1
+0:25
+0:00
+0 30 60 90
+Angle of incidence  (deg)
+(b) S2
+(c)
+Figure 3.7 Geometry of the PC studied in subsection 3.4.1 truncated along a plane (a) lying midway between
+two neighbouring rows of holes, (b) crossing the centres of holes. (c) Angular dependence of the reflectance of
+the structures shown in parts (a) and (b).
+1
+Cmin
+B
+0 C
+A max
+ 1
+0 1 2
+ReZQ 3
+Figure 3.8 Shaded circle: region of the complex $\tilde{Z}_3$ plane determined by the condition (3.19) equivalent to the
+constraint (3.14) for s polarisation, $n_1 = n_{\min} = 1$ and $n_{\max} = 2.51$. Points A and B: reduced impedances $\tilde{Z}_3$ of
+structure S1 calculated in two different ways described in the text.
+the value of $\tilde{Z}_3$ cited above is marked with point A, shows that this is indeed the case. Therefore eqs.
+(3.5) and (3.9) can be used to calculate the parameters of the AR coating of the crystal: refractive index
+$n_2 = 1.649$ and thickness $d_2 = 0.540a$. The geometry of this structure, called S3 from now on, is shown
+in fig. 3.9(a) and its reflectance is plotted in fig. 3.9(e) with a solid black line. It can be seen that the
+application of the coating reduces significantly the reflectance of the crystal, especially for small angles
+of incidence. However, the parameters of S3 are certainly not optimal, since its reflectance at the “design
+angle” $\theta = 45^\circ$ is as large as 9%. This is due to the relatively large error introduced by the single-mode
+approximation for negative-refraction PC bands, as pointed out in chapter 2.
+We shall evaluate, therefore, an alternative method of obtaining $Z_3$, which consists in calculating
+it directly from the rigorous specular reflection coefficient $r_0$ of the uncoated crystal at the chosen $\omega$
+and $k_x$. In other words, we assume that $r_0$ can be expressed in the form $r_0 = (Z_3 - Z_1)/(Z_3 + Z_1)$ [cf.
+eq. (3.2)] and invert this formula to obtain $Z_3 = Z_1 (1 + r_0)/(1 - r_0)$. Of course, the effective impedance
+defined in this way depends on the material properties of medium 1. Nevertheless, at least for the PC in
+question, this dependence is weak for sufficiently small $n_1$: we obtain $Z_3 = 0.258 + 0.175i$ for $n_1 = 1$
+and the effective impedance does not change by more than 10% up to $n_1 = 2.25$. As shown in fig. 3.8, the
+reduced impedance $\tilde{Z}_3 = 0.182 + 0.124i$ corresponding to the above value of $Z_3$ (marked with point B)
+also lies within the allowed region of the $\tilde{Z}_3$ plane. Taking this value of $Z_3$, from eqs. (3.5) and (3.9)
+ImZQ 3
+Reflectance jr j20
+56 Chapter 3. Antireflection gratings for photonic crystals
+n2 = 1:649
+d2 = 0:540a
+(a) S3
+1:00
+S3
+n2 = 1:884 0:75 S4
+d2 = 0:565a S5
+0:50 S6
+(b) S4
+0:25
+f = 0:192 0:00
+d 0 30 60 902 = 0:565a
+Angle of incidence  (deg)
+(c) S5
+(e)
+f = 0:192
+d2 = 0:565a
+(d) S6
+Figure 3.9 (a)–(b) Geometry of AR coatings S3 and S4, characterised by refractive index n2 and thickness d2
+specified next to the drawings. (c)–(d) Geometry of binary lamellar AR gratings S5 and S6, characterised by
+fill factor f and thickness d2 specified next to the drawings. (e) Angular dependence of the reflectance of the
+structures shown in parts (a)–(d).
+we get $n_2 = 1.884$ and $d_2 = 0.565a$. The angular dependence of the reflectance of the PC covered with
+this coating, shown in fig. 3.9(b) and called S4 in the following, is plotted in fig. 3.9(e) with a solid grey
+line. It is evident that this structure has much better angular tolerance than S3; moreover, its reflectance
+at $\theta = 45^\circ$ is only 0.05%. Therefore we choose S4 as a basis for the further steps of the algorithm.
+Step 2 Numerical inversion of eq. (3.20) gives the fill factor $f = 0.192$ of the binary grating mimick-
+ing a medium with $n = 1.884$. Since we would like the angular dependence of $r_0$ to be symmetric with
+respect to $\theta = 0$, the grating should be positioned so as to preserve the vertical mirror symmetry axes of
+the underlying PC. This can be done in two possible ways, shown in figs. 3.9(c) and (d). The reflectance
+of these two structures, called S5 and S6, is plotted in fig. 3.9(e). Clearly, grating S5 reproduces fairly
+faithfully the original reflectance curve of the AR coating S4. On the other hand, grating S6 behaves
+better in the high-$\theta$ region.
+Step 3 The lamellar gratings obtained in step 2 already provide a remarkable improvement over the
+uncoated PC and, in contrast to the AR coatings from step 1, should be manufacturable. Nevertheless,
+their geometry can be further ameliorated. To this end, as mentioned in the last paragraph of section 3.3,
+we use the Nelder-Mead simplex algorithm to find the optimum values of the dimensions $w_i$, $w_o$, $h_i$, and
+$h_o$ parametrising the trapezoidal grating shown in fig. 3.10. The objective function $\eta$ is defined as the
+average of the numerically calculated reflectance of the given structure over the desired angular tolerance
+Reflectance jr j20
+3.4. Examples 57
+a
+p
+a 3=4
+hi
+ho
+wo
+wi
+Figure 3.10 Definition of the geometrical parameters wi, wo, hi, and ho of a trapezoidal grating superposed on
+the surface of structure S1.
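+interval $[\theta_{\min}, \theta_{\max}]$,
+$$
+\eta = \frac{1}{\theta_{\max} - \theta_{\min}} \int_{\theta_{\min}}^{\theta_{\max}} |r_0(\theta)|^2 \,\mathrm{d}\theta.
+\tag{3.24}
+$$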
+The integral in eq. (3.24) is calculated with the 20-point Gauss-Legendre quadrature algorithm [110,
+section 4.5], whose typical relative accuracy, $10^{-5}$, is better than that of the reflectance calculations,
+$10^{-3}$. The initial shape of the grating is taken to correspond to one of the lamellar gratings obtained in
+step 2, i.e., $w_i = w_o = fa$, $h_i = 0$, and $h_o = d_2$. The search routine is terminated when the size of the
+simplex, defined as the average distance of its vertices from its geometric centre, falls below $10^{-5}$. The
+final values of the geometrical parameters of the grating are determined by selecting the best among the
+16 structures obtained by rounding each of the parameters delivered by the simplex algorithm upwards
+or downwards to a multiple of $0.01a$.
+Application of this procedure with $\theta_{\min} = 0^\circ$, $\theta_{\max} = 90^\circ$ to grating S5 yields grating S7 shown in
+fig. 3.11(a). The plot in fig. 3.11(e) (solid black line) demonstrates the excellent antireflective properties
+of this structure (note the scale of the vertical axis). Its average reflectance is as low as 2.8%; in fact,
+$|r_0(\theta)|^2$ does not exceed 5.5% until $\theta = 87^\circ$. The structure does not seem to present special fabrication
+difficulties—e.g., acute angles—except possibly for the relatively thin dielectric veins separating the
+circular holes from the surface. Should this pose a real experimental difficulty, one can increase the
+value of $h_i$ at the expense of a slight performance deterioration. For example, grating S8 with $h_i = 0.08a$
+has average reflectance of 4.8%.
+Figure 3.12 shows the map of the modulus of the electric field produced by a point source placed
+above a PC slab coated with AR gratings of type S7 from above and below. The comparison with fig. 3.6
+reveals the significant improvement brought about by the AR grating: not only are the reflected beams
+prominent in the upper part of the latter figure suppressed, but the amplitude of the image formed by the
+lens grows to 159 V/m, which is two times better than in the situation from fig. 3.6(b).
+Optimisation of structure S6 leads to gratings with average reflectance comparable to that of S7 and
+S8 but composed of “narrower” trapezoids ($w_i + w_o \approx 0.2a$), thus less suitable for fabrication. Therefore
+we omit the detailed discussion of these structures.
+Other structures In refs. 111 and 112 two other trapezoidal AR gratings, here denoted S9 and S10,
+were presented. Their geometrical parameters, shown in figs. 3.11(c) and (d), were obtained by minimis-
+58 Chapter 3. Antireflection gratings for photonic crystals
+wi = 0:40a
+wo = 0:16a
+hi = 0:05a
+ho = 0:55a
+(a) S7
+0:20
+wi = 0:28a S7
+wo = 0:28a 0:15 S8
+hi = 0:08a S9
+ho = 0:50a 0:10 S10
+(b) S8
+0:05
+wi = 0:50a
+wo = 0 0:00
+hi = 0:01a 0 30 60 90
+ho = 0:69a Angle of incidence  (deg)
+(c) S9
+(e)
+wi = 0:29a
+wo = 0:22a
+hi = 0:08a
+ho = 0:53a
+(d) S10
+Figure 3.11 (a)–(d) Geometry of AR gratings S7–S10 characterised by parameters $w_i$, $w_o$, $h_i$, and $h_o$ specified
+next to the drawings. (e) Angular dependence of the reflectance of the structures shown in parts (a)–(d). To help
+visualise the details of the $|r_0(\theta)|^2$ dependence, the y axis has been truncated at $|r_0|^2 = 0.2$.
+200
+10
+150
+0 100
+50
+ 10
+0
+ 20  10 0 10 20
+x=a
+Figure 3.12 Modulus of the electric field generated by an s-polarised wire source with current 1 A located above
+a slab of the PC studied in subsection 3.4.1 with S7-type gratings placed on its horizontal surfaces.
+z=a
+Reflectance jr j20
+jEy j (V=m)
+3.4. Examples 59
+$\theta_{\max}$ | $w_i$ | $w_o$ | $h_i$ | $h_o$
+$90^\circ$ | $0.378$–$0.424a$ (22 nm) | $0.151$–$0.170a$ (9 nm) | $0.045$–$0.055a$ (5 nm) | $0.543$–$0.557a$ (7 nm)
+$80^\circ$ | $0.330$–$0.463a$ (63 nm) | $0.132$–$0.186a$ (26 nm) | $0.033$–$0.062a$ (14 nm) | $0.530$–$0.569a$ (19 nm)
+$60^\circ$ | $0.192$–$0.533a$ (162 nm) | $0.084$–$0.208a$ (59 nm) | $0$–$0.082a$ (39 nm) | $0.497$–$0.586a$ (42 nm)
+Table 3.2 Ranges of geometrical parameters of grating S7 for which its average reflectance at frequency $0.311 \times 2\pi c/a$
+in the angular range $0 \le \theta \le \theta_{\max}$ does not exceed 5%. The numbers in parentheses are the lengths of the
+tolerance intervals for $a = 476$ nm, which corresponds to operation wavelength $\lambda = a/0.311 = 1530$ nm. Note that
+the tolerance intervals correspond to perturbations of one parameter at a time (not all parameters simultaneously).
+ing the objective function
+$\frac{2}{\pi} \int_0^{\pi/2} |r_0(\theta)| \,\mathrm{d}\theta$ (average modulus of the specular reflection coefficient $r_0$)
+calculated with a less accurate quadrature algorithm. The average reflectance of structure S9 in the full
+$0^\circ$–$90^\circ$ range, 2.8%, matches that of S7; in a more restricted range, say, $0^\circ$–$80^\circ$, the performance of
+grating S9 is even slightly better. Nonetheless, its disadvantage lies in the presence of very thin dielectric
+veins at the surface. Grating S10, with $h_i = 0.08a$, is devoid of this problem. However, it is superseded
+by structure S8 with identical $h_i$, which has somewhat lower average reflectance.
+Tolerance to fabrication imperfections A fabrication process invariably perturbs the geometrical
+parameters of the manufactured structure. To assess the sensitivity of the proposed gratings to fabrication
+errors, we have determined the maximum perturbation of each of the four geometrical parameters of
+grating S7 for which the grating’s average reflectance in the angular range $0 \le \theta \le \theta_{\max}$ did not exceed
+5%. Three values of $\theta_{\max}$ were considered: $90^\circ$, $80^\circ$, and $60^\circ$. The results of this test are summarised
+in table 3.2. It can be seen that the grating is more sensitive to variations of the height of the trapezoids
+(via the $h_o$ and $h_i$ parameters) than of their width ($w_o$ and $w_i$). The constraints for $\theta_{\max} = 90^\circ$ and
+$\theta_{\max} = 80^\circ$ are rather stringent and unlikely to be met in practice. In contrast, fabrication of a structure
+satisfying the constraints for $\theta_{\max} = 60^\circ$ seems well within reach of current technology.
+We have also tested the frequency tolerance of grating S7, finding that its average reflectance stays
+below 5% for $0.3094 \le \omega a/2\pi c \le 0.3113$ ($\theta_{\max} = 90^\circ$), $0.3048 \le \omega a/2\pi c \le 0.3122$ ($\theta_{\max} = 80^\circ$),
+and $0.2511 \le \omega a/2\pi c \le 0.3173$ ($\theta_{\max} = 60^\circ$). This tolerance seems quite sufficient for applications
+related to lensing.
+3.4.2 A supercollimating photonic crystal
+Preliminaries The second example to be considered is a PC composed of a square lattice of air
+holes of radius $r = 0.3a$, where $a$ is the lattice constant, etched in a dielectric matrix of permittivity
+$\epsilon = 12.25$. Near the frequency $\omega = 0.265 \times 2\pi c/a$ its EFCs for p polarisation take a square-like
+shape (cf. fig. 3.13). In consequence, supercollimated beams [16, 113] can propagate in the crystal.
+All calculations reported in this subsection have been made with a frequency-domain finite-difference
+method with subpixel smoothing implemented along the lines of ref. 114.
+Figure 3.14(c) shows the angular dependence of the reflectance of this PC at $\omega = 0.265 \times 2\pi c/a$;
+two different truncation planes, shown in figs. 3.14(a)–(b) and called S11 and S12 in the following, are
+considered. It is seen that the crystal cut through hole centres has fairly low reflectance: about 10% at
+normal incidence and decreasing for larger angles up to $\theta \approx 65^\circ$. This level of power losses might in
+fact be already sufficient for practical applications. Nevertheless, for the sake of illustration, we shall
+present the design procedure of AR gratings that help to decrease even further the reflectance of the PC
+in question.
+60 Chapter 3. Antireflection gratings for photonic crystals
+0:50
+0:25
+0:00
+ 0:25
+ 0:50
+ 0:5 0:0 0:5
+kxa=2 
+Figure 3.13 EFC of the PC studied in subsection 3.4.2 at frequency $\omega = 0.265 \times 2\pi c/a$. The shaded region
+corresponds to the range $\theta \le 45^\circ$ ($|k_x| \le 0.187 \times 2\pi/a$), where the EFC is approximately flat and for which the
+minimisation of the PC’s reflectance is made.
+1:00
+S11
+0:75 S12
+0:50
+(a) S11
+0:25
+0:00
+0 30 60 90
+Angle of incidence  (deg)
+(b) S12
+(c)
+Figure 3.14 Geometry of the PC studied in subsection 3.4.2 truncated along a plane (a) lying midway between
+two neighbouring rows of holes, (b) crossing the centres of holes. (c) Angular dependence of the reflectance of
+the structures shown in parts (a) and (b).
+Step 1 We are mostly interested in coupling the incoming light to modes lying on the flat horizontal
+part of the PC’s EFC. As shown in fig. 3.13, at frequency $\omega = 0.265 \times 2\pi c/a$ this corresponds roughly
+to the range $|\theta| \le 45^\circ$, i.e., $|k_x| \le 0.187 \times 2\pi/a$. Therefore we choose $\theta = 22.5^\circ$ as the design
+angle of the AR coating. As in the previous subsection, we test two different ways of calculating the
+effective immittance (in this case, admittance) of the crystal cut along a constant-permittivity plane, i.e.,
+structure S11. The effective-medium model presented in chapter 2 yields $Y_3 = 6.138$. In turn, the
+effective admittance calculated from the rigorous reflection coefficient of structure S11 embedded in air
+is $Y_3 = 6.075 - 1.191i$. Figure 3.15 shows that the reduced admittances corresponding to both these
+values lie within the region of the complex $\tilde{Y}_3$ plane determined by the conditions (3.19) equivalent to
+the constraints (3.14) with $n_1 = n_{\min} = 1$, $n_{\max} = 3.391$ (the refractive index for which the second
+propagative diffraction order appears) and $\theta = 22.5^\circ$. The parameters of the AR coatings determined
+from these two values of $Y_3$ are ($n_2 = 2.548$, $d_2 = 0.374a$) and ($n_2 = 2.595$, $d_2 = 0.391a$), respectively.
+Figure 3.16 shows the geometry of these coatings, henceforth referred to as S13 and S14, and the angular
+dependence of their reflectance. As in the PC lens case, the AR coating S14 designed using the value of
+$Y_3$ obtained from the rigorous reflection coefficient of the crystal performs slightly better than the other
+one. Therefore structure S14 shall be used in the subsequent design step.
+kza=2 
+Reflectance jr j20
+3.4. Examples 61
+5 Cmax
+0 Cmin A
+B
+ 5
+0 5 10
+ReYQ3
+Figure 3.15 Shaded circle: region of the complex $\tilde{Y}_3$ plane determined by the condition (3.19) equivalent to the
+constraint (3.14) for p polarisation, $n_1 = n_{\min} = 1$ and $n_{\max} = 3.391$. Points A and B: reduced admittances $\tilde{Y}_3$ of
+structure S11 calculated in two different ways described in the text.
+1:00
+= S13n2 2:548
+0:75 S14
+d2 = 0:374a
+0:50
+(a) S13
+0:25
+n2 = 2:595 0:00
+d = 0:391a 0 30 60 902
+Angle of incidence  (deg)
+(b) S14 (c)
+Figure 3.16 (a)–(b) Geometry of AR coatings S13 and S14, characterised by refractive index n2 and thick-
+ness d2 specified next to the drawings. (c) Angular dependence of the reflectance of the structures shown in parts
+(a) and (b).
+Step 2 From numerical inversion of eq. (3.22) it follows that the fill factor of the binary grating mim-
+icking a medium with $n = 2.595$ for p polarisation is $f = 0.812$. Figures 3.17(a)–(b) show the geometry
+of the two gratings, called S15 and S16, with this fill factor and a mirror symmetry plane perpendicular to
+the direction of periodicity. From the juxtaposition of their reflectance curves [fig. 3.17(d)] it follows that
+structure S15 has somewhat better performance than S16. Incidentally, there is some similarity between
+the geometry of grating S15 and the truncated crystal S12, which also exhibited fairly low reflectance:
+The surface of both these structures contains “teeth” shifted by $\tfrac{1}{2}a$ in the horizontal direction
+with respect to the positions of the circular holes.
+Therefore, one could view the crystal S12 as an imperfect
+realisation of the AR grating S15.
+Step 3 The lamellar grating S15 can be further ameliorated by adjusting its thickness $d_2$ and fill
+factor $f$ to minimise the objective function defined in eq. (3.24).
+We take $\theta_{\min} = 0$, $\theta_{\max} = 45^\circ$ and,
+as before, perform the optimisation with the Nelder-Mead simplex algorithm. This leads to structure S17
+with $d_2 = 0.37a$ and $f = 0.73$, shown in fig. 3.17(c). Its reflectance curve is plotted in fig. 3.17(d) (solid
+line). In the angular range $0 \le \theta \le 45^\circ$, the reflectance never exceeds 0.6%, on average amounting
+to only 0.12%. The structure does not seem to present any special fabrication problems. It is possible
+to continue the grating’s optimisation by allowing it to take a trapezoidal rather than a lamellar shape;
+however, in view of its already very good AR properties, this appears unnecessary.
+ImYQ3
+Reflectance jr j20
+62 Chapter 3. Antireflection gratings for photonic crystals
+f = 0:812
+d2 = 0:391a 1:00
+S15
+(a) S15 0:75 S16
+S17
+0:50
+f = 0:812
+d2 = 0:391a 0:25
+(b) S16 0:00
+0 30 60 90
+Angle of incidence  (deg)
+f = 0:730
+(d)
+d2 = 0:370a
+(c) S17
+Figure 3.17 (a)–(c) Geometry of binary lamellar AR gratings S15, S16 and S17 characterised by fill factor f
+and thickness d2 specified next to the drawings. (d) Angular dependence of the reflectance of the structures shown
+in parts (a)–(c).
+3.4.3 A photonic-crystal superprism
+We have also attempted to design an AR grating for the unidirectional mirror proposed by Vanwolleghem
+et al. [115]. This device, which will be analysed in some more detail in subsection 5.2.3, is a slab of the PC
+shown in fig. 3.18(a). The PC consists of a hexagonal lattice of triples of adjacent circular holes etched
+in a magneto-optical (MO) matrix characterised by a gyrotropic permittivity tensor
+\[
+\hat{\epsilon} = \begin{bmatrix} (2.5)^2 & 0 & 0.1i \\
+0 & (2.5)^2 & 0 \\
+-0.1i & 0 & (2.5)^2 \end{bmatrix}. \tag{3.25}
+\]
+The presence of this MO material lifts the time-reversal symmetry of Maxwell’s equations; the spatial
+inversion symmetry is also broken owing to the particular choice of the motif. As a result, the crystal
+becomes nonreciprocal, i.e., the usual property of the dispersion relation, $\omega(\vec{k}) = \omega(-\vec{k})$ [79, pp. 22–23],
+no longer holds. The p-polarisation EFC of this crystal at frequency $\omega = 0.3915 \times 2\pi c/a$, calculated
+with the method described in section 5.2, is shown in fig. 3.18(b). It can be seen that a plane wave
+impinging at the angle of about 58ı (corresponding to kx   =3a) on the top surface of a slab made
+from this PC will be coupled to its propagative mode, and thus will be partially transmitted. However,
+a wave travelling in the opposite direction, incident from the bottom, will be totally reflected, since the
+crystal has no propagative modes with kx    =3a. This behaviour justifies the name unidirectional
+mirror.
+The problem with the presented device is its large forward loss: even waves propagating in the
+“allowed” direction undergo a significant reflection on the surfaces of the slab. Currently we do not
+have a reliable code allowing to calculate accurately the reflection coefficient of the MO PC from fig.
+3.18(a) in p polarisation. Therefore we shall study instead the non-MO crystal in which the original motif
+composed of three circles is replaced by three overlapping squares, as shown in fig. 3.19(a). The
+permittivity of the matrix is taken as $\epsilon = (2.5)^2$. [This modified geometry is due to K. Postava (Technical
+Reflectance jr j20
+3.5. Conclusions 63
+(b)
+(a) 0:50
+a a 0:25
+r
+0:00
+ 0:25
+ 0:50
+a
+ 0:5 0:0 0:5
+kxa=2 
+Figure 3.18 (a) Geometry of the PC composed of a hexagonal lattice of groups of three adjacent circular holes
+with radius $r = 0.20a$, where $a$ is the lattice constant, etched in a magneto-optical matrix. (b) p-polarisation EFC
+of this crystal at frequency $\omega = 0.3915 \times 2\pi c/a$.
+University of Ostrava, Czech Republic).] The EFC of this crystal at frequency $\omega = 0.4548 \times 2\pi c/a$,
+calculated with the differential method, is shown in fig. 3.19(b). Clearly, its shape in the regions marked
+by dashed circles is similar to that seen in fig. 3.18(b). Fig. 3.19(c) shows a magnification of this EFC
+near its inflection point $k_x = 0.309 \times 2\pi/a$, together with the $k_x$-dependence of the crystal’s reflectance.
+It can be seen that the latter is very high. Therefore, to be useful in practice, the unidirectional mirror
+would need to be coated with some AR structure.
+Unfortunately, the design of an appropriate AR grating using the procedure described in section 3.3
+turns out to be impossible. For instance, at the inflection point of the EFC, the reflection coefficient of
+the uncoated PC is $r_0 = 0.969 - 0.086i$, which corresponds to $\tilde{Y}_3 = 6.50 - 20.5i$. As evidenced by
+fig. 3.19(d), this lies far outside the region of the complex $\tilde{Y}_3$ plane determined by the conditions (3.19)
+equivalent to the constraints (3.14) with $n_1 = n_{\min} = 1$ and $n_{\max} = 1.52$ (the refractive index of the
+least optically dense coating in which the second propagative diffraction order would appear). In fact, if
+we blindly apply eqs. (3.7) and (3.12) to calculate the refractive index of the optimum AR coating, we
+obtain $n_2 = 12.4$ or $0.68$. It is obvious that neither of these indices can be simulated by any binary grating
+composed of the constituent materials of the PC. Therefore, an AR structure for the unidirectional mirror
+will probably need to be designed with some purely numerical method. In particular, Lawrence et al.
+[107] have shown their approach to give good results for a superprism that, uncoated, has an extremely
+high reflectance ($|r_0|^2 = 0.996$).
+3.5 Conclusions
+In this chapter we have presented a new method of designing gratings that, superimposed on surfaces
+of PCs, will minimise their reflectance. The design algorithm consists of three steps. First, the
+parameters of a homogeneous-layer AR coating are calculated from an effective-medium approximation
+of the PC in question. Second, an analytical effective-medium theory of gratings is used to find the
+parameters of a binary lamellar grating composed solely of the constituent materials of the crystal and
+approximating the coating obtained in the previous step. Third, the shape of the grating is refined with
+a numerical local-search routine so as to minimise the reflectance of the structure in the desired angular
+kya=2 
+64 Chapter 3. Antireflection gratings for photonic crystals
+a 0:746a
+(a) (b)
+0:4a 0:50
+0:25
+0:00
+0:3a
+0:4a  0:25
+p
+p 3
+3 a  0:50
+a 2
+2
+truncation plane  0:5 0:0 0:5
+kxa=2 
+1:0 0:60 1:0
+(c) (d)
+0:9 0:55 0:5
+Cmax
+0:8 0:50 0:0 Cmin
+0:7 jr0j2 0:45  0:5
+kza=2 
+0:6 0:40  1:0
+0:250 0:275 0:300 0:325 0:350 0:0 0:5 1:0 1:5 2:0
+kxa=2  ReYQ3
+Figure 3.19 (a) Geometry of the PC composed of a hexagonal lattice of non-centrosymmetric motifs etched
+in a dielectric matrix. (b) p-polarisation EFC of this crystal at frequency $\omega = 0.4548 \times 2\pi c/a$. (c) Solid line:
+$k_x$-dependence of the reflectance $|r_0|^2$ of this crystal, placed in air and truncated in the way indicated in part (a).
+Dashed line: a fragment of the EFC from part (b). (d) Shaded circle: region of the complex $\tilde{Y}_3$ plane determined
+by the condition (3.19) equivalent to the constraint (3.14) for p polarisation, $n_1 = n_{\min} = 1$ and $n_{\max} = 1.52$. The
+reduced admittance of the crystal, $\tilde{Y}_3 = 6.50 - 20.5i$, lies far beyond the range of the graph.
+or frequency range. This last step is necessary owing to the approximations made in the analytical
+derivations used in the first two steps of the procedure.
+This algorithm of AR grating design can be viewed as complementary to the method proposed by
+Lawrence et al. [106, 107]. While their approach is based on an exhaustive scan of the whole parameter
+space (made very efficient by the application of the matrix-valued effective immittance of gratings), ours
+rests on approximate analytical considerations used to find a starting point for a local search procedure.
+In section 3.4 the proposed method has been applied to three example crystals with EFCs of different
+curvature: a supercollimating crystal with a very flat EFC, a crystal exhibiting negative refraction, with
+almost circular EFC, and a PC superprism, whose EFC has a kink. In the two first cases, the design
+process succeeded in producing AR gratings ensuring very low reflectance in a wide angular range.
+The obtained structures are quite compact and apparently rather straightforward to fabricate. In the
+last case, the procedure broke down owing to the violation of the constraints (3.19) on the effective
+immittance of the crystal that must be satisfied in order that the AR coating produced in the first step can
+be approximated with a binary grating made of realistic materials. The existence of these constraints is
+the basic limitation of the presented procedure.
+jr 20j
+kza=2 
+ImYQ3
+kza=2 
+Chapter 4
+Magneto-optical circulators
+4.1 Introduction
+4.1.1 Basic characteristics of isolators and circulators
+This chapter will be devoted to the design of magneto-optical circulators optimised for operation at in-
+frared frequencies in a uniform static external magnetic field (SEMF). Circulators and (closely related)
+isolators are devices widely used both in the optical and microwave domain. Their operation can be
+most easily explained with the formalism of scattering matrices. Consider the junction of waveguides
+$W_1, W_2, \dots, W_n$ shown in fig. 4.1. On any cross-section $P_j$ (called a port) of waveguide $W_j$ located
+sufficiently far from the junction, the field can be represented solely in terms of the waveguide’s prop-
+agative eigenmodes. Let us assume all the waveguides to be single-mode and denote the amplitudes of
+the incoming and outgoing mode of $W_j$ on the port $P_j$ by $s_{j,\mathrm{in}}$ and $s_{j,\mathrm{out}}$. If the system under study
+is linear, the amplitudes of the outgoing modes can be linked with those of the incoming ones by the
+scattering matrix $\hat{S}$ of the junction [116, p. 249]:
+\[ \vec{s}_{\mathrm{out}} = \hat{S}\,\vec{s}_{\mathrm{in}}, \tag{4.1} \]
+where $\vec{s}_{\mathrm{in}} = [s_{1,\mathrm{in}}, s_{2,\mathrm{in}}, \dots, s_{n,\mathrm{in}}]^T$ and $\vec{s}_{\mathrm{out}} = [s_{1,\mathrm{out}}, s_{2,\mathrm{out}}, \dots, s_{n,\mathrm{out}}]^T$. An ideal isolator is a two-
+port device that passes a wave coming from waveguide $W_1$ to waveguide $W_2$, but blocks the transmission
+in the opposite direction. It is described by the scattering matrix [117, p. 523]
+\[
+\hat{S} = \begin{bmatrix} 0 & 0 \\
+1 & 0 \end{bmatrix}. \tag{4.2}
+\]
+In turn, a circulator is an $n$-port device that couples a wave coming from waveguide $W_1$ to waveguide $W_2$
+only, a wave coming from $W_2$ to $W_3$ only, and so on [116, p. 468]. The simplest, 3-port circulator is
+described by the scattering matrix [117, p. 536]
+\[ \hat{S} = \begin{bmatrix}
+0 & 0 & 1 \\
+1 & 0 & 0 \\
+0 & 1 & 0 \end{bmatrix}. \tag{4.3} \]
+It is worth noting that a circulator can be used as a replacement of an isolator if we ensure that no
+incoming waves ever reach one of its ports. This can be easily achieved by connecting that port to a
+matched load, which does not generate reflected waves.
+The above devices have several important applications. They can be used to eliminate waves reflected
+from imperfectly matched components of complex circuits; the presence of such waves can give rise to
+undesired interferences and parasitic couplings [34]. They are also employed in signal routing in devices
+65
+66 Chapter 4. Magneto-optical circulators
+Wn
+Pn
+: : :
+P1
+W1
+P2
+W2
+Figure 4.1 An n-port device.
+such as multiplexers [35]. In the optical domain, possibly the most important application of isolators
+is the protection of lasers from back-reflected light, which disturbs the standing-wave pattern in a laser
+cavity and may cause the device to become unstable [36].
+From the Lorentz reciprocity theorem it follows that the scattering matrix of a reciprocal system is
+symmetric provided that the amplitudes $s_{j,\mathrm{in}}$ and $s_{j,\mathrm{out}}$ are normalised so that any mode with unitary
+amplitude carries unitary power [116, pp. 235–236 and 249]. By a reciprocal system, we understand
+a system consisting of time-invariant, linear media whose material properties [cf. eq. (1.3)] satisfy the
+relations [118, p. 10]
+\[ \hat{\epsilon} = \hat{\epsilon}^T, \quad \hat{\mu} = \hat{\mu}^T \quad \text{and} \quad \hat{\alpha} = -\hat{\beta}^T. \tag{4.4} \]
+Since the scattering matrices from eqs. (4.2) and (4.3) are not symmetric, isolators and circulators must
+by necessity contain nonreciprocal materials.
+4.1.2 Routes to nonreciprocity
+Among the possible ways of building nonreciprocal systems, by far the most common is the introduc-
+tion of ferro- and ferrimagnetic materials. The propagation of low-amplitude microwaves in these media
+placed in a sufficiently strong SEMF is usually described by considering them to have a tensorial permeability of the form
+\[ \hat{\mu} = \begin{bmatrix} 1 + \chi_y + \chi_z & i\kappa_z & -i\kappa_y \\
+-i\kappa_z & 1 + \chi_x + \chi_z & i\kappa_x \\
+i\kappa_y & -i\kappa_x & 1 + \chi_x + \chi_y \end{bmatrix}, \tag{4.5} \]
+where $\chi_i$ and $\kappa_i$ ($i = x, y, z$) are proportional to the $i$th component of the magnetisation $\vec{M}$ induced by
+the SEMF [119, p. 92; 117, p. 503]. For lossless media, $\hat{\mu}$ is Hermitian, so that all the parameters $\chi_i$ and
+$\kappa_i$ are purely real. Therefore the diagonal part of the tensor defined in eq. (4.5) is real and (obviously)
+symmetric, while its off-diagonal part is imaginary and antisymmetric. Tensors with these properties are
+called gyrotropic.
+Near the ferromagnetic resonance frequency, which for sub-tesla SEMFs falls in the microwave
+range, the magnitude of the off-diagonal components of $\hat{\mu}$ is comparable to that of the diagonal ones.
+This can lead to very strong nonreciprocal effects.
+4.1. Introduction 67
+At optical frequencies, the propagation of electromagnetic waves in ferro- and ferrimagnetic media
+is more commonly handled by attributing them an anisotropic permittivity
+\[ \hat{\epsilon} = \begin{bmatrix} \epsilon & i g_z & -i g_y \\
+-i g_z & \epsilon & i g_x \\
+i g_y & -i g_x & \epsilon \end{bmatrix}, \tag{4.6} \]
+where $g_i = K M_i$ and the parameter $K$ describes the magneto-optical (MO) properties of the material
+[35; 119, p. 236]. MO effects are usually weak; therefore the SEMF-induced perturbation of the diagonal
+elements of $\hat{\epsilon}$ is commonly neglected. The real part of $K$ is related to the specific Faraday rotation $\theta_F$
+by
+\[
+\theta_F = \frac{\pi}{\lambda \sqrt{\epsilon}}
+M_s \operatorname{Re} K, \tag{4.7}
+\]
+where $\lambda$ is the free-space wavelength and $M_s$ denotes the characteristic saturation magnetisation of the
+medium. The imaginary part of $K$, in turn, is responsible for the effect of circular dichroism. In low-loss
+ferrimagnetic materials this imaginary part is often small and therefore in the rest of this chapter we shall
+assume $K$ to be real. We shall also introduce the symbol $g \equiv M_s K$.
+The most commonly used MO materials are (ferrimagnetic) synthetic garnets, of which the most
+well-known is yttrium iron garnet (YIG). It is usually grown on substrates made of gadolinium gallium
+garnet (GGG). The atoms of yttrium can be substituted by other elements, including bismuth and cerium.
+The specific Faraday rotation of partially cerium-substituted yttrium iron garnet (Ce:YIG) at $\lambda = 1550$ nm
+has been measured to be $-0.45^\circ/\mu\mathrm{m}$, which corresponds to $g = -0.01$ [120]. Bismuth iron garnet
+(BIG), which is reputed to outperform Ce:YIG [121], has been found to have $\theta_F$ as large as $-30^\circ/\mu\mathrm{m}$ at
+$\lambda = 540$ nm, i.e., $g = -0.22$ [122]. Unfortunately Vertruyen et al. [122] do not report on measurements
+of the specific Faraday rotation of BIG in the infrared range. The available data indicate that $\theta_F$ of
+this material diminishes with increasing wavelength, but the effect of this decrease on $g$ is partially
+compensated by the growth of $\lambda$. It seems realistic to expect that $g \approx 0.05$–$0.1$ can be obtained at
+infrared frequencies. It is also worth noting that another (non-garnet) material, europium oxide, has been
+reported to have $g = 0.4$ in this frequency range [123]; however, its magneto-optical properties disappear
+above the Curie temperature of 69 K [124].
+There are a few other methods of obtaining nonreciprocal behaviour. In the microwave domain it
+is possible to introduce off-diagonal imaginary components to the permittivity tensor of standard non-
+magnetic metals, such as gold, by placing them in a strong SEMF. Unfortunately, this method cannot be
+applied easily to optical systems because the strength of the necessary SEMF increases with frequency,
+reaching several teslas in the optical range; another obstacle consists in the relatively large losses ex-
+hibited by metals in this segment of the electromagnetic spectrum. Another possibility consists in using
+so-called Tellegen’s media, in which the relation $\hat{\alpha} = -\hat{\beta}^T$ does not hold; however, in known materials
+of this type the magnitude of the real component of the tensors $\hat{\alpha}$ and $\hat{\beta}$ is very small, and therefore this
+method of inducing nonreciprocal behaviour remains so far largely unexplored. Finally, instead of using
+materials whose parameters do not meet conditions (4.4), one can violate the other conditions of valid-
+ity of the standard Lorentz reciprocity theorem: introduce a time-dependent modulation of the material
+properties of the system or employ nonlinear effects.
+4.1.3 Experimental realisations of optical isolators and circulators
+Bulk magneto-optical isolators A basic feature of MO materials is the phase velocity difference
+between right- and left-circularly polarised plane waves propagating parallel to the magnetisation direc-
+tion. As a result of this difference, the polarisation plane of a linearly polarised plane wave propagating
+68 Chapter 4. Magneto-optical circulators
+along the direction of $\vec{M}$ gradually rotates; moreover, the direction of this rotation (clockwise or counter-
+clockwise), when viewed in the laboratory frame, does not depend on whether the wave propagates par-
+allel or antiparallel to $\vec{M}$ [116, pp. 460–464]. This phenomenon, known as Faraday’s effect, is the basis
+of the operation of the archetypical “bulk” optical isolator, shown schematically in fig. 4.2(a). It consists
+of a slab of a MO material sandwiched between two polarisers rotated by $45^\circ$ with respect to each other
+[35]. The slab, magnetised perpendicularly to the planes of the polarisers, has thickness $d$ such that the
+polarisation plane of waves traversing the medium rotates by $45^\circ$. Let us assume that this happens in
+the clockwise direction. Then a wave coming in through polariser 1 will eventually find its polarisation
+plane aligned with the axis of polariser 2. In contrast, the polarisation plane of a wave coming in through
+polariser 2 will become perpendicular to the axis of polariser 1. As a consequence, the former wave will
+be transmitted, whereas the latter will be absorbed.
+As noted in subsection 4.1.2, the specific Faraday rotation (rotation angle per unit length) of com-
+monly used MO materials is small. Therefore, optical isolators built in the way presented in the previous
+paragraph need to be rather thick ($d \approx 0.1$–$1$ mm). It is, however, possible to reduce $d$ to tens of mi-
+crometres by replacing the single MO layer by a Fabry-Perot resonator composed of a stack of dielectric
+and MO thin films, at the cost of a reduced operation bandwidth [125].
+Another way of reducing the thickness of a bulk isolator consists in the application of PCs. As
+noted first by Figotin and Vitebsky [126], a PC with both the spatial inversion symmetry and the time-
+reversal symmetry broken has a dispersion diagram that lacks inversion symmetry. From this it follows
+in particular that at a given frequency a band gap can exist for waves propagating in a direction $\vec{k}$, but
+not for those propagating in the direction $-\vec{k}$; thus, at such a frequency the PC behaves as an isolator. An
+example 1D PC of this type was presented in ref. 127. In this structure, the spatial inversion symmetry
+was lifted by the presence of MO layers polarised in opposite directions (but always parallel to the layers,
+unlike in Faraday rotators). Since fabrication of such layers might be difficult, Khanikaev and Steel
+[128] proposed to break the inversion symmetry by the introduction of a third material into the periodic
+lattice. They showed also an alternative resonator-type design, in which a single MO layer is sandwiched
+between two different dielectric Bragg mirrors. In turn, the isolator proposed by Vanwolleghem et al.
+[115] consists of a 2D PC composed of a lattice of holes drilled in a MO matrix magnetised in the
+out-of-plane direction. The shape of holes is chosen so that the system’s spatial inversion symmetry is
+lifted.
+Owing to their large lateral dimensions, bulk, non-planar structures are difficult to combine with
+integrated optical circuits. Therefore, in the last two decades there has been a lot of activity devoted to
+the design of isolators and circulators suitable for on-chip manufacturing. Most of these structures are
+intended for fabrication in MO garnet layers grown on GGG substrates, although methods of bonding
+garnet layers to semiconductor (e.g., silicon) substrates have also been developed. With respect to their
+geometry, the proposed devices can be divided into two broad classes: waveguide- and resonator-type
+components.
+Waveguide-type devices The operation of the earliest waveguide-type isolators was based on the
+nonreciprocal conversion between quasi-TE and quasi-TM modes of rib waveguides, induced by a SEMF
+parallel to the waveguide axis. This phenomenon is analogous to Faraday’s effect [35]. However, it
+must be noted that in this case the conversion occurs between states whose polarisation planes differ by
+$90^\circ$ rather than $45^\circ$. Therefore, a $45^\circ$-long nonreciprocal Faraday rotator must be connected in series
+with a $45^\circ$-long reciprocal rotator. The presence of this additional element, together with the necessary
+polarisers at the input and output ports, complicates the fabrication procedure. The main deficiency of the
+design based on Faraday’s effect, though, is that while in a bulk MO material the phase velocities of all
+plane waves polarised perpendicularly to $\vec{M}$ are identical, the effective indices of quasi-TE and quasi-TM
+4.1. Introduction 69
+W3
+P2
+P1
+W1 cavity
+P3
+W2
+(a) (b)
+ME
+P nonreciprocal section2 P1
+(c)
+P2 P4
+ME
+nonreciprocal section
+P1 P3
+(d)
+Figure 4.2 Selected types of optical isolators and circulators. (a) Bulk isolator based on Faraday rotation (after
+ref. 35). (b) Three-way resonator-type circulator. (c) Mach-Zehnder interferometer with one nonreciprocal arm.
+(d) Nonreciprocal coupler acting as a four-port circulator. The arrows indicate the directions of energy transfer.
+70 Chapter 4. Magneto-optical circulators
+waveguide modes are, in general, different. For high isolation, the waveguide geometry should therefore
+be adjusted to force a close match of these indices. In practice, this is not easy to obtain without post-
+fabrication etch-tuning or deposition of an additional dielectric layer [129, 130]. It is worth mentioning,
+however, that Dammann et al. [131] showed that the stringent requirements for index matching can be
+somewhat relaxed, at the cost of incurring a modest additional forward loss, if the polarisation plane of
+the input mode is rotated by $22.5^\circ$ from the vertical direction.
+The drawbacks listed in the previous paragraph are eliminated in devices exploiting the difference
+in the phase velocity of forward- and backward-propagating modes of MO waveguides lacking a mirror
+symmetry plane parallel to their axis and placed in a SEMF perpendicular to that axis. The simplest
+isolator based on this effect has the form of a Mach-Zehnder interferometer [fig. 4.2(c)] with its two
+arms designed so as to introduce a nonreciprocal phase shift of $90^\circ$ and a reciprocal shift of the same
+value [120, 132, 133]. For a forward-propagating wave, these shifts cancel out, so that the waves coming
+from the two arms interfere constructively at the output; for a backward-propagating wave, the shifts add
+up, which leads to a destructive interference. Analogous structures based on PC waveguides have also
+been investigated [134]. In a different scheme, so-called nonreciprocal multi-mode imaging, a single
+multi-mode waveguide is used instead of two single-mode ones [135].
+A related type of device is a four-port circulator composed of two coupled MO waveguides [fig.
+4.2(d)], whose parameters are chosen so that the phase velocities of forward-propagating modes differ,
+while those of backward-propagating ones match. This leads to a difference in the coupling strength of
+the two pairs of modes. As a result, a forward-propagating mode stays in the original waveguide, while
+a backward-propagating one gradually leaks to the neighbouring waveguide. Both rib-waveguide-based
+[136] and PC-waveguide-based [137] designs have been proposed.
+Another way of achieving isolation is to employ nonreciprocal absorption. This phenomenon occurs
+primarily in ferromagnetic metals, which are usually highly lossy at optical frequencies. The concept
+of an isolator based on the difference of the decay rates of forward- and backward-propagating waves
+was originally proposed by Zaets and Ando [138] and Takenaka and Nakano [139]. The first success-
+ful demonstration of such a device was made by Vanwolleghem et al. [140], who fabricated a system
+containing a layer of a cobalt-iron alloy embedded in indium phosphide. Improved versions of this iso-
+lator were reported on in refs. 141 and 142 (the latter authors used manganese arsenide instead of the
+cobalt-iron alloy). In turn, Takeda and John [123] proposed a device consisting of a MO PC waveguide
+designed so that its forward- and backward-propagating eigenmodes have significantly different group
+velocities. Since the slower mode experiences a longer effective optical path, in the presence of absorp-
+tion its decay rate exceeds that of the faster mode. In all these designs current injection is normally used
+to compensate for the undesired absorption of the forward-propagating mode.
+Certain MO waveguides are characterised by a difference in the cut-off frequency of forward- and
+backward-propagating modes. Therefore, in the range between these two frequencies guided-wave prop-
+agation is possible in one direction only. As pointed out by the authors of refs. 143, 144 and 145, this
+effect can also be used for the construction of an isolator.
+Wang et al. [146] have shown that a SEMF can lift degeneracies in the band structure of high-
+symmetry PCs containing materials with gyrotropic permittivity or permeability, thus leading to the
+creation of band gaps. They also predicted that unidirectional waveguide modes with frequencies lying
+within such band gaps can propagate along interfaces separating the just described PCs from dielectric
+PCs or metals. This has been subsequently confirmed experimentally [147]. However, these effects have
+so far been demonstrated only at microwave frequencies, where the permeability tensor can have off-
+diagonal components with magnitude comparable with that of the diagonal ones. The MO effects are
+much weaker, and it is not certain whether the band gaps generated in the optical regime will be robust
+against disorder [147].
+4.1. Introduction 71
+Resonator-type devices More suitable for integration than their bulk counterparts, waveguide-type
+MO devices must still be rather long in order to provide a satisfactory isolation. For instance, arm lengths
+of 1mm are used in the state-of-the-art Mach-Zehnder interferometers whose fabrication was reported
+on in ref. 120. According to the review of Dötsch et al. [35], this value is typical. Isolators are thus
+much larger than other standard components used in integrated circuits. A possible way of miniaturising
+them consists in employing resonant cavities to lengthen the time during which light interacts with the
+MO material. Of course, a drawback of this approach is the reduction of the operation bandwidth of the
+devices.
+Circulators based on resonant cavities are commonly used in the microwave domain [117]. A typical
+device of this type is composed of three identical reciprocal waveguides $W_i$ ($i = 1, 2, 3$) coupled to a
+single resonant cavity containing a ferrimagnetic material and, in the absence of SEMF, supporting two
+degenerate localised modes of frequency $\omega_0$ [fig. 4.2(b)]. In a SEMF perpendicular to the plane of the
+system, this degeneracy is lifted: the modes couple and form two linear combinations corresponding to
+left- and right-rotating modes with frequencies $\omega_-$ and $\omega_+$ [34, 148]. At the frequency $\tfrac{1}{2}(\omega_- + \omega_+)$, a
+wave incoming from, say, waveguide $W_1$ excites such a superposition of these two eigenmodes that they
+interfere constructively in front of one output waveguide (say, $W_2$), and destructively in front of the other
+($W_3$). As a result, an outgoing mode with a significant amplitude appears only in waveguide $W_2$, while
+$W_3$ is isolated from the incoming power. Analogously, owing to the three-fold rotational symmetry of
+the device, energy transfer occurs in the directions $W_2 \to W_3$ and $W_3 \to W_1$. The scattering matrix
+of the system is then given by eq. (4.3). If the SEMF polarisation is flipped, the direction of the energy
+transfer reverses, too.
+In 2005 Wang and Fan [34, 37] proposed an analogous device intended for operation at optical
+frequencies, composed of a 2D PC cavity coupled to three PC waveguides. Using a model based on
+the coupled-wave theory [149], they showed the bandwidth of the circulator to grow with the frequency
+splitting !  j!C   ! j. This frequency splitting, in turn, was demonstrated to be proportional to
+the integral of the out-of-plane component of the cross product of the electric fields of the cavity modes,
+weighted with g, over the area of the cavity.
+The authors of ref. 34 observed that in a typical PC cavity the sign of the cross product mentioned
+above oscillates rapidly, leading, as a result, to a severe diminution of $\Delta\omega$. To remedy this, they pro-
+posed to divide the MO material in the cavity into several domains polarised in opposite directions, thus
+flipping locally the sign of g and forcing the overall sign of the integrand to be constant everywhere.
+Unfortunately, the resulting structure is almost impossible to manufacture with the current technology,
+since the creation of the necessary magnetic subdomains would require the application of a SEMF inho-
+mogeneous on the scale of hundreds of nanometres, with the inhomogeneities precisely aligned with the
+geometric structure of the cavity.
+In a follow-up paper [150] the same authors presented a design of a four-port circulator composed of
+two straight PC waveguides coupled to a single MO cavity with a subdomain structure determined along
+analogous principles. In turn, Kono and Koshiba proposed a rib-waveguide-based circulator consisting of
+a Mach-Zehnder interferometer coupled to an exterior ring [151], and, subsequently, a device similar to
+that from ref. 150, but built from rib waveguides coupled to a MO microdisk [152]. Another contribution
+of the latter paper was the introduction of a method of increasing the circulator’s bandwidth by including
+several coupled resonators instead of just one. In all these designs, however, division of the MO material
+into oppositely-polarised domains is still required.
+It is worth noting that in ref. 34 a solution alternative to the introduction of magnetic domains was
+also considered, namely the inclusion of a single MO rod in a standard dielectric PC. In principle, it
+is possible, but it would also pose serious technological problems related to the growth of two different
+materials on a single substrate and the necessity of aligning precisely the structures obtained in two
+72 Chapter 4. Magneto-optical circulators
+etching processes. In any case, to the best of our knowledge, none of the devices proposed in refs.
+34, 37, 150, 151 and 152 has ever been fabricated.
+Non-magneto-optical devices As has been noted before, introduction of ferro- and ferrimagnetic
+materials is not the only method of making a system nonreciprocal. Therefore a number of isolator and
+circulator designs based on the alternative approaches have also appeared in the literature. For instance,
+Gallo et al. [153] described optical analogues of diodes employing nonlinear optical processes. Yu and
+Fan [154] proposed an isolator based on a time-dependent modulation of the refractive index of parts of
+a dielectric waveguide. In turn, Yu et al. [155] showed that the SEMF-induced gyrotropy of metals in the
+microwave domain can lead to the creation of unidirectional waveguide modes at the interfaces of these
+metals and dielectric PCs.
+4.1.4 Outline of this chapter
+The aim of the research reported on in this chapter was to design a three-port MO circulator of the
+type shown schematically in fig. 4.2(b), suitable for operation in a uniform SEMF, i.e., with all the MO
+material magnetised in the same direction. The plan of the text is as follows. In section 4.2 we set the
+stage by extending the coupled-wave model of the device in question, introduced by Wang and Fan [34],
+to include the influence of direct coupling between the three waveguides and the effect of radiation loss.
+These results are used later. In section 4.3 we derive an analytical axisymmetric model of a 2D MO PC
+cavity and use it to formulate a design principle of cavities exhibiting maximum frequency splitting in
+the presence of a uniform SEMF. This is the key result of this chapter.
+Section 4.4 is devoted to PC-based circulators. Having shown how to convert an axisymmetric cavity
+designed along the rules established in section 4.3 to a component liable for integration with a periodic
+lattice, we demonstrate numerical simulations of a complete circulator embedded in a 2D PC. In sec-
+tion 4.5 we investigate rib-waveguide-based devices, which should be simpler to fabricate than PC-based
+ones, but present design problems of their own due to imperfect in-plane light confinement. We begin by
+detailing the design process of a rib-waveguide-based circulator intended for fabrication in a GGG-BIG
+heterostructure. This design is based on 2D finite-element simulations with the influence of the third di-
+mension taken into account by help of the effective-index approximation. In subsection 4.5.4 we report
+briefly on the outcome of the first attempts to manufacture and characterise this device, made at Institut
+d’Electronique Fondamentale (Orsay, France). The measurements indicate that the vertical confinement
+provided by the cavity is insufficient. Therefore, in section 4.6 we describe the results of rigorous three-
+dimensional (3D) simulations of axisymmetric cavities designed by the method presented in section 4.3
+and discuss various methods of improving the vertical confinement. Finally, in section 4.7 we summarise
+the results of our work on MO devices.
+Some of the results presented in sections 4.3 and 4.4 have appeared previously in ref. 148.
+4.2 Extension of the coupled-wave model
+4.2.1 Inclusion of direct coupling between waveguides
+Let us consider a circulator composed of three identical single-mode waveguides, W1, W2, and W3,
+weakly coupled with a resonant cavity and arranged so that the whole system has $C_{3v}$ symmetry,$^{\star}$ as
+shown schematically in fig. 4.2(b). We assume that in the absence of SEMF the cavity supports a pair of
+degenerate orthonormal eigenmodes belonging to the unique two-dimensional irreducible representation
+$^{\star}$ The symmetry elements of the group $C_{3v}$ are a three-fold rotation axis and three mirror planes intersecting each other at
+the angle of $120^\circ$ along this axis [80, p. 325].
+4.2. Extension of the coupled-wave model 73
+of the $C_{3v}$ point group and having frequency $\omega_0$. They can be classified as even or odd, according to
+their symmetry with respect to reflection about the axis of waveguide $W_1$, which is assumed to lie along
+the $-x$ axis. The circulator’s operation at frequency $\omega$ is described by the coupled-mode equations [149]
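+$$ -i\omega\,\vec{a} = -(i\hat{\Omega} + \hat{\Gamma})\,\vec{a} + \hat{D}^{\mathrm{T}}\vec{s}_{\mathrm{in}}, \tag{4.8a} $$
+$$ \vec{s}_{\mathrm{out}} = \hat{C}\,\vec{s}_{\mathrm{in}} + \hat{D}\,\vec{a}, \tag{4.8b} $$
+where the vector $\vec{a} = (a_e, a_o)^{\mathrm{T}}$ contains the cavity mode amplitudes, $\vec{s}_{\mathrm{in}} = (s_{1,\mathrm{in}}, s_{2,\mathrm{in}}, s_{3,\mathrm{in}})^{\mathrm{T}}$ and $\vec{s}_{\mathrm{out}} =
+(s_{1,\mathrm{out}}, s_{2,\mathrm{out}}, s_{3,\mathrm{out}})^{\mathrm{T}}$, the amplitudes of the in- and outgoing waveguide modes, the matrix $\hat{C}$ describes
+the direct coupling between waveguides, $\hat{D}$ the cavity-waveguide coupling, $\hat{\Omega}$ the mode eigenfrequencies
+and their coupling, and $\hat{\Gamma}$ their decay. These matrices are subject to the fundamental constraints [149]
+$$ \hat{D}^{\dagger}\hat{D} = 2\hat{\Gamma}, \tag{4.9a} $$
+$$ \hat{C}\hat{D}^{*} = -\hat{D}. \tag{4.9b} $$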
+Together with those following from the system’s symmetry, these constraints can be used to reduce the
+number of independent parameters necessary for the characterisation of the device. We shall now con-
+sider each of the matrices occurring in eqs. (4.8) in turn.
+Owing to the three-fold symmetry of the circulator, the $\hat{C}$ matrix must have the form
+$$ \hat{C} = \begin{bmatrix} r & t & t \\ t & r & t \\ t & t & r \end{bmatrix}, \tag{4.10} $$
+where $t \equiv |t|\,e^{i\tau}$ and $r \equiv |r|\,e^{i(\tau+\Delta)}$ are the transmission and reflection coefficients of waveguide modes
+in the absence of the cavity. If the system is lossless, as we shall assume in this subsection, we can use
+the condition of unitarity of $\hat{C}$ to express $t$ and $r$ as
+$$ t = -\frac{2\cos\Delta\; e^{i\tau}}{\sqrt{1 + 8\cos^2\Delta}}, \qquad r = \frac{e^{i(\tau+\Delta)}}{\sqrt{1 + 8\cos^2\Delta}}. \tag{4.11} $$
+Note that the case of no direct coupling, considered in ref. 34, corresponds to $\tau = \pi/2$ and $\Delta = \pi/2$.
+The $\hat{D}$ matrix has the general form
+$$ \hat{D} = \begin{bmatrix} d_{1e} & d_{1o} \\ d_{2e} & d_{2o} \\ d_{3e} & d_{3o} \end{bmatrix}, \tag{4.12} $$
+where $d_{im}$ ($i = 1, 2, 3$; $m = e, o$) describes the coupling of the $m$th cavity mode with the $i$th waveguide. These
+coupling parameters are proportional to the values of the electromagnetic field of the modes along the
+waveguide axes. Making use of the assumed symmetry of the mode fields, it can be shown that these six
+parameters can be expressed in terms of a single complex coupling constant $d \equiv |d|\,e^{i\delta}$:
+$$ \hat{D} = d \begin{bmatrix} 1 & 0 \\ -\tfrac{1}{2} & \tfrac{\sqrt{3}}{2} \\ -\tfrac{1}{2} & -\tfrac{\sqrt{3}}{2} \end{bmatrix}. \tag{4.13} $$
+Substituting this formula into eq. (4.9a), we obtain
+$$ \hat{\Gamma} = \gamma \begin{bmatrix} 1 & 0 \\ 0 & 1 \end{bmatrix}, \quad \text{where} \quad \gamma \equiv \tfrac{3}{4}\,|d|^2. \tag{4.14} $$
+74 Chapter 4. Magneto-optical circulators
+The second constraint, eq. (4.9b), yields
+.t   r/d = d: (4.15)
+Noting that from eq. (4.11) we have
+   p2 cos   e
+i
+i 3 cosC i sint r = e = ei. C/ = eiŒ CCarg.3 cosCi sin/C j C j (4.16)1 8 cos2 3 cos i sin
+and writing d in its polar form, we obtain the expression for ı:
+ı = 1 Œ.2nC 1/ C  C arg.3 cosC i sin/; (4.17)
+2
+where $n$ is an integer. Lastly, since the coupling between the cavity modes is assumed to result solely
+from their interaction with the SEMF, the $\hat{\Omega}$ matrix takes the form [34]
+$$ \hat{\Omega} = \begin{bmatrix} \omega_0 & -i|V| \\ i|V| & \omega_0 \end{bmatrix}, \tag{4.18} $$
+where $V$ is the mode coupling strength. The eigenvalues of this matrix, $\omega_\pm \equiv \omega_0 \pm |V|$, are the
+frequencies of the eigenmodes of the cavity in isolation (uncoupled to waveguides). The frequency
+splitting $\Delta\omega \equiv \omega_+ - \omega_- = 2|V|$ is proportional to the mode coupling strength. As noted in ref. 148, it is
+often convenient to write $|V|$ as $|V| = g\omega_0 v$, where $g$ is the magnitude of the off-diagonal component of
+the permittivity tensor of the MO constitutive material of the cavity, and $v$, called reduced mode coupling
+strength, depends solely on the geometry of the cavity.
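+Substituting eqs. (4.10), (4.11), (4.13), (4.14), (4.17), and (4.18) into the coupled-mode equations (4.8),
+taking $W_1$ to be the input waveguide by setting $\vec{s}_{\mathrm{in}} = (1, 0, 0)^{\mathrm{T}}$, and solving for $\vec{s}_{\mathrm{out}}$, we obtain
+$$ s_{1,\mathrm{out}} = \frac{e^{i\tau}}{\sqrt{1 + 8\cos^2\Delta}} \left\{ e^{i\Delta} - \frac{4\gamma\,(3\cos\Delta + i\sin\Delta)\,[\gamma - i(\omega - \omega_0)]}{3\,\{[\gamma - i(\omega - \omega_0)]^2 + |V|^2\}} \right\}, \tag{4.19a} $$
+$$ s_{2,\mathrm{out}} = \frac{2\,e^{i\tau}}{\sqrt{1 + 8\cos^2\Delta}} \left\{ -\cos\Delta + \frac{\gamma\,(3\cos\Delta + i\sin\Delta)\,[\gamma - |V|\sqrt{3} - i(\omega - \omega_0)]}{3\,\{[\gamma - i(\omega - \omega_0)]^2 + |V|^2\}} \right\}, \tag{4.19b} $$
+$$ s_{3,\mathrm{out}} = \frac{2\,e^{i\tau}}{\sqrt{1 + 8\cos^2\Delta}} \left\{ -\cos\Delta + \frac{\gamma\,(3\cos\Delta + i\sin\Delta)\,[\gamma + |V|\sqrt{3} - i(\omega - \omega_0)]}{3\,\{[\gamma - i(\omega - \omega_0)]^2 + |V|^2\}} \right\}. \tag{4.19c} $$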
+This solution is valid provided that the matrix $i(\hat{\Omega} - \omega\hat{I}) + \hat{\Gamma}$, where $\hat{I}$ denotes the $2 \times 2$ identity matrix,
+is invertible. This is the case if
+$$ \omega \neq \omega_0 \pm |V| \quad \text{and} \quad \gamma \neq 0. \tag{4.20} $$
+It is easily seen that the reflectance $R \equiv |s_{1,\mathrm{out}}|^2$ and transmittances $T_i \equiv |s_{i,\mathrm{out}}|^2$ ($i = 2, 3$) are
+independent of $\tau$ and $\pi$-periodic in $\Delta$. Moreover,
+$$ |s_{i,\mathrm{out}}(\Delta, \omega)|^2 = |s_{i,\mathrm{out}}(\pi - \Delta,\, 2\omega_0 - \omega)|^2 \quad \text{for } i = 1, 2, 3. \tag{4.21} $$
+Therefore it is sufficient to study the properties of $R$ and $T_i$ in the interval $\Delta \in [0, \pi/2]$.
+We are primarily interested in the behaviour of the isolation factor of the circulator, defined as $I \equiv
+T_3/T_2$. Figure 4.3 shows the dependence of $I$ on the frequency shift $(\omega - \omega_0)$ and the waveguide-
+cavity coupling parameter $\gamma$ for a few representative values of $\Delta$ and a fixed mode coupling strength
+4.2. Extension of the coupled-wave model 75
+log10I for D = 0 log10I for D = Π4
+0.2 0.2
+1
+1
+0.1 01 0.1 0
+2 -1-
+0.0 -34 0.0-
+-2
+-3-4
+-0.1 -111 0 -0.1
+0
+-0.2 -0.2
+0.00 0.05 0.10 0.15 0.20 0.00 0.05 0.10 0.15 0.20
+Γ Γ
+log10I for D = Π3 log10I for D = Π2
+0.2 0.2
+1
+1
+0.1 02 0.1
+0.0 -1 0.0 4
+3
+2
+-2
+-0.1 -0.1
+-0.2 0 -0.2
+0.00 0.05 0.10 0.15 0.20 0.00 0.05 0.10 0.15 0.20
+Γ Γ
+Figure 4.3 Isolation $I$ as a function of $\gamma$ and $\omega - \omega_0$ for $\Delta = 0$, $\pi/4$, $\pi/3$ and $\pi/2$ (logarithmic scale).
+$|V| = 0.1$. It can be conjectured that for any $\Delta \neq \pi/3$ an infinite isolation factor can be obtained for a specific
+value of $\omega$ and $\gamma$. However, in practice one is more concerned with the maximum bandwidth $B(I_{\min})$,
+defined as the maximum range of frequencies for which the isolation factor or its inverse exceeds a
+predetermined threshold $I_{\min}$. Figure 4.3 shows that this bandwidth is particularly large for vanishing
+($\Delta = \pi/2$) and maximum ($\Delta = 0$) direct waveguide-to-waveguide coupling. In these cases, the isolation
+factor is an even function of $(\omega - \omega_0)$, and infinite isolation occurs at $\omega = \omega_0$ and $\gamma = |V|\sqrt{3}$ ($\Delta = \pi/2$)
+or $\gamma = |V|/\sqrt{3}$ ($\Delta = 0$). It is also at these “optimum” values of $\gamma$ that maximum bandwidth is obtained.
+Figure 4.4 illustrates the frequency dependence of the transmittances and the isolation factor for
+$\Delta = \pi/2$ and $0$, with $\gamma$ set to the respective “optimum” values cited above. In the first case, $I > 1$ every-
+where: for the chosen SEMF polarisation, waveguide $W_3$ receives more power than $W_2$ at all operation
+frequencies. In contrast, the device with $\Delta = 0$ acts as a switch: transmission occurs preferentially to
+Ω-Ω0 Ω-Ω0
+Ω-Ω0 Ω-Ω0
+76 Chapter 4. Magneto-optical circulators
+1:00
+(a) T2 ( D  =2)
+0:75 T3 ( D  =2)
+0:50
+0:25
+0:00
+1:00
+(b) T2 ( D 0)
+0:75 T3 ( D 0)
+0:50
+0:25
+0:00
+104
+3 (c) I ( D  =2)10
+1=I ( D 0)
+102
+101
+100
+10 1
+ 0:50  0:25 0:00 0:25 0:50
+!   !0
+Figure 4.4 (a) Frequency dependence of the transmittances $T_2$ and $T_3$ for a circulator with $\Delta = \pi/2$ and $\gamma =
+|V|\sqrt{3}$. (b) Same for a circulator with $\Delta = 0$ and $\gamma = |V|/\sqrt{3}$. (c) Frequency dependence of the isolation factor $I$
+of the two circulators. In both cases $|V| = 0.1$.
+waveguide $W_2$ for $|\omega - \omega_0| < |V|$ and to $W_3$ outside this frequency range. In consequence, the band-
+width of the system with maximum coupling ($\Delta = 0$) is inferior to that of the one with no direct coupling
+($\Delta = \pi/2$) regardless of the chosen threshold $I_{\min}$. However, fig. 4.4(c) shows that the difference in band-
+width becomes less and less pronounced as Imin grows: for very high isolation factors, the bandwidths
+of both structures are virtually indistinguishable.
+The conclusions from the previous two paragraphs, based in part on an analysis of plots made for
+several specific cases, can also be reached in a rigorous manner. We shall first derive the values of
+$\omega$ and $\gamma$ at which the isolation factor or its inverse becomes infinite. By definition of $I$, this will be
+the case provided that exactly one of $s_{2,\mathrm{out}}$ and $s_{3,\mathrm{out}}$ vanishes. Rewriting the condition $s_{2,\mathrm{out}} = 0$ as
+($\operatorname{Re} s_{2,\mathrm{out}} = 0$ and $\operatorname{Im} s_{2,\mathrm{out}} = 0$) and using assumption (4.20), we obtain
+$$ 3\,[\,|V|^2 + \gamma|V|\sqrt{3} - (\omega - \omega_0)^2\,]\cos\Delta - \gamma\,(\omega - \omega_0)\sin\Delta = 0, \tag{4.22a} $$
+$$ \gamma\,[\,3(\omega - \omega_0)\cos\Delta + (\gamma - |V|\sqrt{3})\sin\Delta\,] = 0. \tag{4.22b} $$
+One solution of these equations, $\omega = \omega_0 \pm |V|$ and $\gamma = 0$, is obviously incompatible with assumption
+(4.20). The other can be obtained by solving eq. (4.22b) for $\omega$ and substituting the result into eq. (4.22a).
+Isolation factor Transmittance Transmittance
+4.2. Extension of the coupled-wave model 77
+This yields
+$$ \omega = \omega_0 + |V|\sqrt{3}\;\frac{2\sin(2\Delta)}{1 + 8\cos^2\Delta} \quad \text{and} \quad \gamma = |V|\sqrt{3}\;\frac{1 - 4\cos^2\Delta}{1 + 8\cos^2\Delta}. \tag{4.23} $$
+Comparing the expressions (4.19b) and (4.19c) for $s_{2,\mathrm{out}}$ and $s_{3,\mathrm{out}}$, one immediately sees that the con-
+dition for $s_{3,\mathrm{out}} = 0$ is given by formula (4.23) with $|V|$ replaced by $-|V|$. Noting further that, by
+definition (4.14), $\gamma$ cannot be negative, we arrive at the following conclusion.
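+The isolation factor $I$ of a lossless circulator is infinite if and only if
+$$ |\cos\Delta| < \tfrac{1}{2}, \quad \omega = \omega_0 + |V|\sqrt{3}\;\frac{2\sin(2\Delta)}{1 + 8\cos^2\Delta} \quad \text{and} \quad \gamma = |V|\sqrt{3}\;\frac{1 - 4\cos^2\Delta}{1 + 8\cos^2\Delta}. \tag{4.24a} $$
+The factor $I$ is zero if and only if
+$$ |\cos\Delta| > \tfrac{1}{2}, \quad \omega = \omega_0 - |V|\sqrt{3}\;\frac{2\sin(2\Delta)}{1 + 8\cos^2\Delta} \quad \text{and} \quad \gamma = |V|\sqrt{3}\;\frac{4\cos^2\Delta - 1}{1 + 8\cos^2\Delta}. \tag{4.24b} $$
+Restricting $\Delta$ to the interval $[0, \pi/2]$, we see that $|\cos\Delta| \lessgtr \tfrac{1}{2}$ if and only if $\Delta \gtrless \pi/3$. It should be noted that
+for $\Delta = \pi/3$ there exist no solutions of eq. (4.22) compatible with assumption (4.20).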
+It is convenient to introduce the reduced frequency
+$$ \tilde{\omega} \equiv \frac{\omega - \omega_0}{|V|} \pm \sqrt{3}\;\frac{2\sin(2\Delta)}{1 + 8\cos^2\Delta} \quad \text{for } |\cos\Delta| \gtrless \tfrac{1}{2}. \tag{4.25} $$
+It can be shown that the isolation $I$ at the optimum level of coupling $\gamma$ quoted in conditions (4.24) can
+be written solely as a function of $\Delta$ and $\tilde{\omega}$. The plot of this function is shown in fig. 4.5(a). It can be seen
+that for any $I_{\min}$ the bandwidth $B(I_{\min})$ depends strongly on the value of $\Delta$, and it is always the largest
+for $\Delta = \pi/2$. The behaviour of $B(I_{\min})$ in the interval $\Delta \in [0, \pi/3]$ is quite interesting. For sufficiently low
+values of $I_{\min}$, maximum bandwidth is obtained for some value of $\Delta$ lying in the interior of this interval.
+However, as soon as $I_{\min}$ exceeds approximately 55, the optimum value of $\Delta$ in the interval in question becomes
+equal to 0. As noted earlier, the difference in bandwidth at $\Delta = 0$ and $\Delta = \pi/2$ diminishes as $I_{\min}$ grows.
+This effect is demonstrated in fig. 4.5(b), in which the ratio of $B(I_{\min}, \Delta = \pi/2)$ and $B(I_{\min}, \Delta = 0)$ is
+plotted as a function of $I_{\min}$.
+In summary, direct waveguide-to-waveguide coupling has a detrimental effect on a circulator’s oper-
+ation bandwidth, and therefore should be minimised in a properly designed device. Nevertheless, a little
+paradoxically, devices with maximum direct coupling also provide a comparatively large bandwidth,
+exhibiting, in addition, an interesting switching effect.
+4.2.2 Inclusion of radiation loss
+Another effect that can play an important part in the operation of rib-waveguide-based circulators and
+three-dimensional (3D) PC circulators alike is the loss of energy to the free space surrounding the device.
+This loss can be fairly easily handled by the coupled-wave theory. We shall limit our discussion to the
+case without direct coupling ($\Delta = \pi/2$), which in the previous subsection was found to yield maximum
+bandwidth. We shall also assume the energy to be lost solely owing to radiation of the cavity mode into
+free space, neglecting the energy radiated when the incident waveguide mode is reflected from the end
+of the input waveguide.
+Following ref. 156, pp. 208–212, we incorporate the cavity radiation loss in the coupled-wave equa-
+tions (4.8) by replacing $\hat{\Gamma}$ by $\hat{\Gamma} + \hat{\Gamma}_l$, where $\hat{\Gamma}_l \equiv \gamma_l \begin{bmatrix} 1 & 0 \\ 0 & 1 \end{bmatrix}$ and $\gamma_l$ is the decay constant related to radiation
+78 Chapter 4. Magneto-optical circulators
+5
+(a) (b)
+2 2
+4
+0 0 3
+2
+ 2  2
+1
+0:0 0:2 0:4 1 10 100 1000
+=  Imin
+Figure 4.5 (a) Dependence of the isolation $I$ on $\Delta$ and $\tilde{\omega}$ when the coupling level $\gamma$ is maintained at its optimum
+value given by eqs. (4.24). The visible discontinuity of $I$ at $\Delta = \pi/3$ is due to the fact that at this value of $\Delta$ we
+switch from the conditions for zero isolation [eq. (4.24b)] to those for infinite isolation [eq. (4.24a)]. (b) Ratio
+of the maximum bandwidths $B(I_{\min})$ of the two circulators with $\Delta = \pi/2$ and $\Delta = 0$ as a function of $I_{\min}$. The
+coupling level $\gamma$ is still maintained at its optimum value.
+loss. Proceeding analogously as before, we solve the coupled-wave equations for the amplitudes of the
+outgoing modes in the three waveguides:
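+$$ s_{1,\mathrm{out}} = -1 + \frac{4\gamma}{3}\;\frac{\gamma + \gamma_l - i(\omega - \omega_0)}{[\gamma + \gamma_l - i(\omega - \omega_0)]^2 + |V|^2}, \tag{4.26a} $$
+$$ s_{2,\mathrm{out}} = -\frac{2\gamma}{3}\;\frac{\gamma + \gamma_l - |V|\sqrt{3} - i(\omega - \omega_0)}{[\gamma + \gamma_l - i(\omega - \omega_0)]^2 + |V|^2}, \tag{4.26b} $$
+$$ s_{3,\mathrm{out}} = -\frac{2\gamma}{3}\;\frac{\gamma + \gamma_l + |V|\sqrt{3} - i(\omega - \omega_0)}{[\gamma + \gamma_l - i(\omega - \omega_0)]^2 + |V|^2}. \tag{4.26c} $$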
+From eqs. (4.26b) and (4.26c) it can be immediately seen that despite the presence of loss, infinite
+isolation $I$ can still be obtained at frequency $\omega = \omega_0$ provided that the coupling coefficient $\gamma$ is taken as
+$$ \gamma = |V|\sqrt{3} - \gamma_l. \tag{4.27} $$
+Interestingly, when $\gamma$ is chosen in this way, the isolation $I(\omega)$ becomes independent from $\gamma_l$:
+$$ I(\omega) = 1 + \frac{12\,|V|^2}{(\omega - \omega_0)^2}. \tag{4.28} $$
+However, the power transmitted to the ‘hot’ waveguide, $T_3$, obviously decreases when the loss coeffi-
+cient $\gamma_l$ increases. With $\gamma$ given by eq. (4.27), the expression for the maximum value of $T_3$ takes the
+form
+$$ T_3(\omega = \omega_0) = \frac{(\sqrt{3} - \gamma_l/|V|)^2}{3}. \tag{4.29} $$
+This formula is important because it allows one to determine the minimum quality factor $Q_l \equiv \omega_0/(2\gamma_l)$
+of a cavity with a given SEMF-induced relative frequency splitting $\Delta\omega/\omega_0$ that can be used to build a
+circulator with a prescribed minimum level of transmitted power, $T_{3,\min}$. (Note that $Q_l$ describes solely
+the decay caused by radiation to free space, rather than that due to interaction with waveguide modes.)
+Indeed, expressing $\gamma_l$ in eq. (4.29) in terms of $Q_l$ and using the relation $\Delta\omega = 2|V|$, we obtain that
+$$ T_3(\omega = \omega_0) \ge T_{\min} \quad \text{if and only if} \quad Q_l \ge \left[ (1 - \sqrt{T_{\min}})\,\sqrt{3}\;\frac{\Delta\omega}{\omega_0} \right]^{-1}. \tag{4.30} $$
+!Q
+B. D  2 /=B. D 0/
+log10 I
+4.3. Cavities with circular symmetry 79
+Thus, a circulator built with a cavity having $\Delta\omega/\omega_0 = 0.001$ (a typical value) can provide 50-percent
+peak transmission if $Q_l \ge 1970$. A quality factor $Q_l \ge 11{,}250$ is needed for 90-percent efficiency, and
+$Q_l \ge 115{,}000$ for 99-percent.
+4.3 Cavities with circular symmetry
+Wang and Fan [34] used the perturbation theory to derive a formula for the mode coupling strength $V$,
+introduced in the previous subsection, of a cavity containing a MO material polarised in the $z$ direction.
+From eq. (4.6) it follows that such a material is characterised by the permittivity tensor
+$$ \hat{\epsilon} = \begin{bmatrix} \epsilon & ig & 0 \\ -ig & \epsilon & 0 \\ 0 & 0 & \epsilon \end{bmatrix}, \tag{4.31} $$
+where $g \equiv K M_z$. From now on we shall assume $g$ to be real. The authors of ref. 34 obtained$^{\star}$
+$$ V = -\frac{i}{2}\,\omega\;\frac{\displaystyle\int g(\vec{r})\,\vec{e}_z \cdot [\vec{E}_e^{*}(\vec{r}) \times \vec{E}_o(\vec{r})]\,d\vec{r}}{\sqrt{\displaystyle\int \epsilon(\vec{r})\,|\vec{E}_o(\vec{r})|^2\,d\vec{r}\,\int \epsilon(\vec{r})\,|\vec{E}_e(\vec{r})|^2\,d\vec{r}}}, \tag{4.32} $$
+where the integrals run over the whole cavity volume, $\vec{E}_e$ and $\vec{E}_o$ are the electric fields of the even
+and odd modes of the cavity unperturbed by the SEMF, and $\omega$ is their frequency (denoted $\omega_0$ in the
+previous section). Thus, the magnitude of $V$ is proportional to the cross product of the electric fields
+$\vec{E}_e$ and $\vec{E}_o$ weighted by the off-diagonal component of the permittivity tensor, $ig$. To understand better
+the behaviour of this cross product and to formulate a design principle for resonant cavities with large
+frequency splitting in a uniform SEMF, we shall now study the restricted class of 2D cavities having
+perfect rotational symmetry. In contrast to general PC cavities, circularly symmetric cavities can be
+handled analytically, which makes it possible to get a better insight into their properties.
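+We consider, then, a system of concentric rings [see fig. 4.6(a)], described by a piecewise-constant
+relative permittivity $\epsilon(\rho)$ independent from the azimuthal coordinate $\phi$ and the vertical coordinate $z$. The
+relative permeability $\mu$ is taken to be 1 everywhere. In the p-polarisation case [waves propagating in the
+$(\rho, \phi)$ plane with the magnetic field parallel to the $z$ axis] the Maxwell’s equations
+$$ \frac{1}{\rho}\,\frac{\partial H_z}{\partial \phi} = -i\omega\epsilon_0\epsilon\,E_\rho, \tag{4.33a} $$
+$$ \frac{\partial H_z}{\partial \rho} = i\omega\epsilon_0\epsilon\,E_\phi, \tag{4.33b} $$
+$$ \frac{\partial E_\phi}{\partial \rho} + \frac{1}{\rho}\,E_\phi - \frac{1}{\rho}\,\frac{\partial E_\rho}{\partial \phi} = i\omega\mu_0 H_z, \tag{4.33c} $$
+reduce to the Helmholtz equation for the $z$ component of the magnetic field, $H_z$:
+$$ \frac{\partial}{\partial \rho}\!\left( \frac{1}{\epsilon}\,\frac{\partial H_z}{\partial \rho} \right) + \frac{1}{\epsilon\rho}\,\frac{\partial H_z}{\partial \rho} + \frac{1}{\epsilon\rho^2}\,\frac{\partial^2 H_z}{\partial \phi^2} + \frac{\omega^2}{c^2}\,H_z = 0. \tag{4.34} $$
+Here $\omega$ denotes the frequency, $\epsilon_0$ and $\mu_0$ the permittivity and permeability of free space, and $c =
+1/\sqrt{\epsilon_0\mu_0}$ the speed of light in vacuum. By the usual method of separation of variables one can show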
+$^{\star}$ The difference in sign between eq. (6) from ref. 34 and eq. (4.32) is caused by the difference in the convention chosen for
+harmonic time-dependence ($e^{-i\omega t}$ here vs. $e^{i\omega t}$ in ref. 34).
+80 Chapter 4. Magneto-optical circulators
+that the eigenmodes of the system occur in degenerate pairs of “even” and “odd” modes with magnetic
+field of the general form
+$$ H_{ze}(\rho, \phi) = R(\rho)\cos(l\phi) \quad \text{and} \quad H_{zo}(\rho, \phi) = R(\rho)\sin(l\phi), \tag{4.35} $$
+respectively, where the azimuthal order $l$ is an integer. (Of course, the exception is the modes with $l = 0$,
+which are not degenerate.) Within an arbitrary ring, the radial dependence $R(\rho)$ of the magnetic field of
+a mode with azimuthal order $l$ can be expressed as a superposition of the Bessel functions of the first and
+second kind:
+$$ R(\rho) = a_m J_l(n_m k_0 \rho) + b_m Y_l(n_m k_0 \rho), \tag{4.36} $$
+where $m$ is the ring’s number, $n_m$ its refractive index, $a_m$ and $b_m$ constant coefficients, and $k_0 \equiv \omega/c$
+the free-space wave number.
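+From eq. (4.35) and the Maxwell’s equations (4.33) we can derive the general expressions for the
+cross product of the electric fields corresponding to a pair of degenerate modes with azimuthal order $l$,
+$$ \vec{e}_z \cdot (\vec{E}_e^{*} \times \vec{E}_o) = \frac{l\,R(\rho)\,R'(\rho)}{\omega^2 \epsilon_0^2\,\rho\,[\epsilon(\rho)]^2}, \tag{4.37} $$
+and their norm,
+$$ \int \epsilon(\vec{r})\,|\vec{E}_e(\vec{r})|^2\,d\vec{r} = \int \epsilon(\vec{r})\,|\vec{E}_o(\vec{r})|^2\,d\vec{r} = \frac{\pi}{\omega^2 \epsilon_0^2} \int_0^\infty \frac{l^2 [R(\rho)]^2 + \rho^2 [R'(\rho)]^2}{\rho\,\epsilon(\rho)}\,d\rho, \tag{4.38} $$
+with $R'(\rho)$ denoting the derivative of $R(\rho)$. Substituting eqs. (4.37) and (4.38) into the general formula for
+the coupling strength (4.32), we obtain
+$$ V = -i\omega l\;\frac{\displaystyle\int_0^\infty \frac{g(\rho)\,R(\rho)\,R'(\rho)}{[\epsilon(\rho)]^2}\,d\rho}{\displaystyle\int_0^\infty \frac{l^2 [R(\rho)]^2 + \rho^2 [R'(\rho)]^2}{\rho\,\epsilon(\rho)}\,d\rho}. \tag{4.39} $$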
+Clearly, the sign of the integrand in the numerator of the above expression depends on the sign of the
+product $g(\rho)R(\rho)R'(\rho)$. In general, this sign will oscillate due to the oscillatory behaviour of the func-
+tion $R(\rho)$ itself. Therefore, to avoid unnecessary cancellations in the integral in question, the ring
+boundaries need to be placed so that the product $g(\rho)R(\rho)R'(\rho)$ be always nonnegative (or nonposi-
+tive). Excluding the possibility of introducing inversely-magnetised domains, this can only be achieved
+by ensuring that the boundaries between the MO and non-MO material coincide with the zeros of the
+product $R(\rho)R'(\rho)$, i.e., the zeros and extrema of $R(\rho)$. With this design principle in mind, we offer
+the following method for the determination of the radii of the alternating MO and non-MO rings making
+up a cavity supporting a pair of degenerate modes with azimuthal order $l \ge 1$ at a particular frequency
+$\omega = k_0 c$.
+As a first step, we determine the radius $\rho_0$ of the central rod (“zeroth ring”), assumed to have refrac-
+tive index $n_0$. In this rod, the radial field dependence is expressed solely by means of the Bessel function
+of the first kind $J_l(n_0 k_0 \rho)$, since the $Y_l(n_0 k_0 \rho)$ function has a singularity at the origin. Hence, $b_0 = 0$
+and, since the global mode amplitude is arbitrary, $a_0$ can be set to 1. It is then evident that the product
+$R(\rho)R'(\rho)$ in the central rod will not change sign until the first extremum of the $J_l(n_0 k_0 \rho)$ function.
+Therefore, we set the rod’s radius, $\rho_0$, to the value of $\rho$ corresponding to the location of this extremum.
+The amplitudes $a_1$ and $b_1$ of the Bessel functions in the first ring, having refractive index $n_1$, can
+now be determined from the condition of continuity of $H_z$ and $E_\phi$. The outer radius of the first ring, $\rho_1$,
+4.3. Cavities with circular symmetry 81
+(a) y
+magneto-optical
+air
+x
+1:0
+R.r/
+rzO E0:5 e Eo
+0:0
+(c)
+ 0:5
+0:0 0:5 1:0 1:5
+r=
+Figure 4.6 (a) The geometry of a cavity composed of a sequence of rings made of air and a MO material with
+refractive index 2.25. (b) The magnetic field $H_z$ of the even eigenmode of azimuthal order $l = 1$ supported by the
+cavity at frequency $\omega = 2\pi c/\lambda$. (c) Radial dependence of the magnetic field $H_z$ of the cavity eigenmodes and of
+the cross product of their electric fields. Both functions are normalised to their maximum values. The areas filled
+with the MO material are shaded.
+should then be chosen so as to coincide with the first zero of the function $a_1 J_l(n_1 k_0 \rho) + b_1 Y_l(n_1 k_0 \rho)$
+located in that ring, at which point the product $R(\rho)R'(\rho)$ will again change sign. By repeating this
+process, we obtain the radii of the subsequent rings. The outer radii of the even rings (with refractive
+index $n_0$) coincide with the extrema of the function $R(\rho)$, and those of the odd rings (with refractive
+index $n_1$), with its zeros. Thus, the cavity designed in this way resembles an annular Bragg grating
+[157], with each layer a quarter-wavelength thick (in the sense of the Bessel-function quasi-periodicity).
+We need now to make sure that the field of the mode constructed in this way is localised, i.e., that
+$R(\rho)$ decays as $\rho$ tends to infinity. Let us estimate the ratio of $R(\rho)$ at its two successive extrema, located
+at $\rho_{2n}$ and $\rho_{2n+2}$, where $n \gg 1$. The Bessel functions of large arguments can be approximated by [158,
+82 Chapter 4. Magneto-optical circulators
+eqs. (9.2.1) and (9.2.2)]
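+$$ J_l(x) \approx \sqrt{\frac{2}{\pi x}}\,\cos\!\left( x - \frac{l\pi}{2} - \frac{\pi}{4} \right), \tag{4.40a} $$
+$$ Y_l(x) \approx \sqrt{\frac{2}{\pi x}}\,\sin\!\left( x - \frac{l\pi}{2} - \frac{\pi}{4} \right). \tag{4.40b} $$
+By construction, the field in the $(2n+1)$th ring, located between $\rho_{2n}$ and $\rho_{2n+1}$, behaves approximately
+as
+$$ R(\rho) \approx c_{2n+1}\,\rho^{-1/2} \cos[n_1 k_0 (\rho - \rho_{2n})], \tag{4.41} $$
+and in the $(2n+2)$th ring as
+$$ R(\rho) \approx c_{2n+2}\,\rho^{-1/2} \sin[n_0 k_0 (\rho - \rho_{2n+1})], \tag{4.42} $$
+where $c_{2n+1}$ and $c_{2n+2}$ are constant coefficients. Since the rings are supposed to be a quarter-wavelength
+thick, the expressions $n_1 k_0 (\rho_{2n+1} - \rho_{2n})$ and $n_0 k_0 (\rho_{2n+2} - \rho_{2n+1})$ are approximately equal to $\pi/2$ and
+the successive extremal values of $R(\rho)$ are
+$$ R(\rho_{2n}) \approx c_{2n+1}\,\rho_{2n}^{-1/2} \tag{4.43a} $$
+and
+$$ R(\rho_{2n+2}) \approx c_{2n+2}\,\rho_{2n+2}^{-1/2} \approx c_{2n+2} \left[ \rho_{2n} + \frac{\pi}{2k_0} \left( \frac{1}{n_0} + \frac{1}{n_1} \right) \right]^{-1/2}. \tag{4.43b} $$
+From the requirement of continuity of $E_\phi \propto R'(\rho)/\epsilon(\rho)$ at $\rho = \rho_{2n+1}$ it follows that $c_{2n+2}/c_{2n+1} =
+-n_0/n_1$. Hence,
+$$ \left| \frac{R(\rho_{2n+2})}{R(\rho_{2n})} \right| \approx \frac{n_0}{n_1} \left[ 1 + \frac{\pi}{2 k_0 \rho_{2n}} \left( \frac{1}{n_0} + \frac{1}{n_1} \right) \right]^{-1/2} \xrightarrow{\,n \to \infty\,} \frac{n_0}{n_1}. \tag{4.44} $$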
+Thus, a localised mode is obtained only if the refractive index of the central rod, $n_0$, is chosen smaller
+than that of the first ring, $n_1$.
+Figure 4.6(a) shows the geometry of an example cavity constructed with the above algorithm. The
+system consists of an alternating sequence of rings made of air (refractive index $n_0 = 1$) and a MO
+material with refractive index $n_1 = 2.25$. It supports a pair of degenerate localised eigenmodes of
+azimuthal order $l = 1$. The magnetic field of the even mode is plotted in fig. 4.6(b); the field of the odd
+mode can be obtained by rotating the map from fig. 4.6(b) by $90^\circ$ in the counter-clockwise direction. In
+fig. 4.6(c), the radial dependence of these magnetic fields, $R(\rho)$, is juxtaposed with the radial dependence
+of $\vec{e}_z \cdot (\vec{E}_e^{*} \times \vec{E}_o)$ calculated from eq. (4.37). Clearly, $R(\rho)R'(\rho)$ is negative throughout the MO rings and
+positive elsewhere; as a result, no cancellations in the upper integral in eq. (4.39) occur. The reduced
+coupling strength of this pair of modes is $v = 0.00874$.
+4.4 Photonic-crystal-based circulators
+The insight gained in the previous section is valuable not only in the design of axisymmetric cavities
+with maximum frequency splitting induced by a uniform SEMF, but also of PC-based ones. Figure
+4.6(c) shows that the cross product $\vec{E}_e^{*} \times \vec{E}_o$ in a well-designed axisymmetric cavity has a significant
+amplitude only within the rings closest to the cavity centre. Thus, one can conclude that the frequency
+4.4. Photonic-crystal-based circulators 83
+(a) (b)
+(c) (d)
+0
+r
+in
+Figure 4.7 Adjustment of an axisymmetric cavity for integration into a PC lattice. (a) Superposition of the
+cavity and a hexagonal block of the PC. (b) Structure obtained by combining the central air hole and the innermost
+air ring of the cavity with the external region of the PC block. (c) The result of shifting the circular air holes of
+the cavity from part (b) in the radial direction, according to the mapping described in the text. (d) The cavity from
+part (c) with its air ring approximated by a string of circular air holes.
+splitting of the cavity modes depends mostly on the geometry of the innermost region, whereas the
+primary function of the external rings is to provide a sufficient isolation from the surrounding free space.
+The MO properties of the cavity should not suffer, therefore, if the inner air rings were preserved, whereas
+the outer ones were replaced by a regular photonic lattice.
+In practice, some difficulties related to geometric constraints can arise. Consider, for instance, a
+2D PC made up of a hexagonal lattice of circular air holes with radius $0.30a$, where $a$ is the lattice
+constant, etched in a matrix of a MO material with refractive index $n = 2.5$ (close to that of BIG
+at infrared frequencies). This crystal has a band gap for p-polarised waves with frequencies between
+$\omega = 0.285$ and $0.350 \times 2\pi c/a$. In fig. 4.7(a) its geometry is juxtaposed with the contours of the BIG
+rings of the axisymmetric cavity composed of BIG and air and supporting a pair of eigenmodes with
+azimuthal order $l = 1$, frequency $\omega = 0.320 \times 2\pi c/a$ and reduced coupling strength $v = 0.0062$. The
+dimensions of the rings are listed in table 4.1. It can be seen that no matter how many inner rings are
+preserved, a wide gap will appear between them and the surrounding PC. Its presence will certainly shift
+the eigenfrequencies of the cavity modes and diminish the frequency splitting between them: the modes
+will be more weakly localised, and hence the denominator of expression (4.32) for V will increase,
+while the numerator will stay roughly the same. In order to overcome this difficulty, we propose to
+adjust the positions of the PC holes using an appropriate coordinate transform. While its optimum
+form remains an open problem, we obtained satisfactory results with a simple mapping whose principle
+is illustrated in figs. 4.7(b) and (c). The mapping has the form $(\rho, \phi) \mapsto (a(\phi)\rho + b(\phi), \phi)$, where
+the coefficients $a(\phi)$ and $b(\phi)$ are chosen so that the centres of the holes hatched horizontally in fig.
+4.7(b) move onto a circle of radius $\rho'_{\mathrm{in}}$, as shown in fig. 4.7(c), while the position of the ones hatched
+vertically does not change. We have found the value of $\rho'_{\mathrm{in}} = 2.60a$ to be approximately optimal for the
+considered system.
+84 Chapter 4. Magneto-optical circulators
+Ring number Inner radius Outer radius
+1 0.916a 1.255a
+2 1.995a 2.319a
+3 3.068a 3.387a
+4 4.143a 4.461a
+5 5.221a 5.538a
+Table 4.1 Radii of the high-index rings of the cavity with $\varepsilon_h = (2.5)^2 = 6.25$ and $\varepsilon_l = 1$ supporting a resonant
+mode with azimuthal order $l = 1$ at frequency $\omega = 0.32 \times 2\pi c/a$.
+# x/a y/a r/a # x/a y/a r/a # x/a y/a r/a
+1 0.000 0.000 0.92 8 2.967 3.426 0.30 15 4.000 3.464 0.30
+2 1.403 0.810 0.40 9 3.001 1.733 0.30 16 4.451 0.857 0.30
+3 1.620 0.000 0.40 10 3.433 0.849 0.30 17 4.500 2.598 0.30
+4 1.965 1.702 0.30 11 3.496 2.595 0.30 18 4.867 0.000 0.30
+5 2.452 2.548 0.30 12 3.500 4.330 0.30 19 5.000 1.732 0.30
+6 2.457 0.851 0.30 13 3.733 0.000 0.30 20 5.500 0.866 0.30
+7 2.600 0.000 0.30 14 3.995 1.730 0.30 21 6.000 0.000 0.30
+Table 4.2 Cartesian coordinates $(x, y)$ and radii $r$ of the circular air holes making up the cavity shown in fig.
+4.7(d). For brevity, only the holes lying in the sector $0 \le \phi < 60^\circ$ are included.
+To simulate PC-based cavities and circulators, we have been using the multiple-scattering method
+extended to systems containing MO materials (see section 5.1). At present, our code cannot handle
+scatterers composed of several concentric layers. Therefore we have approximated the preserved air ring
+with a string of air holes with radius 0:4a arranged on a circle of radius 1:62a, in the hope that this will
+not seriously deteriorate the MO properties of the cavity. In this way we arrived at the final geometry
+of the proposed PC-based cavity, shown in fig. 4.7(d). For completeness, the positions and radii of its
+constituent air holes are listed in table 4.2.
+By means of the multiple-scattering method we have found that in the absence of SEMF the cavity
+in question supports a pair of degenerate dipolar modes at the complex frequency
+$\omega = (0.31241 - 0.00037i) \times 2\pi c/a$ [148]. Figures 4.8(a) and (b) show the magnetic field $H_z$ corresponding to these
+modes, and fig. 4.8(c), the cross product of their electric fields weighted with $g(\vec{r})$ taken to be 1 in the
+MO material and 0 in air. It can be seen that the cross product remains positive practically everywhere
+in the MO material. The reduced mode coupling strength is $v = 0.0048$, which is slightly less than
+the value obtained for the initial axisymmetric cavity. This deterioration could probably be reduced
+by a more careful optimisation of the transition between the inner region, approximately axisymmetric,
+and the surrounding PC lattice. However, the obtained value of $v$ is still eight times larger than that
+of the cavity from ref. 34, figs. 2 and 3(a)–(b), placed in a uniform SEMF, i.e., without introduction of
+oppositely-magnetised domains. For the sake of comparison, the map of $g\,\vec{e}_z \cdot (\vec{E}_e \times \vec{E}_o)$ of that cavity
+is shown in fig. 4.8(d). It can be seen that the cross product changes sign inside the defect, so that the
+contributions of the areas with positive and negative $\vec{e}_z \cdot (\vec{E}_e \times \vec{E}_o)$ almost cancel out.
+The next step in the design of a PC circulator is the determination of the geometry of waveguides.
+The simplest would be to make them by removing a single row of holes from the chosen hexagonal-lattice
+PC. Yet, as can be seen on the dispersion diagram in fig. 4.9(a), such waveguides, while being technically
+single-mode at the resonant frequency of the cavity, $\omega_0 = 0.31241 \times 2\pi c/a$, support another mode, whose
+cut-off frequency, $0.314 \times 2\pi c/a$, is barely higher than $\omega_0$. Its decay constant can therefore be expected
+to be small. As a result, even relatively long waveguides of this type might still exhibit multi-mode be-
+4.4. Photonic-crystal-based circulators 85
+1:0
+5:0 (a) 5:0 (b)
+0:5
+2:5 2:5
+0:0 0:0 0:0
+ 2:5  2:5  0:5
+ 5:0  5:0
+ 1:0
+ 5 0 5  5 0 5
+x=a x=a
+1:0
+5:0 (c) 2 (d)
+0:5
+2:5 1
+0:0 0 0:0
+ 2:5  1  0:5
+ 5:0  2
+ 1:0
+ 5 0 5  2 0 2
+x=a x=a
+Figure 4.8 (a)–(b) Magnetic field $H_z$ of the degenerate eigenmodes of the cavity from fig. 4.7(d). (c) Distri-
+bution of $g\,\vec{e}_z \cdot (\vec{E}_e \times \vec{E}_o)$ of the same cavity. (d) Distribution of $g\,\vec{e}_z \cdot (\vec{E}_e \times \vec{E}_o)$ of the cavity from ref. 34, figs.
+2 and 3(a)–(b). All plots show the real parts of the respective quantities normalised to the interval $[-1, 1]$; with the
+chosen global phase of eigenmode fields, the imaginary parts are negligible.
+haviour. This problem can be eliminated by bringing the holes nearest to the waveguide axis even closer
+to it, which causes a blueshift of the dispersion curves of both the modes. The dispersion curve of the
+lower-frequency mode must not be allowed to move up too much, though, since this would lead to a sub-
+stantial decrease of its group velocity at frequency $\omega_0$. Such a decrease would be accompanied by an in-
+crease of absorption [123] and scattering losses [159] in the presence of structural defects, unavoidable in
+an experimentally manufactured device. The waveguide obtained by shifting its innermost holes by
+$d_w = 0.09a$ towards its axis seems a reasonable compromise; its dispersion diagram is shown in fig. 4.9(b).
+We can now proceed to simulations of a complete circulator. The device to be considered, shown
+schematically in fig. 4.10, is composed of the cavity from fig. 4.7(d) and three waveguides designed
+as described in the previous paragraph. The holes marked by hatching, located near the ends of the
+waveguides, will be modified for reasons explained in what follows. The waveguides comprise $N = 12$
+unmodified unit cells and the total thickness of their cladding is $d_{\mathrm{clad}} = 5\sqrt{3}a$. The whole system is
+embedded in the MO material, assumed to have $g = 0.1$. The system is excited by a point source placed
+close to the inlet of waveguide W1. As in the case of the isolated cavity, the simulations are done with
+the multiple-scattering method.
+We have tested two ways of measuring the power transmitted through the circulator. The first consists
+in integrating the Poynting flux over the “ports” $P_j$ ($j = 2, 3$) of length $4\sqrt{3}a$, shown in fig. 4.10. The
+results obtained in this way would be severely perturbed by reflections occurring at the outlets of the
+waveguides W2 and W3. To eliminate them, we have modified the radius $r_h$ of the holes lying closest
+to waveguide ends, hatched horizontally in fig. 4.10. Using the method described in ref. 160, we have
+y=a y=a
+y=a
+y=a
+jHz j geE  .EEz EEe o/
+86 Chapter 4. Magneto-optical circulators
+0:4
+0:3
+0:2
+0:1
+(a) (b)
+0:0
+0:0 0:1 0:2 0:3 0:4 0:5 0:0 0:1 0:2 0:3 0:4 0:5
+ka=2  ka=2 
+Figure 4.9 Dispersion relation of p-polarised modes of (a) a waveguide created by removing a row of air holes
+from the PC studied in section 4.4, (b) the waveguide from part (a) after shifting the holes nearest to the waveguide
+axis by $0.09a$ towards it. The regions of the $(k, \omega)$-space in which bulk PC modes exist have been shaded. Dashed
+horizontal lines mark the resonant frequency of the cavity from fig. 4.7(d), $\omega = 0.31241 \times 2\pi c/a$. All calculations
+have been done with the method described in section 5.2.
+verified that if $r_h$ is reduced from $0.30a$ to $0.17a$, the modal reflectance of the waveguide outlet at frequency $\omega_0$
+decreases to barely 0.04%.
+The second technique for obtaining the scattering matrix of the system consists in fitting the field
+in the waveguides with a linear combination of their forward- and backward-propagating guided modes.
+Since there are practically no reflections at the waveguide outlets, we can approximate the magnetic field
+at points $Q_{j,n}$ marked in fig. 4.10 by
+$$H_z(Q_{1,n}) = H_{\mathrm{inc}} \Phi^{n} + r H_{\mathrm{inc}} \Phi^{2N-n}, \qquad (4.45a)$$
+$$H_z(Q_{2,n}) = t_2 H_{\mathrm{inc}} \Phi^{N+n}, \qquad (4.45b)$$
+$$H_z(Q_{3,n}) = t_3 H_{\mathrm{inc}} \Phi^{N+n}, \qquad (4.45c)$$
+where $\Phi \equiv e^{ika}$, $k$ denotes the wave number of the waveguide eigenmode, $H_{\mathrm{inc}}$ stands for the excitation
+amplitude, $r$ is the reflection coefficient of the circulator, and $t_2$ and $t_3$, the transmission coefficients into
+waveguides W2 and W3. Since the wave number $k$ is known from the dispersion diagram shown in fig.
+4.9(b), we can find the coefficients $r$, $t_2$ and $t_3$ simply from a linear least-squares fit of formulas (4.45)
+to the data obtained in simulations. To avoid perturbations induced by the presence of evanescent modes
+near the waveguide ends, in the fitting procedure we have disregarded the points $Q_{j,n}$ with indices $n < 3$
+and $n > N - 3$. The spirit of this approach is similar to that advocated in ref. 160. In contrast to the
+method based on Poynting flux integration, it allows one to calculate not only the transmittances $T_j \equiv |t_j|^2$
+($j = 2, 3$), but also the reflectance $R \equiv |r|^2$ and the amount of power lost to non-guided modes,
+$1 - (R + T_2 + T_3)$.
+Figure 4.11 shows a juxtaposition of the values of the isolation coefficient $I \equiv T_2/T_3$ obtained with
+the two above methods for the circulator from fig. 4.10. Clearly, there is an excellent match between the
+two sets of data. Therefore in the following we shall limit our discussion to the results obtained with the
+second, more powerful approach.
+Figure 4.12(a) presents the frequency dependence of the transmittances $T_2$ and $T_3$ of the same cir-
+culator, along with the total power passed to guided modes, $P \equiv R + T_2 + T_3$. It can be seen that in
+the neighbourhood of $\omega_0$ the amount of power not accounted for by the guided modes increases to about
+10%. We believe this power deficit to be primarily a consequence of radiation occurring from the cavity,
+and possibly also from the waveguides, into free space. These losses might conceivably be reduced if the
+thickness of the cladding were increased.
+!a=2 c
+4.4. Photonic-crystal-based circulators 87
+dclad
+P3
+2r
+Waveguide W h3
+: : Q
+3
+: N
+: :
+: : : :
+: : :: : :
+a .N   1/a
+Q3
+2
+Q3
+: : : 1
+: : :
+: : :
+: : :
+: : :
+Q1 Q1 Q1  
+1 2 : : : N
+: : :
+: : :
+: : :
+: : :
+Q2
+1
+Q2Waveguide W1 2
+: : :: : :
+: : : :
+Point source : :
+: : :
+Q2
+N
+Waveguide W2 P2
+ p 
+3
+  dw a2
+Figure 4.10 Schematic of the PC circulator described in the text.
+: : :
+: : :
+: : :
+: : :
+
+
+: : : 
+: : :
+: : :
+: : :
+: : :
+: : :
+
+
+
+88 Chapter 4. Magneto-optical circulators
+100
+Method 1
+Method 2
+10
+1
+0:3110 0:3115 0:3120 0:3125 0:3130
+!a=2 c
+Figure 4.11 Comparison of the isolation I of the circulator from fig. 4.10 calculated by integrating the Poynt-
+ing fluxes through ports P2 and P3 (“method 1”, crosses) and by fitting the data obtained in multiple-scattering
+simulations with formulas (4.45) (“method 2”, circles).
+1:00 100
+(a)
+0:75
+T2
+T3
+0:50 10
+P
+I
+0:25
+0:00 1
+0:3110 0:3115 0:3120 0:3125 0:3130
+!a=2 c
+1:00 10000
+(b)
+0:75 1000
+T2
+T3
+0:50 100
+P
+I
+0:25 10
+0:00 1
+0:3115 0:3120 0:3125 0:3130 0:3135
+!a=2 c
+Figure 4.12 Frequency dependence of the transmittances $T_2$ and $T_3$, isolation $I$, and the sum $P \equiv R + T_2 + T_3$
+of the circulator shown in fig. 4.10 with the vertically hatched holes shifted by (a) $d_h = 0$ and (b) $d_h = -0.038a$
+in the radial direction with respect to their original position. All the quantities were calculated by fitting the data
+obtained in multiple-scattering simulations with formulas (4.45).
+T2, T3, P T2, T3, P
+Isolation I
+I
+I
+4.4. Photonic-crystal-based circulators 89
+# x/a y/a r/a # x/a y/a r/a # x/a y/a r/a
+1 0.000 0.000 0.92 32 5.922 8.705 0.30 63 8.422 13.035 0.30
+2 0.810 1.403 0.40 33 6.000 0.000 0.30 64 8.500 6.062 0.30
+3 1.403 0.810 0.40 34 6.000 1.732 0.30 65 8.500 7.794 0.30
+4 1.620 0.000 0.40 35 6.000 3.464 0.30 66 8.500 9.526 0.30
+5 1.965 1.702 0.30 36 6.000 5.196 0.30 67 8.500 11.258 0.30
+6 2.452 2.548 0.30 37 6.000 6.928 0.30 68 8.922 13.901 0.30
+7 2.457 0.851 0.30 38 6.422 9.571 0.30 69 9.000 6.928 0.30
+8 2.600 0.000 0.30 39 6.500 0.866 0.30 70 9.000 8.660 0.30
+9 2.967 3.426 0.30 40 6.500 2.598 0.30 71 9.000 10.392 0.30
+10 3.001 1.733 0.30 41 6.500 4.330 0.30 72 9.000 12.124 0.30
+11 3.422 4.375 0.30 42 6.500 6.062 0.30 73 9.500 7.794 0.30
+12 3.433 0.849 0.30 43 6.500 7.794 0.30 74 9.500 9.526 0.30
+13 3.496 2.595 0.30 44 6.922 10.437 0.30 75 9.500 11.258 0.30
+14 3.733 0.000 0.30 45 7.000 0.000 0.30 76 9.500 12.990 0.30
+15 3.922 5.241 0.30 46 7.000 1.732 0.30 77 10.000 8.660 0.30
+16 3.995 1.730 0.30 47 7.000 3.464 0.30 78 10.000 10.392 0.30
+17 4.000 3.464 0.30 48 7.000 5.196 0.30 79 10.000 12.124 0.30
+18 4.422 6.107 0.30 49 7.000 6.928 0.30 80 10.000 13.856 0.30
+19 4.451 0.857 0.30 50 7.000 8.660 0.30 81 10.500 9.526 0.30
+20 4.500 2.598 0.30 51 7.422 11.303 0.30 82 10.500 11.258 0.30
+21 4.500 4.330 0.30 52 7.500 0.866 0.30 83 10.500 12.990 0.30
+22 4.867 0.000 0.30 53 7.500 2.598 0.30 84 10.500 14.722 0.30
+23 4.922 6.973 0.30 54 7.500 4.330 0.30 85 11.000 10.392 0.30
+24 5.000 1.732 0.30 55 7.500 6.062 0.30 86 11.000 12.124 0.30
+25 5.000 3.464 0.30 56 7.500 7.794 0.30 87 11.000 13.856 0.30
+26 5.000 5.196 0.30 57 7.500 9.526 0.30 88 11.500 11.258 0.30
+27 5.422 7.839 0.30 58 7.922 12.169 0.30 89 11.500 12.990 0.30
+28 5.500 0.866 0.30 59 8.000 5.196 0.30 90 12.000 12.124 0.30
+29 5.500 2.598 0.30 60 8.000 6.928 0.30 91 12.000 13.856 0.30
+30 5.500 4.330 0.30 61 8.000 8.660 0.30 92 12.500 12.990 0.30
+31 5.500 6.062 0.30 62 8.000 10.392 0.30 93 9.422 14.767 0.17
+Table 4.3 Cartesian coordinates $(x, y)$ and radii $r$ of the circular air holes making up the optimised circulator
+shown in fig. 4.13. For brevity, only the holes lying in the sector $0 \le \phi \le 60^\circ$ are included.
+The maximum isolation obtained with the circulator from fig. 4.10, $I \approx 50$, is somewhat unsatis-
+factory. According to the coupled-wave model from section 4.2, low maximum $I$ may be caused by
+a suboptimal coupling level between the cavity and the waveguides. This level can be controlled by
+fine-tuning the positions of the holes in the neighbourhood of the cavity. We have found that by shifting
+the holes hatched vertically in fig. 4.10 by $d_h = -0.038a$ in the radial direction, the maximum isolation
+can be boosted to about 2600, as shown in fig. 4.12(b). The isolation $I$ stays above 100 in a frequency
+band of width $B(100) = 0.00011 \times 2\pi c/a$, which corresponds to 81 GHz for the operation wavelength
+$\lambda = 1300$ nm. The level of power losses to radiative modes, $1 - P$, does not change appreciably with
+respect to the case from fig. 4.12(a). Figure 4.13 shows the map of the magnetic field excited by a point
+source placed close to the entrance of waveguide W1 of the “optimised” circulator with $d_h = -0.038a$ at
+frequency $\omega = 0.3124 \times 2\pi c/a$, where maximum isolation is obtained. The standing-wave ratio in the
+input waveguide is very small, which reflects the good quality of the match between the waveguides and
+the cavity. Table 4.3 lists the positions and radii of the air holes making up the optimised circulator.
+90 Chapter 4. Magneto-optical circulators
+1:0
+20
+0:8
+10
+0:6
+0
+0:4
+ 10
+0:2
+ 20
+0:0
+ 20  10 0 10
+x=a
+Figure 4.13 Magnitude of the magnetic field $H_z$ in the circulator with $d_h = -0.038a$, excited by a point source
+of frequency $\omega = 0.3124 \times 2\pi c/a$.
+4.5 Rib-waveguide-based circulators
+4.5.1 Introduction
+In section 4.4 we have shown how an axisymmetric cavity designed along the rules derived in section 4.3
+can be adapted for embedding in a PC lattice and coupling with PC waveguides. One could well ask,
+however, whether the introduction of a periodic lattice is strictly necessary. At first sight, the answer is
+no. Having the form of a circular Bragg grating, the cavity is by itself well isolated from the surrounding
+medium (at least in-plane), so there is little to be gained by embedding it additionally in a PC exhibiting
+a band gap. The PC waveguides can also be straightforwardly replaced by rib waveguides with constant
+cross-section, whose operation is based on the index-guiding mechanism. To obtain a working circulator,
+however, one needs also to ensure the appropriate level of coupling between the localised cavity and
+waveguide modes and to minimise the power lost to free space during the energy transfer between these
+two families of modes. The latter objective is much easier to fulfil in a PC-based circulator, which
+operates in the band gap of the periodic lattice surrounding all the functional elements. Nevertheless, in
+this section we shall study a class of non-PC-based systems that allow to achieve the two goals mentioned
+above, at least to a certain degree.
+The general geometry of the structures to be considered is shown in fig. 4.14. The depicted circulator
+consists of a resonant cavity, composed of $n_f$ full and $n_s$ split rings with inner and outer radii determined
+by the procedure described in section 4.3, and three identical waveguides of width $d_{\mathrm{wg}}$. The distance
+from the centre of the cavity to the ends of the waveguides is $\rho_{\mathrm{wg}}$, while the widths of the slits in the split
+rings are denoted by $d_n$ with $n = n_f + 1$, $n_f + 2$, \ldots, $n_f + n_s$. The rings and waveguides are made of a
+y=a
+jHz j
+4.5. Rib-waveguide-based circulators 91
+dwg
+d6 d5 d4 d3
+rwg
+Figure 4.14 Geometry of an example rib-waveguide-based circulator with nf = 2 full and ns = 4 split rings.
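+MO material with permittivity
+$$\hat{\varepsilon}_h = \begin{bmatrix} \varepsilon_h & ig & 0 \\ -ig & \varepsilon_h & 0 \\ 0 & 0 & \varepsilon_h \end{bmatrix} \qquad (4.46)$$
+and are embedded in an isotropic medium with permittivity $\varepsilon_l$.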
+The level of coupling between the cavity and waveguide modes, and hence the circulator’s perfor-
+mance, will of course depend on the values of all the geometrical parameters, which should therefore
+be optimised. The space spanned by them is rather large, and it is not possible to scan it exhaustively.
+Therefore our optimisation of the presented structure has been somewhat heuristic. We have chosen the
+material parameters as $\varepsilon_h = (2.25)^2 = 5.0625$, $\varepsilon_l = 1$ and $g = 0.1$; the quoted value of $\varepsilon_h$ corresponds
+approximately to the effective index of the fundamental s-polarised guided mode of a planar waveguide
+composed of a BIG layer of thickness 340 nm sandwiched between GGG and air. The waveguide width
+$d_{\mathrm{wg}}$ was fixed to 250 nm. The radii of the rings, listed in table 4.4, were determined with the procedure
+described in section 4.3 to ensure the existence of a pair of cavity modes with the azimuthal order $l = 1$
+at the wavelength $\lambda = 1300$ nm.
+92 Chapter 4. Magneto-optical circulators
+Ring number Inner radius (nm) Outer radius (nm)
+1 381 539
+2 847 998
+3 1309 1457
+4 1772 1919
+5 2236 2382
+6 2700 2846
+7 3165 3310
+Table 4.4 Radii of the high-index rings of the cavity with $\varepsilon_h = (2.25)^2 = 5.0625$ and $\varepsilon_l = 1$ supporting a
+resonant mode with azimuthal order $l = 1$ at wavelength $\lambda = 1300$ nm.
+With the chosen value of $g$, the relative frequency splitting of the cavity is $\Delta\omega/\omega_0 = 2gv = 0.00175$.
+From eq. (4.27), in the absence of losses the optimum value of $\gamma/\omega_0$ is 0.00151, i.e., the quality factor
+$Q \equiv \omega_0/(2\gamma)$ describing the cavity-waveguide coupling should be $Q = 330$. The quality factors of
+the chosen cavity with 3 and 4 rings are 163 and 829, respectively. Therefore one can expect that the
+waveguides of an optimally designed circulator should end somewhere close to the third innermost ring—
+or possibly even inside it, since the coupling to waveguides is doubtlessly less efficient than to the whole
+surrounding free space.
+The total number of rings necessary for ensuring a prescribed level of peak transmission Tmin could
+in principle be estimated from eq. (4.30): for instance, for Tmin = 0:9 the quality factor Ql describing
+radiation loss should be greater than 6430. This is already ensured by a cavity composed of 6 rings,
+whose quality factor reaches 21,140. However, the quality factors of cavities with split outer rings will
+necessarily be smaller than of those with full rings; therefore, a larger number of rings might be necessary
+to ensure a 90-percent efficiency. In our calculations, we restricted our attention to systems with at most
+7 rings.
+The results of the optimisation process will be reported on in subsection 4.5.3. In the meantime,
+we shall describe the numerical method used to analyse these systems and evaluate the accuracy of
+calculations.
+4.5.2 Numerical calculations
+The calculations of the transmission through the circulators studied in this section, and shown schemati-
+cally in fig. 4.14, have been performed with the finite-element method (FEM) using the RF module of the
+COMSOL program. In contrast to the multiple-scattering method used to analyse PC-based circulators in
+ref. 148, FEM can easily handle structures composed of scatterers with complex (especially elongated)
+shapes. On the other hand, unlike that method, it requires a finite computational domain. Since the
+system shown in fig. 4.14 is, in principle, infinite, it must be truncated for the sake of FEM calculations.
+Problems involving light scattering by finite objects are routinely handled with FEM by letting the
+computational domain consist of a finite region enclosing the objects in question and surrounded by
+a perfectly matched layer (PML) of finite thickness, which ideally behaves as a perfect non-reflecting
+absorber [53]. In our case, the situation is complicated by the presence of infinite waveguides; the
+scatterer to be modelled obviously cannot fit within any finite contour. To circumvent this problem, we
+construct the computational domain in the way shown in fig. 4.15. The region surrounded by the dashed
+line is a fragment of the physical system shown in fig. 4.14. The parts of its boundary lying “far” from
+the waveguide ends are covered with PMLs of thickness dPML. We have used standard PMLs adapted
+4.5. Rib-waveguide-based circulators 93
+Circulator $n_f$ $n_s$ $\rho_{\mathrm{wg}}$ (nm) $d$ (nm) $\theta_{\mathrm{cone}}$ ($^\circ$)
+C1 3 3 1250 1570 —
+C2 3 4 1240 1770 —
+C3 3 4 1210 — 35.1
+Table 4.5 Geometrical parameters of the circulators analysed in the text. The ring radii are listed in the first
+$(n_f + n_s)$ rows of table 4.4.
+for cylindrical coordinates, implemented in COMSOL by means of the coordinate transform?
+$$\rho \mapsto \frac{\rho - \rho_{\mathrm{in}}}{d_{\mathrm{PML}}} \, s_{\mathrm{PML}} (1 - i), \qquad (4.47)$$
+where $\rho$ is the radial coordinate measured from the centre of the cavity, $\rho_{\mathrm{in}}$ denotes the radius of the
+inner PML boundary, and $s_{\mathrm{PML}}$, called the PML strength, influences the field decay rate inside the PML
+[161, p. 44]. On the other hand, the electromagnetic fields on the segments $P_n$ ($n = 1, 2, 3$) perpendicu-
+lar to the waveguides are constrained to be a superposition of the incoming and outgoing guided modes
+of the corresponding waveguides, which are assumed to be single-mode. The profile of these modes is
+calculated analytically and normalised to unitary power, and the amplitude of the incoming mode is set
+to unity on P1 and to zero on P2 and P3. Physically, these constraints correspond to the assumption
+that all the radiative waveguide modes excited by the cavity decay before reaching the ports Pn. Math-
+ematically, they reduce to Robin’s boundary conditions and are implemented as COMSOL’s matched
+boundary conditions. On the remaining part of the computational domain’s boundary (solid line in fig.
+4.15) perfect-electric-conductor boundary conditions are imposed. The domain is divided into triangular
+Lagrangian elements of order $p$. The mesh density is controlled by fixing the maximum allowed size
+of individual elements in each subdomain with constant permittivity $\varepsilon$ to $h_{\max}/\sqrt{\varepsilon}$, where $h_{\max}$ is a
+constant. The mesh in areas with higher permittivity is made finer, since the fields in these regions are
+expected to vary faster.
+In our calculations we are primarily interested in the isolation factor $I = T_2/T_3$, where $T_2$ and $T_3$
+are the powers transmitted through ports $P_2$ and $P_3$. We can see that the numerically calculated value
+of $I$ of a given circulator at a fixed free-space wavelength $\lambda$ depends on the following six parameters:
+• maximum element size in air, $h_{\max}$,
+• element order, $p$,
+• PML thickness, $d_{\mathrm{PML}}$,
+• PML strength, $s_{\mathrm{PML}}$,
+• length of the part of the waveguides extending past the outermost ring, $d_{\mathrm{sep}}$,
+• port height, $d_{\mathrm{port}}$.
+To determine the values of these parameters sufficient for obtaining satisfactory accuracy, we have stud-
+ied the influence of their variation on the isolation I of a particular circulator, denoted henceforth as C1,
+whose parameters are listed in the first row of table 4.5.
+We tested first the dependence of I on hmax and p for fixed values of the remaining parameters.
+Figure 4.16(a) shows the values of I obtained for p = 2 and five different values of hmax, whereas
+fig. 4.16(b) presents the dependence of I on the element order p with hmax fixed to 500 nm. We see
+that the convergence with increasing p is much faster than with decreasing hmax. Therefore in future
+calculations we have taken hmax = 500 nm and p = 5.
+? In COMSOL simulations the $e^{i\omega t}$ convention for time-harmonic dependence is used, opposite to that employed here.
+94 Chapter 4. Magneto-optical circulators
+PML
+P3
+PML
+dsep dPML
+dport P1
+P2
+PML
+Figure 4.15 Geometry of the domain used in FEM calculations.
+400
+(a) (b)
+300
+200
+100
+0
+500 250 125 62:5 2 3 4 5
+hmax (nm) p
+Figure 4.16 Influence of the finite-element expansion parameters, hmax and p, on the calculated value of the
+isolation I of circulator C1. The parameters related to the truncation of the computational domain are fixed to
+$d_{\mathrm{sep}} = 5000$ nm, $d_{\mathrm{PML}} = 600$ nm, $s_{\mathrm{PML}} = \lambda$ and $d_{\mathrm{port}} = 2250$ nm. The wavelength $\lambda = 1299.5$ nm was chosen to
+lie in the proximity of the maximum of $I(\lambda)$, but not exactly at it. (a) Convergence of $I$ with decreasing maximum
+element size in air, hmax, at fixed element order p = 2. (b) Convergence of I with increasing element order p at
+fixed hmax = 500 nm.
+I
+4.5. Rib-waveguide-based circulators 95
+86
+84
+82
+sPML D 
+sPML D 2
+80
+0 250 500 750 1000
+dPML (nm)
+Figure 4.17 Convergence of the isolation I of circulator C1 with increasing PML thickness dPML. Two PML
+strengths, $s_{\mathrm{PML}} = \lambda$ and $2\lambda$, are considered; the wavelength $\lambda = 1299.5$ nm. The other parameters are fixed as
+hmax = 500 nm, p = 5, dsep = 5000 nm and dport = 2250 nm.
+(a) (b)
+Figure 4.18 Change of the mesh structure in the PML with dPML increasing from (a) 400 nm to (b) 500 nm.
+Note that in the former case the mesh of the PML consists of two interleaving rows of triangles, whereas in the
+latter case the number of rows increases to four.
+We proceeded to the study of the influence of the PML parameters, $d_{\mathrm{PML}}$ and $s_{\mathrm{PML}}$. Figure 4.17
+shows the dependence of $I$ on the PML thickness for two different PML strengths, $s_{\mathrm{PML}} = \lambda$ and $2\lambda$.
+It can be seen that the values obtained with $s_{\mathrm{PML}} = \lambda$ (which is COMSOL’s default) are very stable
+with respect to $d_{\mathrm{PML}}$: the difference between the maximum and minimum value of $I$ does not exceed
+0.15%. On the other hand, the $I(d_{\mathrm{PML}})$ curve corresponding to $s_{\mathrm{PML}} = 2\lambda$ has a noticeable jump
+between $d_{\mathrm{PML}} = 400$ and 500 nm. This jump is due to a change in the mesh structure: as illustrated in
+fig. 4.18, for $d_{\mathrm{PML}} = 400$ nm the mesh in the PML region consists of two rows of triangles, while for
+$d_{\mathrm{PML}} = 500$ nm two more rows appear. For $d_{\mathrm{PML}} \ge 600$ nm the isolation factors obtained with both
+PML strengths are very similar; moreover, the subsequent appearance of another pair of rows, occurring
+between $d_{\mathrm{PML}} = 800$ and 900 nm, does not have any discernible effect on the $I(d_{\mathrm{PML}})$ curves. All
+in all, the detailed choice of the PML parameters does not seem very important for the accuracy of the
+calculations. Therefore, we continue to take $d_{\mathrm{PML}} = 600$ nm and $s_{\mathrm{PML}} = \lambda$.
+We studied next the sensitivity of $I$ to $d_{\mathrm{sep}}$. The $I(d_{\mathrm{sep}})$ curves shown in fig. 4.19, corresponding
+to two different wavelengths, exhibit irregular oscillations of amplitude roughly equal to 3% of the mean
+value. We interpret them as stemming mainly from the interference of the fundamental waveguide mode
+with slowly decaying radiative modes excited by the cavity. Another culprit might be the mesh modifi-
+cations induced by changes of the location of the domain’s boundary. Elimination of these oscillations
+would be difficult without considerable enlargement of the computational domain, which would neces-
+I
+96 Chapter 4. Magneto-optical circulators
+88
+(a)  D 1299:5 nm (b)  D 1300:5 nm
+21:0
+87
+86
+20:5
+85
+84 20:0
+3000 4000 5000 6000 7000 8000 3000 4000 5000 6000 7000 8000
+dsep (nm) dsep (nm)
+Figure 4.19 Dependence of the isolation $I$ of circulator C1 on the value of $d_{\mathrm{sep}}$ for two different wavelengths $\lambda$
+located in the neighbourhood of a maximum of $I(\lambda)$. The other parameters are fixed as $h_{\max} = 500$ nm, $p = 5$,
+$d_{\mathrm{PML}} = 600$ nm, $s_{\mathrm{PML}} = \lambda$ and $d_{\mathrm{port}} = 2250$ nm.
+sarily lead to a drastic increase of the time of calculations. Therefore, we decide to leave unchanged the
+value dsep = 5000 nm taken previously.
+The choice of $d_{\mathrm{port}}$ is definitely the most difficult. In principle, the value of $d_{\mathrm{port}}/2$ should corre-
+spond to the distance from the waveguide axis at which the magnitude of the field of the guided mode
+becomes comparable to that of the radiative modes excited by the cavity. Unfortunately, it is not easy to
+determine this distance a priori. The value $d_{\mathrm{port}} = 2250$ nm taken so far corresponds to the width of a
+port at whose ends the magnetic field of the waveguide mode with $\lambda = 1300$ nm decays to 1% of its
+maximum value.
+Figure 4.20 shows the dependence of I on dport at four different wavelengths. For ease of compar-
+ison, the plots have been normalised to the values of I obtained for dport = 3000 nm. The curves have
+several interesting features. First, the isolation factor varies very rapidly for small values of dport. This
+is not surprising: for such small port lengths, the incident field is not represented accurately, since the
+profile of the waveguide mode is severely truncated in the direction perpendicular to the waveguide axis.
+Second, for large port lengths we observe a steady, seemingly linear decay of I. In fact, a look at the
+plots of the field excited on these long ports reveals that in the port regions lying far from the waveguide
+axis the field shape does not resemble that of the guided mode any more; this effect is especially pro-
+nounced in the isolated waveguide W3. This indicates that the optimum port length might be close to the
+value of dport at which the linear decay emerges; however, this value varies with the wavelength. Third,
+the dependence of I on dport is visibly strongest at $\lambda$ = 1300.0 nm, which is the wavelength closest to
+the peak of $I(\lambda)$. This indicates that the maximum value of $I(\lambda)$ observed for a given circulator might
+be strongly influenced by the choice of dport. Unfortunately, this proves to be the case: the maximum
+isolation factors of circulator C1 obtained for dport = 1700, 2000 and 2250 nm are 2130, 3560 and 6140,
+respectively. The extreme values differ, then, by nearly a factor of three. On a more positive note, the
+bandwidth $B(I_\mathrm{min})$, a quantity much more important from the experimental point of view, turns out to
+be significantly less sensitive to the choice of port length, as long as $I_\mathrm{min}$ is not too large. For instance,
+the range of wavelengths in which C1 provides an isolation factor better than 100 has width 0.610, 0.615
+and 0.618 nm according to simulations performed with the three values of dport quoted previously. We
+conclude that while the maximum isolation factors calculated with the present technique do not have
+absolute significance, and can at most be used for the purposes of comparison between different struc-
+tures, the bandwidths are robust against changes of the domain truncation parameters. Lacking reliable
+guidelines on the selection of the optimum port length, we stick to the value chosen previously, i.e.,
+dport = 2250 nm.
+I
+I
+4.5. Rib-waveguide-based circulators 97
+2:0
+1:5
+1:0
+ D 1299:0 nm
+ D 1299:5 nm
+0:5
+ D 1300:0 nm
+ D 1300:5 nm
+0:0
+0 1000 2000 3000
+dport (nm)
+Figure 4.20 Dependence of the isolation I of circulator C1 on the value of dport for four different wavelengths 
+located in the neighbourhood of a maximum of I./. The other parameters are fixed as hmax = 500 nm, p = 5,
+dPML = 600 nm, sPML =  and dsep = 5000 nm.
+It is worth noting that some authors [137, 162] have proposed a different method of handling infinite
+waveguides in FEM calculations. In their approach, PMLs surround the whole computational domain,
+including the waveguide outlets, and the incident waveguide mode is introduced into the system by im-
+posing special boundary conditions on a cross-section of the input waveguide lying inside the domain.
+As an alternative, one could also divide the system under study in two parts: one comprising the input
+waveguide, and the other, the cavity with the output waveguides. In the latter, the finite-element expan-
+sion would continue to stand for the total electromagnetic field. In the former, however, the expansion
+would represent only the scattered field, i.e., the total field minus the incident waveguide mode. The
+latter could be introduced into the system by means of appropriate boundary conditions imposed on the
+junction of the two subdomains. The combined structure could then be completely surrounded in PMLs,
+as shown in fig. 4.21.
+We have not tested any of these solutions, mostly owing to time constraints. However, they could be
+implemented in future if the accuracy limits of the approach followed so far become a serious issue.
+4.5.3 Geometry optimisation
+Having fixed most of the geometrical parameters of the circulator in the way described at the end of
+subsection 4.5.1, we were essentially left with the problem of optimising the values of $d_n$ and $\rho_\mathrm{wg}$.
+For the sake of simplicity, we initially focused on structures with $d_n$ independent of $n$, i.e., with
+waveguides enclosed in rectangular “slits” of width $d$. The bandwidth proved a rather cumbersome
+objective function, since it is nonzero only for structures already rather close to optimum. Therefore,
+the reservations from subsection 4.5.2 notwithstanding, we chose the maximum isolation factor as the
+objective function, hoping that circulators with large values of this parameter would also be characterised
+by a large bandwidth.
+Figure 4.22(a) shows the geometry of the best structure that we have found, called C2 in the follow-
+ing. It has 3 full and 4 split rings. The slit width $d$ = 1770 nm and the waveguide ends are located at
+$\rho_\mathrm{wg}$ = 1240 nm from the cavity centre, so that the waveguides cross the outermost full ring. For ease
+of reference, the values of all the geometrical parameters of C2 are listed in table 4.5. This circulator
+offers maximum isolation of 3590, and the wavelength dependences of T2, T3 and I are shown in fig.
+4.22(b). Clearly, the curves are fairly symmetric with respect to the central wavelength $\lambda$ = 1300.0 nm,
+which indicates that the direct coupling between waveguides is insignificant. Figure 4.22(c) shows the
+map of the magnetic field at $\lambda$ = 1300.0 nm. At this wavelength, 88% of the input power is transmitted
+I=I.dport D 3000 nm/
+98 Chapter 4. Magneto-optical circulators
+PML
+Subdomain 2
+Subdomain 1
+Figure 4.21 Alternative technique of domain truncation. In subdomain 1, the electromagnetic field is repre-
+sented by the sum of the field of the incident waveguide mode (assumed known) and the scattered field expanded
+on a finite-element basis. In subdomain 2, the finite-element basis is used to expand the total field. Electromagnetic
+continuity conditions are imposed on the interface separating the two subdomains (dashed line).
+to waveguide 2; the rest is not reflected, but mainly lost to the surrounding free space. Far from the
+peak, the amount of these losses can exceed 50%. This behaviour contrasts with that of the PC circu-
+lator, where almost 100% of the input power remains in the waveguide system due to the quasi-perfect
+isolation provided by the surrounding periodic lattice. The 20-dB bandwidth $B(100)$ of circulator C2 is
+0.729 nm.
+The grey curves in fig. 4.22(b) show the transmittance curves of circulator C2 as predicted by the
+coupled-wave model with radiation losses taken into account, presented in subsection 4.2.2. The values
+of the parameters $\omega_0$, $\Delta\omega$, $\gamma$ and $\gamma_l$ were found by fitting the expressions for T2 and T3 obtained from
+eqs. (4.26) to the values calculated numerically. The Levenberg-Marquardt algorithm was used as the
+fitting procedure. The best fit was obtained for parameters corresponding to $\lambda_0 \equiv 2\pi c/\omega_0 = 1299.9$ nm,
+$\Delta\lambda \equiv 2\pi c\,\Delta\omega/\omega_0^2 = 2.3$ nm, $Q \equiv \omega_0/(2\gamma) = 370$ and $Q_l \equiv \omega_0/(2\gamma_l) = 5730$. Clearly, there is a good
+match between the theoretical and numerical curves; its quality would probably be further improved by
+taking into account the direct coupling between waveguides, which causes the slight asymmetry of the
+numerical plots. The quality factor related to losses, Ql, is significantly lower than that of an isolated
+cavity with 7 full rings, which is as large as 107,000. This is obviously due to the presence of slits. On
+4.5. Rib-waveguide-based circulators 99
+1:00 10000
+T2
+0:75 T 10003
+T2 (fit)
+0:50 T 1003 (fit)
+I
+0:25 10
+0:00 1
+1295:0 1297:5 1300:0 1302:5 1305:0
+ (nm)
+(a) (b)
+(c)
+Figure 4.22 (a) Geometry of circulator C2. (b) Wavelength dependence of the transmission (left axis) and
+isolation (right axis) of this circulator. (c) Magnitude of the magnetic field in the circulator at the wavelength
+$\lambda$ = 1300.0 nm, corresponding to the maximum isolation. The waveguide mode is incident from the left.
+the other hand, the position of the ends of the waveguides (just inside the third innermost ring) is in good
+accord with the predictions made at the end of subsection 4.5.1.
+We have found this device fairly tolerant to variations of the slit width $d$; figs. 4.23(a)–(b) show the
+plot of the maximum isolation and bandwidth of C2 when this parameter is varied. It can be seen that the
+bandwidth stays above 0.5 nm in a 300-nm-wide range of $d$. The constraints on $\rho_\mathrm{wg}$ are more stringent:
+as shown in fig. 4.23(c), the corresponding range of $\rho_\mathrm{wg}$ is only about 40 nm wide.
+The performance of this structure changes rather abruptly when the number of rings is modified. For
+instance, if the seventh ring is removed, the maximum isolation decreases to only 140 and the bandwidth
+to 0.386 nm. However, it is possible to improve these figures by readjusting the slit widths and the
+Transmission T2, T3
+Isolation I
+100 Chapter 4. Magneto-optical circulators
+0:75
+(a) (c)
+0:50
+0:25
+0:00
+10000
+(b) (d)
+1000
+100
+10
+1200 1400 1600 1800 2000 1200 1220 1240 1260 1280
+d (nm) rwg (nm)
+Figure 4.23 Tolerance of the maximum isolation $I_\mathrm{max}$ and the bandwidth $B(100)$ of circulator C2 to perturba-
+tions of the parameters (a)–(b) $d$ and (c)–(d) $\rho_\mathrm{wg}$.
+1:00 10000
+T2
+0:75 T 10003
+I
+0:50 100
+cone 0:25 10
+0:00 1
+1295:0 1297:5 1300:0 1302:5 1305:0
+ (nm)
+(a) (b)
+Figure 4.24 (a) Geometry of a circulator with conical slits surrounding the waveguides. The values of the vari-
+ous parameters have been chosen to match those of circulator C3. (b) Wavelength dependence of the transmission
+(left axis) and isolation (right axis) of this circulator.
+position of the waveguide ends: for $\rho_\mathrm{wg}$ = 1250 nm and $d$ = 1570 nm (10% less than in the 7-ring case)
+Imax reaches 2140 and the bandwidth 0.603 nm.
+It is interesting to note that both for 6 and 7 rings the optimum angular length of the removed sectors
+of the outermost ring is almost the same: 34°. This led us to test the performance of a second class
+of structures, in which the outer rings are truncated along radial lines instead of ones parallel to the
+waveguides, so that the latter are enclosed by conical rather than rectangular air slits, as illustrated in fig.
+4.24(a). We found the optimum cone aperture $\theta_\mathrm{cone}$ to be 35.1°, which is close to the value obtained
+in the simulations of the first class of structures (with $d_n$ independent of $n$). The optimum position
+of the waveguide end, $\rho_\mathrm{wg}$ = 1210 nm, is also only slightly different from the original one. More
+importantly, the maximum isolation and bandwidth decrease much less (from 3300 to 700 and from
+0.770 to 0.708 nm, respectively) when the seventh ring is removed. This relative insensitivity to the
+details of the geometrical structure of the exterior region of the device is the behaviour that one would
+intuitively expect from a well-designed circulator; therefore, structures with conical slits seem closer to
+the ideal than those with rectangular ones. Figure 4.24(b) shows the wavelength dependence of T2, T3
+and I of the optimum 7-ring circulator with conical slits, referred to as C3. Its parameters are listed in
+table 4.5.
+Max. isolation Bandwidth (nm)
+Transmission T2, T3
+Isolation I
+4.6. Simulations of three-dimensional axisymmetric cavities 101
+(a) (b)
+Figure 4.25 Microphotographs of a rib-waveguide-based circulator etched in a BIG layer grown on a GGG sub-
+strate (courtesy of L. Magdenko and B. Dagens, Institut d’Électronique Fondamentale, Orsay, France). (a) Tung-
+sten mask before etching. (b) Complete circulator after etching.
+4.5.4 Fabrication
+Our collaborators from Institut d’Électronique Fondamentale (Orsay, France) have developed a tech-
+nique of fabricating magnetophotonic structures in BIG thin films [163]. The films used in experiments,
+supplied by the GEMAC team from Versailles, France, were grown on GGG substrates by pulsed laser
+deposition. The circulators were fabricated by inductively coupled plasma ion etching of the BIG layer in a
+mixture of boron trichloride and argon, with a nanostructured tungsten layer used as a mask. An example
+circulator fabricated in this way is shown in fig. 4.25.
+To evaluate the optical properties of the manufactured structures, a series of measurements of the
+power transmitted to the two output waveguides was made. The transmittances to the two output branches
+were found not to be completely equal. However, reversal of the polarisation of the applied SEMF
+brought no discernible change of the transmission levels. Apparently, then, the observed difference
+between T2 and T3 was due to fabrication imperfections rather than to nonreciprocal effects.
+4.6 Simulations of three-dimensional axisymmetric cavities
+4.6.1 Evaluation of possible three-dimensional geometries
+Motivation We strongly suspected that the incorrect operation of the fabricated circulators was due to
+the fact that their design had been based solely on two-dimensional simulations. While we had attempted
+to take the three-dimensional (3D) nature of the true physical system into account by using the effective-
+index model to find the material properties of the high- and low-index regions of the simulated structures,
+this was evidently not enough. Indeed, the effective-index description is known to give erroneous results
+for high-contrast systems, such as those considered in this chapter [164]. In any case, its accuracy can
+only be evaluated by comparing its predictions with results of rigorous 3D calculations.
+Owing to the time requirements of full-blown 3D simulations, which would be necessary to anal-
+yse complete circulators consisting of a cavity coupled to waveguides, we decided to implement first a
+method allowing us to calculate the eigenmodes of axisymmetric 3D cavities. In this case it is possible to
+profit from the knowledge of the azimuthal dependence of the eigenmodes to restrict the computational
+mesh to a single meridional ($\rho z$) plane of the cavity. Our calculations were made with the finite-element
+method, described in detail in section 5.3.
+High-contrast cavities We began by considering the simplest type of structures, in which the rings
+are etched in a layer of BIG with thickness dBIG, sandwiched between a GGG substrate and air, as shown
+102 Chapter 4. Magneto-optical circulators
+in fig. 4.26(a). We set dBIG = 340 nm and took the refractive indices of BIG and GGG to be nBIG = 2.51
+and nGGG = 1.97. The effective index of the unetched areas was calculated to be 2.25, while that of
+the etched rings was set to the index of air, nair = 1. The radii of the rings were determined with the
+procedure described in section 4.3, with the target wavelength $\lambda$ = 1300 nm. For future reference, we
+shall denote the geometry just described with the symbol G1.
+Very soon it became apparent that cavities of type G1 behaved very badly in 3D. In fact, they do
+not seem to support any well-localised modes near the design wavelength $\lambda$ = 1300 nm. This turns
+out to be easily explicable: sufficiently far from the cavity centre, a circular Bragg grating can be well
+approximated by a linear grating with period $d = \frac{1}{4}\lambda\,(n_0^{-1} + n_1^{-1})$, where $n_0$ and $n_1$ denote the refractive
+indices of etched and unetched areas. If $d$ is larger than $\lambda/(2n_\mathrm{GGG})$, all Bloch eigenmodes of the grating
+will leak into the GGG substrate [165, p. 203]. Unfortunately, this is the case with G1-type structures:
+$d = 469$ nm $> \lambda/(2n_\mathrm{GGG}) = 330$ nm.
+Low-contrast cavities In view of the failure of the effective-index description of structures of type
+G1, we have studied a handful of geometries liable to be approximated better by the effective-index
+model. They were proposed by L. Magdenko and B. Dagens (Institut d’Électronique Fondamentale,
+Orsay, France).
+The first structure that was considered is shown in fig. 4.26(b). In this case, the BIG layer is left
+unetched, and the necessary effective-index contrast between successive rings is introduced by etching
+an additional high-index layer deposited on top of BIG. This geometry has distinct theoretical and ex-
+perimental advantages. First, owing to the continuity of the BIG layer, it supports everywhere a locally
+guided mode. This lets us avoid the problem that the effective index, defined with the help of the prop-
+agation constant of the fundamental guided mode of a given region, is in fact undetermined for regions
+where no guided modes exist. Conventionally, these areas are attributed the index of the sub- or super-
+strate but, as noted by Hammer and Ivanova [164], this choice is not based on any rigorous arguments.
+In the case of the geometry from fig. 4.26(b), the effective index is well-defined everywhere and one can
+hope that this will improve the accuracy of the effective-index description.
+From the experimental point of view, the structure in question has the advantage that it does away
+with the necessity of etching the BIG layer. This process, while already successfully demonstrated [163],
+remains less well developed than the nanostructuration of materials such as silicon or indium phosphide.
+On the other hand, the presence of a MO material both in the high- and low-index rings will necessarily
+diminish the SEMF-induced mode coupling strength, owing to the cancellation effect described in ref.
+148. A possible solution consists in depriving the uncovered areas of BIG of their MO properties, which
+can be experimentally achieved by ion implantation.
+The structure shown in fig. 4.26(b) is characterised by the refractive index nspl of the supplemen-
+tary layer, its thickness dspl, and the thickness of the BIG layer, dBIG. We have taken nspl = 3.50,
+corresponding to the index of amorphous silicon around the wavelength $\lambda$ = 1300 nm. The choice of
+dspl and dBIG was motivated by two competing goals. On one hand, the supplementary layer had to
+be sufficiently thick to provide an appreciable contrast of the effective index of the etched and unetched
+areas. On the other hand, dspl could not be chosen too large for fear of generating a second s-polarised
+guided mode in the unetched region and of displacing too large a fraction of the guided mode’s energy
+away from the BIG layer, which would diminish the MO properties of the system. As a compromise,
+the two thicknesses were taken as dspl = 80 nm and dBIG = 280 nm. The effective indices of the etched
+and unetched regions were then calculated as 2.19 and 2.50, and the fraction of energy of the guided
+mode of the unetched region contained in BIG was found to be 0.48. For convenience, the just described
+geometry will henceforth be referred to as G2.
+In another type of structures, shown in fig. 4.26(c), the etched BIG layer of thickness dBIG is covered
+4.6. Simulations of three-dimensional axisymmetric cavities 103
+z
+nair
+nBIG dBIG
+
+nGGG
+(a)
+z
+nair
+nspl dspl
+nBIG dBIG
+
+nGGG
+(b)
+z
+nsup
+nBIG dBIG
+
+nGGG
+(c)
+Figure 4.26 Schematics of 3D structures of types (a) G1, (b) G2, and (c) G3 and G4 (which differ only in
+the value of nsup).
+with a solid superstrate with refractive index nsup close to that of GGG. In this way, the index contrast
+between the etched and unetched areas is lessened and one can expect the effective-index approximation
+to be more accurate. We considered mainly systems with nsup = 1.97 (exactly equal to the refractive in-
+dex of GGG) or nsup = 1.90 (refractive index of silicon nitride) and chose dBIG to be 330 nm. Structures
+with these parameters will be called G3 and G4 in the following. The effective indices of their unetched
+regions were calculated to be 2.275 and 2.282, respectively, whereas those of the etched areas were set
+to min(nGGG, nsup), i.e., 1.97 and 1.90.
+Table 4.6 summarises the results obtained for a handful of structures. Three cavities, designed for
+azimuthal orders l = 1, 4 and 10, were tested for each of the geometry types G2, G3 and G4. In addition,
+for cavities of type G2 two distributions of the MO coefficient g were investigated. In one series of
+simulations, the whole BIG layer was assumed to be uniformly magnetised, so that g was taken to be
+0.1 throughout that layer. In the other, the areas of BIG not covered with silicon were assumed to be
+deprived of their MO properties and, consequently, attributed g = 0. For ease of reference, these two
+variants of geometry G2 will be called G2(a) and G2(b).
+The magnitude of the relative frequency splitting $\Delta\omega/\omega_0$ obtained in 3D simulations does not differ
+drastically from that predicted by 2D ones. The observed deviation is easily explicable by the fact that
+not the whole vertical profile of the unetched areas has MO properties. Anyway, the coupling strength
+of the eigenmodes of most of the cavities listed in table 4.6 exceeds that of the 2D high-contrast cavity
+104 Chapter 4. Magneto-optical circulators
+Type l C   !=!0 (3D) !=!0 (2D) QC Q  Qavg
+G2(a) 1 1:27779C 0:00618i 1:27833C 0:00617i  0:00042 — 103 104 103
+4 1:27546C 0:00607i 1:27633C 0:00611i  0:00068 — 105 104 105
+10 1:27564C 0:00582i 1:27666C 0:00588i  0:00080 — 110 109 109
+G2(b) 1 1:27892C 0:00616i 1:27727C 0:00618i 0:00129 0:00166 104 103 104
+4 1:27722C 0:00603i 1:27466C 0:00615i 0:00200 0:00286 106 104 105
+10 1:27764C 0:00570i 1:27475C 0:00600i 0:00227 0:00342 112 106 109
+G3 1 1:28103C 0:00461i 1:27926C 0:00498i 0:00138 0:00224 139 128 134
+4 1:28102C 0:00355i 1:27829C 0:00391i 0:00213 0:00356 180 164 172
+10 1:28032C 0:00179i 1:27724C 0:00206i 0:00241 0:00408 357 310 334
+G4 1 1:28550C 0:00722i 1:28366C 0:00773i 0:00143 0:00207 89 83 86
+4 1:28675C 0:00606i 1:28403C 0:00662i 0:00212 0:00348 106 97 102
+10 1:28710C 0:00401i 1:28415C 0:00454i 0:00229 0:00411 160 141 151
+Table 4.6 Results of 3D calculations of the eigenmodes of cavities with geometries G2(a), G2(b), G3 and G4.
+The symbols   and C denote the wavelengths of the modes with azimuthal order l and  l . In addition to the
+relative frequency splitting !=!0 of the modes of the 3D cavities, calculated as .ReC   Re /=Œ.ReC C
+Re /=2, the values obtained for the corresponding infinite 2D cavities are also given; they are calculated as in
+section 4.3. The symbolsQ˙ = .Re˙/=.2 Im˙/ stand for the quality factors of the modes with order l and  l .
+Finally,Qavg is defined as .QC CQ /=2.
+presented at the end of section 4.3. This can be attributed to the decrease of the effective-index contrast
+between etched and unetched areas, and is in accord with the observation from ref. 148 that the reduced
+coupling strength of a 2D high-contrast cavity can be augmented three times by making its core of
+demagnetised BIG instead of air.
+As opposed to the values of $\Delta\omega/\omega_0$, well preserved in the 2D-to-3D transition, the quality factors of
+the 3D cavities are on average ten times smaller than the quality factors obtained with 2D calculations
+(related only to the in-plane confinement). The geometry that fares best, G3, provides barely Q = 334.
+In addition, even the small deviation from symmetry induced by changing the superstrate’s refractive
+index from 1.97 to 1.90 decreases the quality factor by about 50%.
+Figures 4.27, 4.28 and 4.29 show the maps of the z components of the magnetic field and the cross
+product $\vec E_\mathrm{e} \times \vec E_\mathrm{o}$ of the electric fields of the even and odd eigenmodes of the G2-, G3- and G4-type
+cavities designed for the azimuthal order l = 10, in the absence of SEMF. Comparison of figs. 4.28(a) and
+4.29(a) gives testimony to the substantial increase of out-of-plane radiation losses in the cavity of type
+G4 with respect to that of type G3: the field in the asymmetric cavity features a prominent beam directed
+into the substrate, which is absent from that of the symmetric cavity’s eigenmode. The field in the G2-
+type cavity from fig. 4.27 is well localised in the vertical direction, and the low quality factor of this
+mode seems to stem from the excitation of the fundamental p-polarised mode of the highly asymmetric
+GGG-BIG-air multilayer, as evidenced by the relatively large amplitude of the Ez field component on
+the plot from fig. 4.27(b).
+Both !=!0 and Q typically increase with l (the exception is the geometry G2, for which little
+change ofQ is observed). This effect is further illustrated in fig. 4.30(a), which shows the l-dependence
+of !=!0 and Q of circulators of type G3. Figure 4.30(b), in turn, presents the dependence of these
+parameters on the number of high-index rings, N , with l fixed to 10. It can be seen that !=!0 and Q
+reach their asymptotic values around N = 25.
+To sum up, the results listed in table 4.6 attest that the SEMF-induced coupling strength of the
+eigenmodes of structures G2, G3 and G4 is sufficient to cause a substantial frequency splitting; even in
+4.6. Simulations of three-dimensional axisymmetric cavities 105
+1:00
+(a) jHz j
+1000 0:75
+0:50
+0
+0:25
+ 1000
+0:00
+1:00
+(b) jEz j=Z0
+1000 0:75
+0:50
+0
+0:25
+ 1000
+0:00
+1:0
+(c) eEz  .EEe EEo/
+1000 0:5
+0:0
+0
+ 0:5
+ 1000
+ 1:0
+0 2000 4000 6000
+ (nm)
+Figure 4.27 (a) Magnitude of the z component of the magnetic field of the eigenmodes of the G2-type cavity
+designed for l = 10, in the absence of SEMF. (b) Magnitude of the z component of the electric field divided
+by Z0. The colour scale is the same for parts (a) and (b). (c) The z component of the cross product $\vec E_\mathrm{e} \times \vec E_\mathrm{o}$ of
+the electric fields of the even and odd modes of the same cavity, which occurs as the integrand in the expression
+for the SEMF-induced mode coupling strength [34].
+the unfavourable case of geometry G2 with uniformly MO BIG the frequency splitting of high-l modes
+is fairly large. However, the quality factor of these cavities is unsatisfactory. The cavity design must
+clearly be further improved to make the resulting devices usable in practice.
+4.6.2 Towards cavities with higher quality factor
+There are several routes that might potentially lead to an increase of Q. First, one could augment further
+the azimuthal order of the cavity mode; fig. 4.30(a) lets us expect that this will lead to a rise of Q.
+Indeed, we have verified that the G3-type cavity designed for l = 40 has Q = 1760. This growth of Q
+is achieved, however, at the expense of a significant enlargement of the cavity volume, which may not
+always be desirable.
+z (nm) z (nm) z (nm)
+106 Chapter 4. Magneto-optical circulators
+1:00
+(a) jHz j
+1000 0:75
+0:50
+0
+0:25
+ 1000
+0:00
+1:0
+(b) eE z  .EEe EEo/
+1000 0:5
+0:0
+0
+ 0:5
+ 1000
+ 1:0
+0 2000 4000 6000 8000
+ (nm)
+Figure 4.28 (a) Magnitude of the z component of the magnetic field of the eigenmodes of the G3-type cavity
+designed for l = 10, in the absence of SEMF. (b) The z component of the cross product $\vec E_\mathrm{e} \times \vec E_\mathrm{o}$ of the electric
+fields of the even and odd modes of the same cavity. The plot of $|E_z|/Z_0$ has been omitted because this field
+component is very small.
+1:00
+(a) jHz j
+1000 0:75
+0:50
+0
+0:25
+ 1000
+0:00
+1:0
+(b) eE z  .EE EEe o/
+1000 0:5
+0:0
+0
+ 0:5
+ 1000
+ 1:0
+0 2000 4000 6000 8000
+ (nm)
+Figure 4.29 Same as fig. 4.28, but for the G4-type cavity.
+z (nm) z (nm) z (nm) z (nm)
+4.6. Simulations of three-dimensional axisymmetric cavities 107
+600 0:0025
+(a)
+400 0:0020
+200 0:0015
+Q
+!=!0
+0 0:0010
+0 5 10 15
+Bessel order l
+400 0:002500
+(b)
+0:002475
+300
+Q
+0:002450
+!=!0
+200
+0:002425
+100 0:002400
+10 15 20 25 30
+Number of rings N
+Figure 4.30 Dependence of the relative frequency splitting $\Delta\omega/\omega_0$ and quality factor Q of G3-type cavities
+(a) on the azimuthal order l with fixed number of high-index rings N = 20 and (b) on the number of rings N with
+fixed l = 10.
+Second, one might look for ways of improving the accuracy of the effective-index approximation. As
+we have mentioned before, the effective index of regions supporting no guided modes is not rigorously
+defined. We have tested the influence of changing the value taken for the effective index of the etched
+areas of G4-type cavities from 1.90 to 1.97 and found that it brought about a 20-percent growth of Q.
+However, the wavelength of the cavity modes shifted by 2.5 nm further away from the design value of
+1300 nm, which indicates that the increase of Q was not due to an improvement in the accuracy of
+the effective-index description. We have also tried the variational effective-index method proposed by
+Hammer and Ivanova [164], but found it to degrade both the quality factor and the match between the
+predicted and true value of the frequency of cavity modes.
+Third, one should certainly profit from the extensive research on the optimisation of PC cavities done
+in the course of the last decade. As discussed in the review by Lalanne et al. [166], the approaches to this
+subject proposed so far can be divided into two large classes.
+Some authors [167, 168] treat a PC cavity as a system consisting of many “elementary” cells of size
+comparable to the lattice constant of the surrounding PC. In each such cell, they expand the field in the
+basis of the cell’s Bloch eigenstates. Often, each cell supports only one guided mode (one that does not
+radiate energy in the vertical direction). The radiation loss from the cavity is then regarded as resulting
+from the scattering of the guided modes into radiative ones at the intercell boundaries. To reduce this
+loss, the geometry of each cell must then be adjusted so as to improve the match between the profiles of
+the guided modes of successive cells.
+Unfortunately, this approach cannot be directly applied to axisymmetric structures, since it relies
+on the idea of expanding the field in each cell in its Bloch basis. Maxwell’s equations in cylindrical
+Quality factor Q Quality factor Q
+Relative shift !=!0
+Relative shift !=!0
+108 Chapter 4. Magneto-optical circulators
+coordinates are not invariant with respect to translations in the radial direction, however, even if the
+permittivity and permeability are; therefore Bloch’s theorem does not carry over to systems periodic
+in the radial direction. On the other hand, sufficiently far from the z axis, an approximate version of
+Bloch’s theorem can certainly be formulated. The results from a recent paper [169] indicate that this
+approximate formalism is fairly accurate even at small distances from the axis. Thus, it might be possible
+to apply the ideas from refs. 167 and 168 to axisymmetric systems. This will be the subject of future
+work.
+Other researchers [170–173] base their cavity optimisation procedures on the link between the cav-
+ity’s radiation pattern and the Fourier transform of its electromagnetic field. The quality factor Q of a
+cavity mode can be written as $Q = (\operatorname{Re}\omega)\,U/P$, where $\omega$ is the mode’s frequency, U stands for the time-
+averaged energy stored in its electromagnetic fields, and P is the rate of energy loss [166, 172]. Treating
+the cavity as an aperture antenna, one can relate the out-of-plane energy loss rate $P_\perp$ to the 2D Fourier
+transforms of the  and  field components on two planes, one lying in the substrate and the other in
+the superstrate of the cavity [174, 175]. Englund et al. [172] have gone one step further, rewriting $P_\perp$ in
+terms of the z components of $\vec E$ and $\vec H$:
+\[
+P_\perp = \sum_{\nu=\mathrm{sub},\mathrm{sup}} \frac{Z_\nu k_\nu}{8\pi^2}
+\iint_{k_x^2 + k_y^2 \le k_\nu^2} \mathrm{d}k_x\,\mathrm{d}k_y\,
+\frac{\sqrt{k_\nu^2 - k_x^2 - k_y^2}}{k_x^2 + k_y^2}
+\left[ \frac{1}{Z_\nu^2}\,|\tilde E_z(k_x, k_y)|^2 + |\tilde H_z(k_x, k_y)|^2 \right],
+\tag{4.48}
+\]
+where $Z_\nu \equiv \sqrt{(\mu_0\mu_\nu)/(\epsilon_0\epsilon_\nu)}$ is the (absolute) impedance of medium $\nu$ (substrate or superstrate),
+$k_\nu \equiv k_0\sqrt{\epsilon_\nu\mu_\nu}$ and
+\[
+\tilde F_z(k_x, k_y) \equiv \frac{1}{2\pi} \int_{-\infty}^{\infty}\!\int_{-\infty}^{\infty} \mathrm{d}x\,\mathrm{d}y\; F_z(x, y, z_\nu)\, e^{-i(k_x x + k_y y)}
+\tag{4.49}
+\]
+denotes the 2D Fourier transform of the field $F_z$ on the plane $z = z_\nu$. The plane $z = z_\mathrm{sub}$ can be taken
+to lie just below the interface of the substrate and the guiding layer, and the plane $z = z_\mathrm{sup}$, just above
+the boundary between the guiding layer and the superstrate. It is important to note that the integrals in
+eq. (4.48) run only over the light cones. One concludes that to obtain a high-Q cavity it is necessary to
+sweep all the peaks of the Fourier transforms $\tilde E_z$ and $\tilde H_z$ away from the circle $k_x^2 + k_y^2 \le k_\nu^2$ [171].
+In the axisymmetric case it is possible to simplify eq. (4.48). It can be shown [176, section 9.3] that
+the 2D Fourier transform of a function $f(\rho, \phi) \equiv f_l(\rho)\, e^{il\phi}$ is
+\[
+\tilde f(k_\rho, \psi) \equiv \tilde f_l(k_\rho)\, e^{il\psi},
+\tag{4.50a}
+\]
+where
+\[
+\tilde f_l(k_\rho) \equiv \int_0^{\infty} \mathrm{d}\rho\; \rho\, f_l(\rho)\, J_l(k_\rho \rho)
+\tag{4.50b}
+\]
+is the $l$th-order Hankel transform of $f_l(\rho)$. The symbols $(\rho, \phi)$ and $(k_\rho, \psi)$ denote the polar coordinates
+in the direct and reciprocal space. Using eqs. (4.50) one can bring eq. (4.48) into the form
+\[
+P_\perp = \sum_{\nu=\mathrm{sub},\mathrm{sup}} \frac{Z_\nu k_\nu}{4\pi}
+\int_0^{k_\nu} \mathrm{d}k_\rho\, \frac{\sqrt{k_\nu^2 - k_\rho^2}}{k_\rho}
+\left[ \frac{1}{Z_\nu^2}\,|\tilde E_z(k_\rho)|^2 + |\tilde H_z(k_\rho)|^2 \right].
+\tag{4.51}
+\]
+Figure 4.31(a) shows the squared norms of the Hankel transforms $Z_{\mathrm{sub}}^{-1}\tilde E_{z,\mathrm{sub}}(k_\rho)$ and $\tilde H_{z,\mathrm{sub}}(k_\rho)$
+of the clockwise-rotating eigenmode of a G2-type cavity designed for l = 10 and comprising as much
+as 40 high-index rings (to eliminate border effects related to insufficient lateral size). The plane zsub is
+4.6. Simulations of three-dimensional axisymmetric cavities 109
+taken to lie 1 nm below the top boundary of the substrate. The curves obtained with 3D FEM simulations
+are juxtaposed with that stemming from Hankel-transforming the $H_z$ field of the eigenmode of the corre-
+sponding 2D cavity (this mode is purely p-polarised, so the $E_z$ component vanishes). Clearly, the peaks
+of all the curves are fairly well localised outside the light cone, whose boundary, $k_\rho = 1.97k_0$, is marked
+with a vertical line. Remarkably, the areas under the curves $Z_{\mathrm{sub}}^{-2}|\tilde E_{z,\mathrm{sub}}(k_\rho)|^2$ and $|\tilde H_{z,\mathrm{sub}}(k_\rho)|^2$ ob-
+tained with 3D calculations are roughly equal, while the $E_z$ component should vanish according to 2D
+simulations. This confirms our earlier conclusions that the low quality factor of the eigenmodes of G2-
+type cavities stems from the excitation of a p-polarised guided mode of the multilayer rather than from
+radiation losses.
+The corresponding plots obtained for G3- and G4-type cavities are shown in figs. 4.31(b) and (c).
+While the transforms calculated in the 2D case are virtually indistinguishable, there is a marked differ-
+ence in the 3D case: the transform ofHz of the mode of the G4-type cavity extends considerably further
+into the light cone than that corresponding to the G3-type structure. This is reflected in the lower quality
+factor of the mode of the former cavity, as evidenced in table 4.6. In contrast to what we saw in the
+previous paragraph, for G3- and G4-type cavities the part played by the Ez component is completely
+negligible.
+In all the three systems considered here, the refractive index of the substrate is at least equal to that
+of the superstrate. Hence, radiation loss into the substrate dominates over that into the superstrate and,
+for brevity, we omit the discussion of the Hankel transforms of the fields on z = zsup.
+Advocates of the Fourier-transform-based optimisation of PC cavities have demonstrated that the
+quality factor–mode volume ratio of an eigenmode of a given structure can be increased by adjusting its
+geometry so as to lessen the decay rate of the mode field near the centre of the cavity. This narrows the
+peak of the Fourier transform, so that, provided that the centre of the peak lies outside the light cone, the
+integral of the squared norm of the Fourier transform over the light cone diminishes. This design rule
+has been summarised as “light should be confined gently in order to be confined strongly” [173].
+Unfortunately, it is not easy to establish a link between the geometry of the cavity and the shape of its
+eigenmode field. Englund et al. [172] have derived an approximate formula for the permittivity profile of
+a cavity supporting a mode with a prescribed spatial dependence. However, they assumed that the field
+near the centre of the cavity could be approximated by that of a PC waveguide mode close to cut-off,
+i.e., with a very flat dispersion curve. For axisymmetric structures, this assumption is not met: near the
+z axis, the cavity mode could possibly be approximated with a guided mode of the multilayer, whose
+dispersion relation is in general not flat. Moreover, the formula derived by Englund et al. is based on the
+application of the perturbation theory rather far from its domain of validity—to describe discontinuous
+high-amplitude perturbations of permittivity. Therefore, its predictions might conceivably be not always
+accurate.
+The last method that can be tried is the adjustment of ring dimensions based on a purely numerical
+optimisation algorithm. We have made some limited attempts at this sort of optimisation, parametrising
+the cavity geometry by the seven variables rc, ah, bh, ch, al, bl and cl, defined as follows. The symbol
+rc denotes the radius of the central low-index hole. The widths of the high-index rings are taken to be
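+$$w_{\mathrm{h},n} = a_\mathrm{h} + \frac{b_\mathrm{h}}{n} + \frac{c_\mathrm{h}}{n^2} \quad\text{with } n = 1, 2, \ldots, \tag{4.52a}$$
+whereas those of the low-index rings are set to
+$$w_{\mathrm{l},n} = a_\mathrm{l} + \frac{b_\mathrm{l}}{n+1} + \frac{c_\mathrm{l}}{(n+1)^2} \quad\text{with } n = 1, 2, \ldots. \tag{4.52b}$$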
+These particular functional forms were chosen because of their ability of approximating well the ring
+width distributions generated by the procedure from section 4.3. As the optimisation routine, we used
+110 Chapter 4. Magneto-optical circulators
+10:0
+(a)
+7:5
+5:0 jHQ 2z j , 2D calc.
+jHQ j2z , 3D calc.
+2:5
+Z 2jEQ j20 z , 3D calc.
+0:0
+10:0
+(b)
+7:5
+5:0 jHQ j2z , 2D calc.
+jHQ 2z j , 3D calc.
+2:5
+Z 2jEQ j20 z , 3D calc.
+0:0
+10:0
+(c)
+7:5
+5:0 jHQ j2z , 2D calc.
+jHQz j2, 3D calc.
+2:5
+Z 2 Q 20 jEz j , 3D calc.
+0:0
+0 1 2 3
+k=k0
+Figure 4.31 Squared norms of the Hankel transforms of the eigenmode fields of the cavities of types (a) G2,
+(b) G3 and (c) G4 designed to support modes with $l = 10$ at wavelength $\lambda = 1300$ nm. In each plot, the Hankel
+transforms of $H_z$ and $E_z$ of the eigenmodes of the respective 3D cavities, calculated at the plane lying 1 nm below
+the substrate-BIG interface, are juxtaposed with the Hankel transform of the $H_z$ field of the eigenmode of the
+corresponding 2D cavity. The vertical line at $k_\rho = 1.97k_0$ marks the boundary of the light cone of the substrate.
+the trust-region-based gradient-free NEWUOA algorithm by Powell [177]. The objective function was
+initially taken as  
+! ˛ ˇ
+  Qavg (4.53)
+!0
+with the exponents $\alpha$ and $\beta$ chosen heuristically as $\alpha = 2$ and $\beta = 1$ to favour cavities with a large
+frequency splitting. Later it was found necessary to prevent a drift of the wavelength of the cavity
+eigenmodes far away from the design value of  = 1300 nm; this was done by multiplying  by an
+additional penalty factor
+ 1 1p
+1C e .  (4.54)min/ 1C e .max /
+with  = 0:2 nm 1, min = 1250 nm and max = 1350 nm. At the start of the optimisation algorithm,
+the seven parameters were set so as to mimic the ring width distribution obtained with the procedure
+described in section 4.3.
+jHQ j2 Z 2jEQ j2 jHQ j2 Z 2jEQ j2 jHQ j2 Z 2jEQ j2z , 0 z z , 0 z z , 0 z
+4.7. Conclusions and perspectives 111
+0:5 (a)
+0
+0:5 (b)
+0
+0 2 4 6 8
+ (nm)
+Figure 4.32 Geometry of (a) the original and (b) the numerically optimised G3-type cavity designed for
+the azimuthal order l = 10. The shaded areas are the cross-sections of BIG rings, which are immersed in a material
+with refractive index 1.97.
+We have not yet tested extensively the above optimisation algorithm, applying it so far only to a few
+special cases. One of them was the 20-ring G3-type cavity designed to support a mode with l = 10
+at the wavelength $\lambda = 1300$ nm, whose geometry is shown in fig. 4.32(a). According to table 4.6 the
+average quality factor of the counter-propagating modes of this cavity is 334 and the relative frequency
+splitting, 0.00241. Using the just described procedure to optimise the radii of the rings, we arrived at
+the geometry shown in fig. 4.32(b). The average Q factor of the resonant mode of this structure is as
+large as 2630. One can suspect this Q factor to be limited by in-plane rather than out-of-plane losses,
+since it is already higher than the Q factor of the corresponding 20-ring 2D cavity, 2156. Remarkably,
+the observed improvement of the mode confinement does not occur at a cost of deterioration of the MO
+properties of the cavity, whose relative frequency splitting, 0.00260, is even slightly larger than that of
+the original structure. Figure 4.33 shows the map of the $z$ components of the magnetic field and of the
+cross product $\vec E_\mathrm{e} \times \vec E_\mathrm{o}$ of the eigenmodes of this cavity, as well as the squared norms of the Hankel
+transforms $Z_{\mathrm{sub}}^{-1}\tilde E_{z,\mathrm{sub}}(k_\rho)$ and $\tilde H_{z,\mathrm{sub}}(k_\rho)$. Comparing these curves with those from fig. 4.31(b), it can
+be seen that the peak of $|\tilde H_{z,\mathrm{sub}}(k_\rho)|^2$ of the optimised structure is indeed more tightly localised outside
+the light cone of GGG.
+4.7 Conclusions and perspectives
+The research presented in this chapter was founded on the algorithm for the design of z-invariant axi-
+symmetric MO cavities that in the presence of a uniform SEMF exhibit maximum frequency splitting
+(section 4.3). In sections 4.4 and 4.5 we put forth a number of designs of three-port circulators incorpo-
+rating such cavities and operating according to the model presented in section 4.2. Lastly, in section 4.6,
+we studied the properties of the proposed cavities in a 3D setting, using full 3D simulations.
+In the course of this work, we increasingly tried to take into account the 3D nature of real integrated
+systems, in which the components are etched in BIG thin layers grown on GGG substrates. Initially,
+we performed purely 2D calculations, using bulk indices of the constituent materials. To some extent,
+this approach was justified: the algorithm from section 4.3 was based on 2D considerations, and it was
+necessary to compare the performance of the cavities designed with its help against those proposed before
+[34, 37, 150], which were also evaluated in a purely 2D setting.
+At the next stage, we attempted to take into account the multilayer structure of the experimental sys-
+tem with the effective-index approximation, which is fairly widely used to bring the results of 2D simu-
+lations of, in particular, PC-slab-based devices closer to reality. The design of the rib-waveguide-based
+circulators, reported on in section 4.5, was done in this way. However, measurements of the transmittance
+z (nm) z (nm)
+112 Chapter 4. Magneto-optical circulators
+1:00
+(a) jHz j
+1000 0:75
+0:50
+0
+0:25
+ 1000
+0:00
+1:0
+(b) eE z  .EEe EEo/
+1000 0:5
+0:0
+0
+ 0:5
+ 1000
+ 1:0
+0 2000 4000 6000 8000
+ (nm)
+7:5
+(c)
+5:0
+2:5 jHQ j2z , 3D calc.
+Z 2jEQ j20 z , 3D calc.
+0:0
+0 1 2 3
+k=k0
+Figure 4.33 (a) Magnitude of the $z$ component of the magnetic field of the eigenmodes of the optimised G3-
+type cavity designed for $l = 10$, in the absence of SEMF. (b) The $z$ component of the cross product $\vec E_\mathrm{e} \times \vec E_\mathrm{o}$ of
+the electric fields of the even and odd modes of the same cavity. (c) Squared norms of the Hankel transforms of
+the eigenmode fields $H_z$ and $E_z$ at the plane located 1 nm below the surface of the substrate.
+through fabricated components of this type revealed that the behaviour of the 3D cavity differed strongly
+from the predictions of the 2D model. It became apparent that full 3D simulations were inevitable.
+The results of these calculations, summarised in section 4.6, proved that resonant cavities designed with the
+help of the effective-index approximation do have good MO properties: the SEMF-induced splitting of
+the frequencies of their eigenmodes is indeed spectacular. However, the cavities suffer from substantial
+radiation losses in the vertical direction. The outcome of the various attempts at increasing the quality
+factor of these cavities, presented in subsection 4.6.2, points to the conclusion that 3D simulations are,
+unfortunately, all but unavoidable. They are required not only in the somewhat “brute-force” numerical
+optimisation of ring widths described at the end of subsection 4.6.2, but also in the approach based on
+Bloch’s theorem, which we have not tested, but which definitely looks promising.
+Regardless of the way in which a cavity is designed, it must still be integrated with waveguides. The
+results from section 4.5, while based on the effective-index approximation and therefore inaccurate, do
+z (nm) z (nm)
+jHQ j2 Z 2jEQ j2z , 0 z
+4.7. Conclusions and perspectives 113
+provide some insight into the problem of cavity–rib-waveguide coupling. In particular, they confirm that
+the optimum location of the waveguide ends can be approximately determined by analysing the quality
+factors of cavities with a varying number of rings. Therefore, if the distance from the cavity centre to
+the ends of 3D waveguides is figured out with this method, some nonreciprocal isolation should be ob-
+servable in experiment. Clearly, though, some numerical fine-tuning of this distance will be necessary
+to optimise the maximum isolation and the operation bandwidth of the device. Three-dimensional sim-
+ulations of a complete circulator would be prohibitively slow. However, as a workaround one might try
+the method of Andreani and Gerace [178], who successfully calculated the diffraction losses of eigen-
+modes of PC slabs by expanding the fields in terms of a few lowest guided modes of a specific multilayer
+(dependent on the structure of the slab) and including the radiation losses in a perturbative way.
+
+Chapter 5
+Numerical methods
+5.1 Multiple-scattering method for systems containing gyrotropic media
+In section 4.4 we presented results of numerical simulations of the scattering of electromagnetic waves
+by 2D PCs composed of circular cylinders etched in a MO, and thus anisotropic, matrix. The multiple-
+scattering method used to make these calculations was originally derived for isotropic materials [38].
+Here we show that it can be extended with very little effort to the case of gyrotropic media.
+The most important assumption of the method, which is described in detail in refs. 38, 39 and 40,
+is that the field Fz (standing for Ez for s-polarised waves and Hz for p-polarised ones) in the medium
+surrounding the scatterers is governed by the Helmholtz equation
+$$\nabla^2 F_z + k_0^2 n^2 F_z = 0, \tag{5.1}$$
+where $k_0 \equiv \omega/c$, $\omega$ denotes the frequency, and $n$ is the refractive index of the medium in question.
+It can be shown that in each circular annulus surrounding a particular scatterer $S_i$ and intersecting no
+other scatterers the field $F_z$ can be decomposed into three parts: $F_{zi}^{\mathrm{src}}$, the incident field coming directly
+from the source, $F_{zi}^{\mathrm{inc}}$, the field scattered towards $S_i$ by other scatterers, and $F_{zi}^{\mathrm{scatt}}$, the field scattered
+by $S_i$ itself. Each of these fields can be written in the form of a Fourier-Bessel series:
+$$F_{zi}^{\mathrm{src}}(\rho_i,\phi_i) = \sum_{m\in\mathbb{Z}} a_{im}^{\mathrm{src}}\, J_m(k_0 n\rho_i)\, e^{im\phi_i}, \tag{5.2a}$$
+$$F_{zi}^{\mathrm{inc}}(\rho_i,\phi_i) = \sum_{m\in\mathbb{Z}} a_{im}^{\mathrm{inc}}\, J_m(k_0 n\rho_i)\, e^{im\phi_i}, \tag{5.2b}$$
+$$F_{zi}^{\mathrm{scatt}}(\rho_i,\phi_i) = \sum_{m\in\mathbb{Z}} b_{im}\, H_m^{(1)}(k_0 n\rho_i)\, e^{im\phi_i}, \tag{5.2c}$$
+where $a_{im}^{\mathrm{src}}$, $a_{im}^{\mathrm{inc}}$ and $b_{im}$ are constant coefficients, $J_m(x)$ and $H_m^{(1)}(x)$ denote the Bessel and Hankel
+functions of the first kind, and $(\rho_i,\phi_i)$ are polar coordinates defined with respect to the centre of the
+annulus. With the so-called Graf’s theorem, a link can be established between the series (5.2) expressed
+in coordinate systems associated with different scatterers. This makes it possible to write $F_{zi}^{\mathrm{inc}}$ in terms
+of $F_{zj}^{\mathrm{scatt}}$ for all $j \ne i$. Moreover, a linear relation exists between the Fourier-Bessel coefficients of the
+sum $F_{zi}^{\mathrm{src}} + F_{zi}^{\mathrm{inc}}$ and those of $F_{zi}^{\mathrm{scatt}}$. With $\vec a_i$ and $\vec b_i$ denoting the column vectors of the coefficients
+$(a_{im}^{\mathrm{src}} + a_{im}^{\mathrm{inc}})$ and $b_{im}$, respectively, this relation can be expressed as
+$$\vec b_i = \hat S_i\,\vec a_i, \tag{5.3}$$
+where $\hat S_i$ is conventionally called the scattering matrix of $S_i$. Its entries can be obtained by imposing
+the electromagnetic boundary conditions on the inner surface of the annulus mentioned above. Their
+115
+116 Chapter 5. Numerical methods
+derivation is particularly simple for a homogeneous isotropic circular scatterer with refractive index $n_i$;
+in this case, the total field $F_z$ inside $S_i$ can also be written as a Fourier-Bessel series,
+$$F_{zi}^{\mathrm{int}}(\rho_i,\phi_i) = \sum_{m\in\mathbb{Z}} c_{im}\, J_m(k_0 n_i\rho_i)\, e^{im\phi_i}, \tag{5.4}$$
+and since the surface of $S_i$ coincides with a constant coordinate line of the polar coordinate system
+anchored at the centre of $S_i$, field matching can be done analytically and in fact the matrix $\hat S_i$ becomes
+diagonal.
+We shall now show that Maxwell’s equations describing wave propagation in a homogeneous medium
+can also be reduced to a Helmholtz equation if the medium has gyrotropic permittivity and permeability
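+of the form
+$$\hat\epsilon \equiv \begin{bmatrix} \epsilon_t & i\epsilon_g & 0 \\ -i\epsilon_g & \epsilon_t & 0 \\ 0 & 0 & \epsilon_z \end{bmatrix} \quad\text{and}\quad \hat\mu \equiv \begin{bmatrix} \mu_t & i\mu_g & 0 \\ -i\mu_g & \mu_t & 0 \\ 0 & 0 & \mu_z \end{bmatrix}. \tag{5.5}$$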
+We shall focus on p polarisation; the results for s polarisation can be obtained from the duality principle
+[65, p. 72–73]. Substituting eqs. (5.5) into Maxwell’s equations for p polarisation, eqs. (1.7), and writing
+the differential operators explicitly in Cartesian coordinates, we get
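+$$\frac{\partial E_y}{\partial x} - \frac{\partial E_x}{\partial y} = i\omega\mu_0\mu_z H_z, \tag{5.6a}$$
+$$\frac{\partial H_z}{\partial y} = -i\omega\epsilon_0\,(\epsilon_t E_x + i\epsilon_g E_y), \tag{5.6b}$$
+$$-\frac{\partial H_z}{\partial x} = -i\omega\epsilon_0\,(-i\epsilon_g E_x + \epsilon_t E_y). \tag{5.6c}$$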
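+Solving the two last equations for the components of $\vec E$, we obtain
+$$E_x = \frac{1}{i\omega\epsilon_0(\epsilon_g^2-\epsilon_t^2)}\left(i\epsilon_g\frac{\partial H_z}{\partial x} + \epsilon_t\frac{\partial H_z}{\partial y}\right), \tag{5.7a}$$
+$$E_y = \frac{1}{i\omega\epsilon_0(\epsilon_g^2-\epsilon_t^2)}\left(-\epsilon_t\frac{\partial H_z}{\partial x} + i\epsilon_g\frac{\partial H_z}{\partial y}\right). \tag{5.7b}$$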
+Substitution of these expressions into eq. (5.6a) yields
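+$$\frac{\partial^2 H_z}{\partial x^2} + \frac{\partial^2 H_z}{\partial y^2} + k_0^2\,\frac{\epsilon_t^2-\epsilon_g^2}{\epsilon_t}\,\mu_z H_z = 0. \tag{5.8}$$
+Thus, the field $H_z$ fulfils a Helmholtz equation with an “effective refractive index”
+$$n' \equiv \bigl[(\epsilon_t - \epsilon_g^2/\epsilon_t)\,\mu_z\bigr]^{1/2}. \tag{5.9}$$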
+It is also possible to derive analytically the expression for the entries of the scattering matrix $\hat S$ of a
+homogeneous gyrotropic cylinder $S$ of radius $R$ embedded in a gyrotropic matrix. We need to impose the
+conditions of continuity of the components of the electric and magnetic fields tangential to the surface
+of $S$, i.e., $H_z$ and $E_\phi$. The field $H_z$ on the exterior side of the surface of $S$ is given by
+$$H_z^{\mathrm{ext}}(R,\phi) = \sum_{m\in\mathbb{Z}} \bigl[a_m J_m(k_0 n'_{\mathrm{ext}}R) + b_m H_m^{(1)}(k_0 n'_{\mathrm{ext}}R)\bigr]\, e^{im\phi}, \tag{5.10a}$$
+5.1. Multiple-scattering method for systems containing gyrotropic media 117
+and on the interior side,
+$$H_z^{\mathrm{int}}(R,\phi) = \sum_{m\in\mathbb{Z}} c_m J_m(k_0 n'_{\mathrm{int}}R)\, e^{im\phi}; \tag{5.10b}$$
+in these formulas, the subscripts “int” and “ext” label quantities measured on the interior and exterior
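+side of the surface of $S$. Equations (5.7) imply that
+$$E_\phi = \frac{1}{i\omega\epsilon_0(\epsilon_g^2-\epsilon_t^2)}\left(-\epsilon_t\frac{\partial H_z}{\partial r} + \frac{i\epsilon_g}{r}\frac{\partial H_z}{\partial\phi}\right), \tag{5.11}$$
+hence
+$$E_\phi^{\mathrm{ext}}(R,\phi) = -\frac{1}{i\omega\epsilon_0}\sum_{m\in\mathbb{Z}}\left[a_m\,\frac{(m\epsilon_{g,\mathrm{ext}}/R)\,J_m(k_0 n'_{\mathrm{ext}}R) + \epsilon_{t,\mathrm{ext}}k_0 n'_{\mathrm{ext}}\,J_m'(k_0 n'_{\mathrm{ext}}R)}{\epsilon_{g,\mathrm{ext}}^2-\epsilon_{t,\mathrm{ext}}^2} + b_m\,\frac{(m\epsilon_{g,\mathrm{ext}}/R)\,H_m^{(1)}(k_0 n'_{\mathrm{ext}}R) + \epsilon_{t,\mathrm{ext}}k_0 n'_{\mathrm{ext}}\,H_m^{(1)\prime}(k_0 n'_{\mathrm{ext}}R)}{\epsilon_{g,\mathrm{ext}}^2-\epsilon_{t,\mathrm{ext}}^2}\right] e^{im\phi}, \tag{5.12a}$$
+$$E_\phi^{\mathrm{int}}(R,\phi) = -\frac{1}{i\omega\epsilon_0}\sum_{m\in\mathbb{Z}} c_m\,\frac{(m\epsilon_{g,\mathrm{int}}/R)\,J_m(k_0 n'_{\mathrm{int}}R) + \epsilon_{t,\mathrm{int}}k_0 n'_{\mathrm{int}}\,J_m'(k_0 n'_{\mathrm{int}}R)}{\epsilon_{g,\mathrm{int}}^2-\epsilon_{t,\mathrm{int}}^2}\, e^{im\phi}, \tag{5.12b}$$
+where the symbols $J_m'(x)$ and $H_m^{(1)\prime}(x)$ denote the derivatives of the Bessel and Hankel functions at $x$.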
+To condense the notation, we can rewrite eqs. (5.10) and (5.12) in the form
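+$$H_z^{\mathrm{ext}}(R,\phi) = \sum_{m\in\mathbb{Z}} (A_m^H a_m + B_m^H b_m)\, e^{im\phi}, \qquad H_z^{\mathrm{int}}(R,\phi) = \sum_{m\in\mathbb{Z}} C_m^H c_m\, e^{im\phi}, \tag{5.13a}$$
+$$E_\phi^{\mathrm{ext}}(R,\phi) = \sum_{m\in\mathbb{Z}} (A_m^E a_m + B_m^E b_m)\, e^{im\phi}, \qquad E_\phi^{\mathrm{int}}(R,\phi) = \sum_{m\in\mathbb{Z}} C_m^E c_m\, e^{im\phi}, \tag{5.13b}$$
+where the definitions of the constant coefficients $A_m^H$ etc. can be obtained straightforwardly by com-
+paring the above expressions with eqs. (5.10) and (5.12). Imposing now the conditions $H_z^{\mathrm{ext}}(R,\phi) = H_z^{\mathrm{int}}(R,\phi)$
+and $E_\phi^{\mathrm{ext}}(R,\phi) = E_\phi^{\mathrm{int}}(R,\phi)$ for all $\phi \in [0, 2\pi)$ and noting that, owing to the orthogonality
+of the functions $e^{im\phi}$ ($m \in \mathbb{Z}$) on this interval, the sums over $m$ can be dropped, we arrive finally at the
+formulas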
+$$b_m = -\frac{A_m^H C_m^E - A_m^E C_m^H}{B_m^H C_m^E - B_m^E C_m^H}\, a_m, \tag{5.14a}$$
+$$c_m = -\frac{A_m^H B_m^E - A_m^E B_m^H}{B_m^H C_m^E - B_m^E C_m^H}\, a_m. \tag{5.14b}$$
+Thus, by virtue of eq. (5.14a), we conclude that the scattering matrix $\hat S$ of a gyrotropic cylinder embedded
+in a gyrotropic matrix is diagonal and its elements are given by
+$$S_{mn} = -\frac{A_m^H C_m^E - A_m^E C_m^H}{B_m^H C_m^E - B_m^E C_m^H}\, \delta_{mn}. \tag{5.15}$$
+We have thus demonstrated that only minor modifications of the multiple-scattering method are nec-
+essary to make it able to tackle gyrotropic materials. First, the refractive index $n$ supplied to the argument
+of Bessel functions must be replaced by the “effective refractive index” $n'$ defined in eq. (5.9). Second,
+118 Chapter 5. Numerical methods
+the formulas for the entries of the scattering matrix of a cylinder acquire additional terms proportional to
+the off-diagonal elements of the material property tensors.
+It is natural to ask whether these steps suffice for different classes of anisotropic materials. The
+answer is, unfortunately, negative. For instance, consider the case of a medium with permittivity
+$\hat\epsilon \equiv \operatorname{diag}(\epsilon_x, \epsilon_y, \epsilon_z)$ with $\epsilon_x \ne \epsilon_y$. The transformation of Maxwell’s equations into the Helmholtz equation
+comes now at the price of the change of coordinates
+$$(x, y) \mapsto (s_x x, s_y y) \quad\text{with}\quad \frac{s_x}{s_y} = \sqrt{\frac{\epsilon_y}{\epsilon_x}} \ne 1. \tag{5.16}$$
+An unwelcome side-effect of this change of coordinates is the mapping of circles into ellipses. This has
+two consequences. First, the elements of the scattering matrix of a circular cylinder cease to be diagonal
+and have to be determined in a more complicated way than that presented above, since after the mapping
+the cylinder’s surface does not coincide any more with a line of constant polar coordinates. Second, if
+it is the matrix (rather than the scatterer) that is anisotropic, the mapping (5.16) may cause the circles
+circumscribing the scatterers to overlap. It is well known that if this overlap is sufficiently large, the
+Fourier-Bessel expansion (5.2c) of the scattered field becomes invalid and the multiple-scattering theory
+in its classical form cannot be applied [179, 180].
+5.2 Calculation of photonic-crystal band structures
+with Fourier-Bessel expansions
+5.2.1 Introduction
+The multiple-scattering method, whose extension to MO materials we have presented in the previous
+section, has long been recognised as one of the most efficient techniques of modelling finite PCs com-
+posed of circular cylinders. The reason for this is twofold: first, the basis functions used to expand the
+fields are exact solutions of Maxwell’s equations, and hence they are well-adapted for the representation
+of these fields; second, since the basis functions are separable in polar coordinates, it is easy to apply the
+electromagnetic boundary conditions at the surfaces of the cylinders.
+In view of these advantages of the multiple-scattering method, it is tempting to extend its domain of
+application to the calculation of band structures of infinite PCs. Such an extension has indeed been made
+both for PCs composed of cylinders and spheres [41–47]. In this approach it is necessary to calculate ex-
+plicitly the field produced by an infinite number of scatterers arranged on a periodic lattice, which can be
+expressed by a series termed a lattice sum. Unfortunately, lattice sums are slowly convergent, and special
+techniques needed for acceleration of their computation complicate significantly the implementation of
+the method with respect to the finite-system case.
+Here we propose a much simpler technique of calculating band structures of PCs composed of cir-
+cular cylinders. Like the multiple-scattering method, it relies on Fourier-Bessel field expansions, but it
+dispenses with the calculation of lattice sums. The underlying idea is very simple: the field in a unit cell
+of a PC is expanded in terms of particular solutions of the Helmholtz equation, and the Bloch conditions
+on the boundaries of the cell are imposed by collocation (point matching). This approach is actually
+similar to the technique used in the fictitious-sources method to avoid the calculation of periodic Green’s
+functions in simulations of gratings [48]. The method is easy in implementation and it leads to expo-
+nential convergence of the band structure, potentially yielding very high relative accuracy, as will be
+demonstrated in the following.
+The proposed method shares many features with the technique of Dirichlet-to-Neumann mappings
+developed in the group of Lu [49, 50]. In their approach, a field expansion in particular solutions of the
+5.2. Calculation of photonic-crystal band structures with Fourier-Bessel expansions 119
+Helmholtz equation is used to calculate a finite-dimensional approximation of the Dirichlet-to-Neumann
+operator that maps the distribution of the field on the unit cell’s boundary to that of the normal derivative
+of this field. The resulting operator can then be used to calculate the band structure of the PC. Our method
+is more direct and more efficient, since it does not require the construction of the Dirichlet-to-Neumann
+matrix, and hence dispenses with the need of performing a matrix inversion. On the other hand, it is
+also less powerful, since a Dirichlet-to-Neumann operator can be used for the sake of computing not
+only a band structure, but also, for instance, the transmission and reflection coefficients of a finite or
+semi-infinite PC [50]. One could say that while the method of Lu et al. is more general, ours has been
+specifically tailored to band-structure calculations.
+In the next subsection we shall present the formulation of the proposed technique. Some concrete
+numerical examples of its application will be given in subsection 5.2.3, and the obtained results will be
+briefly discussed in subsection 5.2.4.
+5.2.2 Formulation
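+Let us consider a 2D PC whose unit cell, shown in fig. 5.1(a), is composed of $M$ nonoverlapping circular
+inclusions of radius $r_m$, permittivity $\hat\epsilon_m$ and permeability $\hat\mu_m$ ($m = 1, 2, \ldots, M$), embedded in a matrix
+with permittivity $\hat\epsilon_0$ and permeability $\hat\mu_0$. The tensors $\hat\epsilon_m$ and $\hat\mu_m$ ($m = 0, 1, \ldots, M$) are assumed to
+have the (gyrotropic) form
+$$\hat\epsilon_m \equiv \begin{bmatrix} \epsilon_{tm} & i\epsilon_{gm} & 0 \\ -i\epsilon_{gm} & \epsilon_{tm} & 0 \\ 0 & 0 & \epsilon_{zm} \end{bmatrix} \quad\text{and}\quad \hat\mu_m \equiv \begin{bmatrix} \mu_{tm} & i\mu_{gm} & 0 \\ -i\mu_{gm} & \mu_{tm} & 0 \\ 0 & 0 & \mu_{zm} \end{bmatrix}. \tag{5.17}$$
+As we have shown in section 5.1, for p polarisation, Maxwell’s equations in a homogeneous region
+with permittivity $\hat\epsilon_m$ and permeability $\hat\mu_m$ reduce to the Helmholtz equation for the $z$ component of the
+magnetic field, $H_z$:
+$$\nabla^2 H_z + k_m^2 H_z = 0, \tag{5.18}$$
+where
+$$k_m \equiv \frac{\omega}{c}\left[\left(\epsilon_{tm} - \frac{\epsilon_{gm}^2}{\epsilon_{tm}}\right)\mu_{zm}\right]^{1/2}. \tag{5.19}$$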
+The corresponding equation for s polarisation can be obtained simply from the duality principle [65, p.
+72–73]. Vekua [181, section 22] showed that every regular solution of the Helmholtz equation (5.18) in
+a multi-connected domain $D \equiv D_0 \setminus (C_1 \cup C_2 \cup \cdots \cup C_M)$, where $D_0$, $C_1$, $C_2$, …, $C_M$ are simply-
+connected domains and $C_1, C_2, \ldots, C_M \subset D_0$, can be approximated uniformly by a linear combination
+of the functions
+$$J_l(k_m\rho)\, e^{il\phi} \quad\text{and}\quad Y_l(k_m\rho_m)\, e^{il\phi_m} \quad\text{for } l \in \mathbb{Z} \text{ and } m = 1, 2, \ldots, M, \tag{5.20}$$
+where $(\rho,\phi)$ are standard polar coordinates and $(\rho_m,\phi_m)$ are the polar coordinates defined with respect
+to the point $O_m \in C_m$ [see fig. 5.1(b)].
+We shall use Vekua’s theorem to determine the representation of the field in the PC unit cell shown
+in fig. 5.1(a). We divide it into $M' \ge M$ polygonal subcells, each containing exactly one circular
+inclusion. (For numerical purposes it can be advantageous to introduce subcells containing no “physical”
+inclusions; these can be treated as if they contained an inclusion with permittivity $\hat\epsilon_0$, permeability $\hat\mu_0$
+and a sufficiently small radius.) Inside the inclusion of the $m$th subcell, the solution of the Helmholtz
+equation can be approximated by the series
+$$H_{z,\mathrm{in}}^{(L)}(\rho_m,\phi_m) \equiv \sum_{l=-L}^{L} c_{ml}^{(L)}\, J_l(k_m\rho_m)\, e^{il\phi_m}, \tag{5.21}$$
+120 Chapter 5. Numerical methods
+D0
+P
+C1
+1
+1
+ 2
+O1
+ 
+C
+2 2
+O O2
+(a) (b)
+Figure 5.1 (a) Geometry of a PC’s unit cell that contains $M = 3$ circular inclusions embedded in a homogeneous
+matrix. It is subsequently divided into $M' = 4$ quadrilateral subcells. (b) Schema of the domain $D$ referred to in
+Vekua’s theorem. Note that the symbol $D_0$ denotes the whole interior of the large contour, whereas $D$ stands for
+the shaded region.
+with the polar coordinates $(\rho_m,\phi_m)$ defined with respect to the origin $O_m$ lying in the centre of the
+inclusion. In turn, the field outside the inclusion can be approximated by
+$$H_{z,\mathrm{out}}^{(L)}(\rho_m,\phi_m) \equiv \sum_{l=-L}^{L} \bigl[a_{ml}^{(L)} J_l(k_0\rho_m) + b_{ml}^{(L)} Y_l(k_0\rho_m)\bigr]\, e^{il\phi_m}. \tag{5.22}$$
+The superscripts .L/ in the above formulas stress that, according to Vekua’s theorem, the system
+(5.20) is complete, but need not be a basis. In other words, it is not guaranteed, for instance, that there
+exist coefficients $a_{ml}$ and $b_{ml}$ ($l \in \mathbb{Z}$) such that the series
+$$\sum_{l\in\mathbb{Z}} \bigl[a_{ml} J_l(k_0\rho_m) + b_{ml} Y_l(k_0\rho_m)\bigr]\, e^{il\phi_m} \tag{5.23}$$
+converges to the true solution $H_{z,\mathrm{out}}(\rho_m,\phi_m)$. What is guaranteed is that a finite superposition of the
+functions (5.20) can be found that approximates Hz;out.m; m/ to any desired accuracy  > 0. This is
+quite sufficient for practical purposes. An example illustrating clearly the difference between a basis and
+a complete set is given by Christensen [182, pp. 98–99]. For compactness of notation, the superscripts
+.L/ will be dropped from now on.
+At the present stage, to each subcell correspond three families of unknown coefficients: aml , bml
+and cml . The former two can be easily expressed in terms of the latter one by imposing analytically the
+electromagnetic boundary conditions at the surfaces of the circular inclusions. This is done exactly in
+the same way as in the multiple-scattering method, and has been detailed in ref. 40 for the isotropic case
+and in section 5.1 of this thesis for the gyrotropic case. Therefore, we do not describe it again here. In
+any case, this procedure leads to expressions of the form
+aml = Amlcml and bml = Bmlcml ; (5.24)
+where $A_{ml}$ and $B_{ml}$ are known. Substituting them into eq. (5.22), we get
+$$H_{z,\mathrm{out}}(\rho_m,\phi_m) \approx \sum_{l=-L}^{L} c_{ml}\,\bigl[A_{ml} J_l(k_0\rho_m) + B_{ml} Y_l(k_0\rho_m)\bigr]\, e^{il\phi_m}. \tag{5.25}$$
+To determine the values of cml , we impose appropriate boundary conditions at discrete collocation points
+distributed on the inter-subcell boundaries, which can be divided into two classes. On an interface of two
+5.2. Calculation of photonic-crystal band structures with Fourier-Bessel expansions 121
+subcells belonging to the same unit cell, we impose the continuity of Hz and its derivative normal to
+that interface. (The continuity of the tangential derivative should follow, in the limit of infinitely many
+collocation points, from the continuity of Hz itself.) On an external boundary of a unit cell, in turn,
+we impose Bloch conditions on Hz and its normal derivative. Assuming that the number of collocation
+points is equal to half the number of unknowns cml , the above procedure leads to a homogeneous system
+of linear equations, whose matrix is square and depends on the Bloch vector kE. This system is subse-
+quently transformed into a generalised eigenvalue problem for one of the components of kE, as will be
+demonstrated on an example later in this section.
+In the meantime, there is a technical difficulty to be resolved. As we have seen, we have always an
+even number of boundary conditions. However, the expansion (5.25) contains an odd number ($2L+1$)
+of coefficients $c_{ml}$. In order to match the number of equations and that of unknowns, it is necessary
+to dispense with one coefficient. To this end, we follow a procedure used in spectral Fourier-expansion
+techniques [183, subsection 2.2.1]. We rewrite the exponential functions $e^{il\phi_m}$ in eq. (5.25) in terms of
+the trigonometric functions $\cos(l\phi_m)$ and $\sin(l\phi_m)$, and use the relations $J_{-l}(x) = (-1)^l J_l(x)$,
+$Y_{-l}(x) = (-1)^l Y_l(x)$, $A_{m,-l} = A_{ml}$ and $B_{m,-l} = B_{ml}$ to convert the series from eq. (5.25) to the form
+$$H_{z,\mathrm{out}}(\rho_m,\phi_m) \approx \sum_{l=0}^{L} \bigl[A_{ml} J_l(k_0\rho_m) + B_{ml} Y_l(k_0\rho_m)\bigr]\bigl[d_{ml}^{\mathrm{c}}\cos(l\phi_m) + d_{ml}^{\mathrm{s}}\sin(l\phi_m)\bigr], \tag{5.26}$$
+where
+$$d_{ml}^{\mathrm{c}} \equiv c_{ml} + (-1)^l c_{m,-l} \quad\text{and}\quad d_{ml}^{\mathrm{s}} \equiv i\bigl[c_{ml} - (-1)^l c_{m,-l}\bigr]. \tag{5.27}$$
+We set now $d_{mL}^{\mathrm{s}} = 0$, obtaining
+$$H_{z,\mathrm{out}}(\rho_m,\phi_m) \approx \sum_{l=0}^{L} d_{ml}^{\mathrm{c}}\,\bigl[A_{ml} J_l(k_0\rho_m) + B_{ml} Y_l(k_0\rho_m)\bigr]\cos(l\phi_m) + \sum_{l=1}^{L-1} d_{ml}^{\mathrm{s}}\,\bigl[A_{ml} J_l(k_0\rho_m) + B_{ml} Y_l(k_0\rho_m)\bigr]\sin(l\phi_m) \tag{5.28}$$
+and reducing the total number of unknowns to $2L$.
+We shall now present in detail the conversion of the square system of linear equations resulting from
+the collocation procedure to an eigenvalue problem, considering the example case of a PC composed
+of a hexagonal lattice of cylinders, shown in fig. 5.2(a). Its unit cell can be chosen as the Wigner-Seitz
+cell delimited by the segments $\Sigma_i$ ($i = 1, 2, \ldots, 6$). Since it contains only a single inclusion, it is not
+necessary to divide it into subcells. Let us assume that on each segment $\Sigma_i$, $L/3$ collocation points with
+polar coordinates $(\rho_{1,ij}, \phi_{1,ij})$ ($j = 1, 2, \ldots, L/3$) are distributed so that the positions of the points lying
+on opposite sides of the cell differ by a lattice vector. Let us denote by $\hat H_i$ the matrix of size $(L/3, 2L)$
+that, right-multiplied by the vector of unknowns $\vec d \equiv [d_{1,0}^{\mathrm{c}}, d_{1,1}^{\mathrm{c}}, \ldots, d_{1,L}^{\mathrm{c}}, d_{1,1}^{\mathrm{s}}, d_{1,2}^{\mathrm{s}}, \ldots, d_{1,L-1}^{\mathrm{s}}]^{\mathrm{T}}$,
+will produce the vector of values of the field $H_z$ at the collocation points lying on the segment $\Sigma_i$. From
+eq. (5.28), the elements ofHO i are given by (
+O C  cos.l1;ij / for l = 0; 1; : : : ; L;.Hi /jl = ŒA1lJl.k01;ij / B1lYl.k01;ij / C C (5.29)sin.l1;ij / for l = L 1;L 2; : : : ; 2L:
+The analogous matrix that, right-multiplied by dE, will produce the vector of derivatives of Hz taken in
+the direction normal to ˙ will be denoted byHO 0i i .
+122 Chapter 5. Numerical methods
+bE2
+aE2
+a ˙3 ˙2
+M
+˙ r4 ˙1
+0
+aE   K M1
+collocation ˙5 ˙6
+E
+points b1
+(a) (b)
+Figure 5.2 (a) Geometry of a hexagonal-lattice PC composed of circular air holes etched in a dielectric matrix.
+A Wigner-Seitz unit cell is marked by shading. (b) Reciprocal space of this PC. Large dots mark the positions
+of reciprocal lattice points. The hexagonal first Brillouin zone is also shown; its irreducible part $\Gamma MK$ has been
+shaded.
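+In this matrix notation, the equations resulting from imposition of the Bloch boundary conditions at
+all the collocation points then take the form
+\[
+\begin{aligned}
+\hat H_1 \vec d &= e^{i\vec k\cdot\vec a_1}\, \hat H_4 \vec d, & \hat H'_1 \vec d &= -e^{i\vec k\cdot\vec a_1}\, \hat H'_4 \vec d, \\
+\hat H_2 \vec d &= e^{i\vec k\cdot\vec a_2}\, \hat H_5 \vec d, & \hat H'_2 \vec d &= -e^{i\vec k\cdot\vec a_2}\, \hat H'_5 \vec d, \\
+\hat H_3 \vec d &= e^{i\vec k\cdot(\vec a_2 - \vec a_1)}\, \hat H_6 \vec d, & \hat H'_3 \vec d &= -e^{i\vec k\cdot(\vec a_2 - \vec a_1)}\, \hat H'_6 \vec d,
+\end{aligned} \tag{5.30}
+\]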
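+where $\vec a_1 \equiv (a, 0)$ and $\vec a_2 \equiv (\tfrac{1}{2}a, \tfrac{\sqrt{3}}{2}a)$ denote the basis vectors of the hexagonal lattice shown in fig.
+5.2(a). The Bloch vector $\vec k$ can be expressed as $\vec k = k_1 \vec b_1 + k_2 \vec b_2$, where $\vec b_1 \equiv \tfrac{2\pi}{a}(1, -1/\sqrt{3})$ and
+$\vec b_2 \equiv \tfrac{2\pi}{a}(0, 2/\sqrt{3})$ are the basis vectors of the reciprocal lattice of the PC in question, shown in fig.
+5.2(b), and have the property $\vec a_i \cdot \vec b_j = 2\pi\delta_{ij}$. Consequently, eqs. (5.30) can be rewritten as
+\[
+\begin{aligned}
+(\hat H_1 - e^{2\pi i k_1} \hat H_4)\,\vec d &= 0, & (\hat H'_1 + e^{2\pi i k_1} \hat H'_4)\,\vec d &= 0, \\
+(\hat H_2 - e^{2\pi i k_2} \hat H_5)\,\vec d &= 0, & (\hat H'_2 + e^{2\pi i k_2} \hat H'_5)\,\vec d &= 0, \\
+(e^{2\pi i k_1} \hat H_3 - e^{2\pi i k_2} \hat H_6)\,\vec d &= 0, & (e^{2\pi i k_1} \hat H'_3 + e^{2\pi i k_2} \hat H'_6)\,\vec d &= 0.
+\end{aligned} \tag{5.31}
+\]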
+To bring this system into the form of an eigenvalue problem, we can fix the value of some linear combi-
+nation of $k_1$ and $k_2$. For instance, calculations of the band structure of the hexagonal-lattice PC from fig.
+5.2(a) are most often done along the boundaries of the irreducible fragment of its first Brillouin zone, the
+triangle $\Gamma MK$, shown in fig. 5.2(b). On the segment $\Gamma M$, the Bloch vector $\vec k$ has the form $\vec k = \kappa\vec b_1 + \kappa\vec b_2$
+with $0 \le \kappa \le \tfrac{1}{2}$. Thus, setting $k_1 = k_2 \equiv \kappa$ in eq. (5.31) and reordering terms, we obtain the linear
+eigenvalue problem
+\[
+\begin{bmatrix} \hat H_1 \\ \hat H'_1 \\ \hat H_2 \\ \hat H'_2 \\ \hat H_3 - \hat H_6 \\ \hat H'_3 + \hat H'_6 \end{bmatrix} \vec d
+= e^{2\pi i\kappa}
+\begin{bmatrix} \hat H_4 \\ -\hat H'_4 \\ \hat H_5 \\ -\hat H'_5 \\ \hat 0 \\ \hat 0 \end{bmatrix} \vec d. \tag{5.32}
+\]
+5.2. Calculation of photonic-crystal band structures with Fourier-Bessel expansions 123
+Since the matrices $\hat H_i$ and $\hat H'_i$ have dimensions $(L/3, 2L)$, it can be easily verified that the matrices in
+the above equation are square.
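+Things are slightly more complex for the segment $\Gamma K$. There, the Bloch vector $\vec k = 2\kappa\vec b_1 + \kappa\vec b_2$
+with $0 \le \kappa \le \tfrac{1}{3}$, and eqs. (5.31) reduce to the quadratic eigenvalue problem
+\[
+\begin{bmatrix} \hat H_1 \\ \hat H'_1 \\ \hat H_2 \\ \hat H'_2 \\ -\hat H_6 \\ \hat H'_6 \end{bmatrix} \vec d
++ e^{2\pi i\kappa}
+\begin{bmatrix} \hat 0 \\ \hat 0 \\ -\hat H_5 \\ \hat H'_5 \\ \hat H_3 \\ \hat H'_3 \end{bmatrix} \vec d
++ e^{4\pi i\kappa}
+\begin{bmatrix} -\hat H_4 \\ \hat H'_4 \\ \hat 0 \\ \hat 0 \\ \hat 0 \\ \hat 0 \end{bmatrix} \vec d = 0. \tag{5.33}
+\]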
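+This problem can be solved in a number of ways [184]. The most popular of them, which we employ
+here, is linearisation: given an equation of the form $(\hat A + \lambda\hat B + \lambda^2\hat C)\,\vec x = 0$, one defines $\vec y \equiv \lambda\vec x$ and
+solves a linear eigenvalue problem of double size, e.g.,
+\[
+\begin{bmatrix} \hat A & \hat B \\ \hat 0 & \hat I \end{bmatrix}
+\begin{bmatrix} \vec x \\ \vec y \end{bmatrix}
+= \lambda
+\begin{bmatrix} \hat 0 & -\hat C \\ \hat I & \hat 0 \end{bmatrix}
+\begin{bmatrix} \vec x \\ \vec y \end{bmatrix}, \tag{5.34}
+\]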
+where IO denotes the identity matrix. Alternative linearisations are also possible, but they are advanta-
+geous primarily if the original quadratic eigenvalue problem has a particular structure—for instance, is
+symmetric—which is not the case here.
+The band structure on the $KM$ segment could be calculated by solving a third eigenvalue problem
+obtained from eq. (5.31) by imposing the constraint $k_1 + k_2 = 1$. However, owing to the six-fold
+rotational symmetry of the PC from fig. 5.2(a), its dispersion diagram on $KM$ is identical with that on
+the segment $KM'$, shown in fig. 5.2(b), which is collinear with $\Gamma K$. Thus, the band structure on $\Gamma K$ and
+$KM'$ can be obtained simultaneously by solving the eigenvalue problem (5.33); values of $\kappa$ belonging
+to the intervals $[0, \tfrac{1}{3}]$ and $[\tfrac{1}{3}, \tfrac{1}{2}]$ will then correspond to Bloch vectors lying on the segments $\Gamma K$ and
+$KM'$, respectively.
+5.2.3 Numerical examples
+We shall now apply the method introduced in the previous subsections to the determination of the band
+structure of several example PCs. The results obtained with this technique will be compared to those
+produced by another, well-tested code. We shall also examine the convergence rate of Fourier-Bessel
+expansions and discuss some technical details of the implementation of the proposed method.
+We begin with the simple case of a PC composed of a hexagonal lattice of air holes of radius $r = 0.3a$,
+where $a$ is the lattice constant, etched in a dielectric matrix with refractive index 2.5, as shown
+schematically in fig. 5.2(a); this is in fact the PC introduced in section 4.4. First, it is necessary to check
+whether the proposed method yields results convergent with increasing truncation order $L$. We shall
+therefore study how the changes in $L$ influence the magnitude of the Bloch vector $\vec k$ of the state located
+on the $\Gamma M$ segment and having frequency $\omega = 0.40 \times 2\pi c/a$ (chosen arbitrarily). In practice, the
+determination of the error of a calculated value of $k$ is complicated by the fact that the exact magnitude
+of $\vec k$ is not known. As a workaround, given a series of values $k_i$ ($i = 1, 2, \ldots, N_L$) obtained at several
+monotonically increasing truncation orders $L_i$, we shall take as a reference the value $k_i$ for which the
+expression $(|k_i - k_{i-1}| + |k_i - k_{i+1}|)/|k_i|$ is smallest.
+The collocation points on all boundaries $\Sigma_i$ ($i = 1, 2, \ldots, 6$) of the unit cell will be initially placed
+at the Gauss-Legendre quadrature points, i.e., at the roots of the Legendre polynomial of order $L/3 + 1$
+[183, p. 252]. This choice will be later demonstrated to be near-optimal.
+124 Chapter 5. Numerical methods
+100
+(a) (b) Equidistant
+  Chebyshev10 5 Legendre
+10 10 No bal.
+Bal. (1)
+10 15 Bal. (2)
+0 50 100 150 200 0 50 100 150 200
+L L
+Figure 5.3 (a) Convergence of the magnitude of the Bloch vector $\vec k$ of the state located on the $\Gamma M$ seg-
+ment in the first Brillouin zone of the hexagonal-lattice PC shown in fig. 5.2(a). The frequency was fixed to
+$\omega = 0.40 \times 2\pi c/a$. The different data series refer to results obtained with different levels of eigenvalue-problem
+balancing. Crosses: no balancing. Black circles: out-of-the-box balancing as provided by LAPACK. White cir-
+cles: balancing preceded by elimination of nonzero matrix entries due to round-off error, as described in the text.
+(b) Convergence of k with three different distributions of collocation points: equidistant points (crosses), Gauss-
+Chebyshev quadrature points (black circles), Gauss-Legendre quadrature points (white circles).
+Since Bessel functions of different orders vary greatly in magnitude for a fixed argument, the eigen-
+value problems (5.32) and (5.33) very quickly become numerically close to singular if no rescaling of
+the basis functions is done. This leads to erroneous results. As a remedy, it is possible to scale the
+basis functions manually, e.g., by normalising them to the value they attain at a typical (in some sense)
+distance from the collocation points to the origin of the coordinate system. However, we found it more
+convenient to rely on the matrix-pair balancing algorithm due to Ward [185], which can be invoked auto-
+matically by the generalised non-symmetric eigensolver routine ggevx from the LAPACK library [186].
+In fig. 5.3(a) the points marked with black circles show the convergence of $k$ calculated in this way with
+the truncation order $L$. Clearly, relative accuracy of $10^{-7}$ is achieved in a fairly wide range of trunca-
+tion orders. However, there is still room for improvement, since the machine precision is much higher
+($10^{-16}$).
+The performance of the balancing algorithm of Ward [185] is degraded by the presence of small
+matrix elements due to round-off error [187, balance function]. Such entries do occur in our case; they
+correspond to collocation points located on nodal lines of trigonometric functions $\cos(l\phi_m)$ and $\sin(l\phi_m)$
+of various orders $l$ [cf. eq. (5.29)]. It is impractical to locate such points by hand. Therefore we have
+used instead a heuristic procedure that looks for matrix entries smaller than a given fraction $\eta$ of the
+average magnitude of the elements of the column they lie in. These entries are subsequently replaced
+with zeros. The value $\eta = 10^{-10}$ seems to work well. As demonstrated by the series marked with white
+circles in fig. 5.3(a), introduction of this procedure leads to a significant increase of the attainable relative
+accuracy, which reaches $10^{-14}$.
+We have also studied the dependence of the convergence rate on the placement of collocation points.
+Three distributions were considered: Gauss-Legendre, Gauss-Chebyshev and equispaced. As shown in
+fig. 5.3(b), the former two yield approximately the same convergence rate of k (the Gauss-Legendre
+distribution performing marginally better), while the equispaced points fare distinctly worse. These
+tendencies have also been observed for other frequencies and PC geometries. Thus, in the remaining
+examples we use the Gauss-Legendre distribution.
+In figs. 5.4(a) and (b) the band structures of the crystal from fig. 5.2 computed for p and s polarisa-
+tions with the method under study are compared with the data obtained using the MPB library [188]. For
+both polarisations, a perfect visual agreement can be seen.
+Relative error
+5.2. Calculation of photonic-crystal band structures with Fourier-Bessel expansions 125
+0:4 (a) (b)
+0:2
+0:0
+  M K     M K  
+Figure 5.4 Comparison of the (a) p-polarisation and (b) s-polarisation band structure of the hexagonal-lattice
+crystal from fig. 5.2, calculated with the method described here (points) and with the MPB library (lines).
+aE bE2 2
+M
+r
+aE   X1 bE1
+a
+a
+(a) (b)
+Figure 5.5 (a) Geometry of a square-lattice PC composed of circular air holes etched in a dielectric matrix. A
+Wigner-Seitz unit cell is marked by shading. (b) Reciprocal space of this PC. Large dots mark the positions of
+reciprocal lattice points. The square first Brillouin zone is also shown; its irreducible part $\Gamma MX$ has been shaded.
+We shall now move on to the analysis of the square-lattice PC shown in fig. 5.5(a), composed of air
+holes of radius $r$ etched in a dielectric matrix with refractive index 3.4. We shall focus on the case of
+large $r$ (close to $\tfrac{1}{2}a$). Without Vekua’s theory, one could have doubts about the validity of the method
+for $r > a(1 - \sqrt{2}/2) \approx 0.29a$, since in this case the circumscribed circle of a unit cell crosses the
+inclusions from the neighbouring cells, and hence it is not clear whether a Fourier-Bessel representation
+of the field near the cell corners is valid. We shall show that even for $r \approx \tfrac{1}{2}a$ the method still produces
+correct results, in accordance with Vekua’s assertion.
+Figure 5.6 shows the juxtaposition of the band structures of the PC from fig. 5.5(a) with $r = 0.49a$
+obtained with the present technique and with MPB. As before, a perfect visual agreement is apparent.
+In turn, in fig. 5.7 we compare the convergence of the magnitude of the vector $\vec k$ of a Bloch state lying
+on the $\Gamma M$ segment for the two polarisations and three values of $r$: $0.45a$, $0.49a$ and $0.50a$. In each
+case, the frequency is fixed so as to correspond to $k$ roughly equal to $0.25 \times 2\pi/a$. It can be seen that in the
+p polarisation case the convergence slows down distinctly as $r$ approaches $0.50a$; this is probably related
+to the occurrence of field singularities at the points of contact of neighbouring holes. Such singular fields
+cannot be represented efficiently with a regular function basis. Even so, a relative accuracy of $10^{-4}$ is
+attainable with a reasonable number of basis functions.
+Comparison of figs. 5.3(a) and 5.7 shows that the ultimate relative error of the calculations done for
+!a=2 c
+126 Chapter 5. Numerical methods
+0:4 (a) (b)
+0:2
+0:0
+  X M     X M  
+Figure 5.6 Comparison of the (a) p-polarisation and (b) s-polarisation band structure of the square-lattice
+crystal from fig. 5.5, calculated with the method described here (points) and with the MPB library (lines).
+100
+(a) p pol. (b) s pol. r D 0:45a
+r D 0:49a
+10 5 r D 0:50a
+10 10 r D 0:45a
+r D 0:49a
+r D 0:50a
+10 15
+0 50 100 150 200 0 50 100 150 200
+L L
+Figure 5.7 Convergence of the magnitude of the Bloch vector $\vec k$ of the state located on the $\Gamma M$ segment in
+the first Brillouin zone of the square-lattice PC shown in fig. 5.5(a) for (a) p polarisation and (b) s polarisation.
+The frequency was fixed to: (a) $\omega = 0.38 \times 2\pi c/a$ for $r = 0.45a$; $\omega = 0.40 \times 2\pi c/a$ for $r = 0.49a$; and
+$\omega = 0.47 \times 2\pi c/a$ for $r = 0.50a$; (b) $\omega = 0.35 \times 2\pi c/a$ for $r = 0.45a$; $\omega = 0.40 \times 2\pi c/a$ for $r = 0.49a$; and
+$\omega = 0.40 \times 2\pi c/a$ for $r = 0.50a$. In all these cases, $k \approx 0.25 \times 2\pi/a$.
+the square-lattice PC is slightly larger than in the hexagonal-lattice case. This is probably caused by the
+fact that the spread of the radial coordinates of the collocation points placed on a square is greater than
+on a hexagon. Therefore the range of values taken by any given basis function at different collocation
+points is larger in the former case, and this reduces the efficiency of the balancing algorithm.
+The third example to be studied is the PC composed of a hexagonal lattice of “shamrocks”, i.e.,
+patterns of three adjacent circular air holes of radius $0.2a$, shown in fig. 5.8(a). The PC matrix is assumed
+to be magneto-optical, with a tensorial permittivity of the form (4.31) with $\epsilon = (2.5)^2$ and $g = 0.1$; these
+parameters correspond roughly to those of BIG in the infrared range (see section 4.4). In this structure,
+which has already been discussed briefly in section 3.4.3, both the spatial inversion symmetry and the
+time-reversal symmetry of Maxwell’s equations are broken; therefore, it is nonreciprocal and its band
+structure has no centre of symmetry. A particularly striking consequence of this fact is the existence
+of unidirectional band gaps. Such a band gap appears, for instance, in the neighbourhood of frequency
+$\omega = 0.3915 \times 2\pi c/a$. Figure 5.8(b) shows the equifrequency curve at this value of $\omega$. Clearly, there
+exist propagative bands at $k_x = \pi/(3a)$ (close to the $K$ points), whereas there are none at $k_x = -\pi/(3a)$
+(close to the $K'$ points). As noted in ref. 115, a slab of such a PC can be used as an isolator.?
+? As a historical note, we mention that the unidirectional-mirror effect caused by the lifting of the spatial inversion symmetry,
+described in ref. 115, had originally been discovered in the PC shown in fig. 5.8(a). However, it was subsequently found
+that a PC composed of triples of slightly overlapping holes provides a larger unidirectional gap and would be easier to
+manufacture. Such a system cannot be directly handled by the method presented here; therefore, calculations of its band
+Relative error
+!a=2 c
+5.2. Calculation of photonic-crystal band structures with Fourier-Bessel expansions 127
+(a)
+(b) K
+0 M K
+0:50
+a a
+0:25 M M
+r
+0:00
+ 
+K K0
+ 0:25
+M M
+ 0:50
+K0 M K
+ 0:5 0:0 0:5
+a
+kxa=2 
+100 (c)
+10 3
+10 6
+0 50 100 150 200
+L
+Figure 5.8 (a) Geometry of the PC composed of a hexagonal lattice of groups of three adjacent circular holes
+etched in a magneto-optical matrix. The shaded region is the unit cell composed of four hexagonal subcells
+that was used in calculations. (b) p-polarisation equifrequency curve of this crystal at $\omega = 0.3915 \times 2\pi c/a$.
+(c) Convergence of the magnitude of the Bloch vector $\vec k$ of the state located on the $\Gamma M$ segment in the first
+Brillouin zone of this crystal at the same frequency.
+The calculations of the equifrequency curve shown in fig. 5.8(b) were made by dividing the PC’s unit
+cell into four hexagonal subcells outlined in fig. 5.8(a), one of them empty. Owing to the presence of
+field singularities at the cylinder junction points and the offset of the inclusion centres with respect to the
+hexagon centres, which causes a wider spread of the radial coordinates of different collocation points,
+only a moderate relative accuracy of $10^{-5}$ was attained in simulations, as evidenced by the convergence
+plot from fig. 5.8(c). For very large truncation orders ($L \gtrsim 150$) round-off error increasingly corrupts
+the results.
+In section 4.4 another class of PC systems was studied with the method proposed here: waveguides
+embedded in the hexagonal-lattice crystal from fig. 5.2. The band structures of two such waveguides
+are plotted in fig. 4.9. These calculations were done using the supercell technique, with artificial quasi-
+periodic boundary conditions imposed on the segments $\Sigma_1$–$\Sigma_4$ of the supercell shown schematically in
+fig. 5.9.
+structure reported in ref. 115 were performed with the MPB library [188].
+Relative error
+kya=2 
+128 Chapter 5. Numerical methods
+dw
+˙3
+˙2 ˙4
+˙1
+Figure 5.9 Geometry of the supercell used for the calculation of the waveguide dispersion relations shown in
+fig. 4.9.
+5.2.4 Conclusions
+In this section we have presented a method of calculating band structures of 2D PCs composed of circular
+cylinders with the help of Fourier-Bessel expansions. Its cardinal virtue is its high efficiency: owing to the
+exponential convergence of the method, it is possible to achieve a relative accuracy better than $10^{-10}$ at a
+modest computational cost. Therefore the proposed technique can provide extremely accurate reference
+values for the purposes of testing other numerical methods. High accuracy is also invaluable in studies
+of tiny effects, such as the nonreciprocity induced by a static magnetic field at optical frequencies.
+For PCs whose unit cell need not be divided into subcells, the method has an extremely simple imple-
+mentation. On the other hand, if multiple subcells are present, the necessary bookkeeping can be tricky;
+however, it should be possible to automatise the imposition of the appropriate boundary conditions to
+a certain degree. Disadvantages of the technique in question lie primarily in its restriction to systems
+containing circular inclusions and in the degradation of its accuracy for subcells whose shape deviates
+markedly from that of a circle concentric with the embedded inclusion. This latter problem might pos-
+sibly be alleviated with more advanced matrix-pair balancing algorithms, such as those presented in
+ref. 189.
+5.3 Finite-element simulations of three-dimensional axisymmetric cavities
+5.3.1 Introduction
+In this section we shall describe the finite-element (FE) method used to calculate the eigenmodes of open
+3D axisymmetric cavities containing gyrotropic materials. This technique was used to obtain the results
+presented in section 4.6.
+There are two major approaches to FE simulations of axisymmetric systems [60, p. 912–913]. Early
+researchers [190, 191] made use of the possibility of expressing all the components of the electromag-
+netic fields EE and HE in such systems in terms of the so-called coupled azimuthal potentials E and
+H , which were subsequently discretised with standard nodal FEs. However, Maxwell’s equations
+written in terms of these potentials have nonphysical singularities at certain radii, whose presence affects
+adversely the accuracy of calculations.
+In 1993, Lee et al. [192] proposed an alternative approach to the problem of finding the eigenmodes
+of a closed axisymmetric cavity. They formulated the equations in terms of the two meridional ($\rho$ and $z$)
+components of the electric field, expanded into curl-conforming vector elements, and the electric az-
+imuthal potential E , expanded into nodal elements. The boundary conditions on the z axis were not
+yet treated in a sophisticated way. Therefore, the expressions for the elements of the matrices repre-
+senting the discretised equations contained singular integrals, whose computation can be numerically
+demanding. Later, Chinellato [193] established a solid mathematical foundation for this approach, intro-
+ducing also a set of carefully crafted techniques for the calculation of the singular integrals. Combined
+with a PML-based truncation of the computational domains, this method was used for the determina-
+tion of the eigenmodes of open dielectric axisymmetric resonators [194]. Hiptmair and Ledger [195]
+5.3. Finite-element simulations of three-dimensional axisymmetric cavities 129
+extended it to FEs of arbitrary order, so-called hp FEs, which make it possible to obtain exponential convergence,
+even if field singularities are present, by combining mesh refinement with an increase of the element
+order.
+In the meantime, however, it had been shown that the enforcement of the boundary conditions on
+the z axis is facilitated if a particular change of variables is made so that the vector FEs are used to
+expand a specific combination of the azimuthal and meridional components of EE rather than the “pure”
+meridional part [196, 197]. This change of variables removes also all singular integrals. Greenwood and
+Jin applied this idea to simulations of wave scattering [51] and radiation [198] by axisymmetric bodies,
+using PMLs to truncate the computational domain. Finally, Venkatarayalu [52] proposed an algorithm
+of elimination of unwanted static (zero-frequency) cavity eigenmodes from the FE approximation space,
+which is reputed to accelerate the convergence of iterative eigenvalue solvers.
+The particular variant of the axisymmetric FE method implemented during this thesis combines el-
+ements of several works cited above. It is probably closest to that of Greenwood and Jin [51]: vector
+FEs are used to expand a superposition of the azimuthal and meridional components of EE; exponential
+Fourier expansions in the azimuthal direction are used rather than trigonometric ones; and the computa-
+tional domain is truncated with PMLs. On the other hand, unlike Greenwood and Jin, we look for the
+eigenmodes of the modelled system rather than its response to an incident field; thus, in a manner similar
+to that of Venkatarayalu [52], we derive an eigenvalue problem rather than an inhomogeneous system of
+equations. Finally, like Hiptmair and Ledger [195], we use relatively high-order FE expansions in order
+to improve the efficiency of calculations. The original contribution of our work is the extension of the
+method to the case of media with gyrotropic material properties. Before, it had been formulated only for
+diagonal permittivity and permeability tensors, which are used to represent PMLs adapted to cylindrical
+coordinates [51, 53, 54].
+In the next subsection we present the derivation of our algorithm. Some issues, in particular the
+manner of boundary condition enforcement on the z axis, are discussed in rather more detail than has
+been done in the literature [51, 52, 196].? We hope that their pedagogical derivation here will be useful for
+future researchers intending to use or program the FE method for axisymmetric structures. Subsection
+5.3.3 is devoted to the numerical implementation of the proposed technique. Finally, in subsection 5.3.4
+we evaluate its accuracy.
+Several examples of the application of the method to the calculation of the eigenmodes of specific
+cavities can be found in section 4.6.
+5.3.2 Formulation
+Axisymmetric systems We begin by defining precisely what we mean by an axisymmetric structure.
+A system characterised by position-dependent permittivity and permeability tensors is said to be axisym-
+metric if the representations of these tensors in cylindrical coordinates $(\rho, \phi, z)$ are independent of
+the azimuthal coordinate $\phi$. It is instructive to check in what circumstances a tensor field whose Carte-
+sian components are constant in some area of space stays independent of $\phi$ when it is transformed to
+cylindrical coordinates. Consider, for instance, the permittivity tensor $\hat\epsilon$. Its Cartesian components are
+defined by the relation
+\[
+\begin{bmatrix} D_x \\ D_y \\ D_z \end{bmatrix}
+= \begin{bmatrix} \epsilon_{xx} & \epsilon_{xy} & \epsilon_{xz} \\ \epsilon_{yx} & \epsilon_{yy} & \epsilon_{yz} \\ \epsilon_{zx} & \epsilon_{zy} & \epsilon_{zz} \end{bmatrix}
+\begin{bmatrix} E_x \\ E_y \\ E_z \end{bmatrix}, \tag{5.35}
+\]
+? We have not had access to ref. 197, in which this topic is probably also considered.
+130 Chapter 5. Numerical methods
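+where $\vec E \equiv (E_x, E_y, E_z)^T$ is the electric field and $\vec D \equiv (D_x, D_y, D_z)^T$ the electric displacement.
+Since the Cartesian components of a vector $\vec F$ are related to the cylindrical ones by
+\[
+\begin{bmatrix} F_x \\ F_y \\ F_z \end{bmatrix}
+= \begin{bmatrix} \cos\phi & -\sin\phi & 0 \\ \sin\phi & \cos\phi & 0 \\ 0 & 0 & 1 \end{bmatrix}
+\begin{bmatrix} F_\rho \\ F_\phi \\ F_z \end{bmatrix}, \tag{5.36}
+\]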
+the tensor O in cylindrical coordinates will take the form
+2   3 12 32 34cos sin 05 4xx xy xz54cos   sin 0O.cyl/ = sin cos 0 yx yy yz sin cos 05
+20 0 1 zx zy 3zzC   2
+0 0 3 1
+1
+= 4 xx yy xy yx 0 5 4 0 0 xz .xy   yx/  5xx C yy 0 C 0 0 yz cos
+2
+2 0 30 2z2z zx zy 0 3 (5.37)
+4 0 0 yz xx   yy xy C yx 0C 10 0   5 sin C 4xz xy C yx  .xx   yy/ 05 cos 2
+2
+2zy  zx 0 30 0 0
+4 1 xy C yx  .xx   yy/ 0C  . 5xx   yy/  .xy C yx/ 0 sin 2:
+2
+0 0 0
+Obviously, in order that $\hat\epsilon^{(\mathrm{cyl})}$ be independent of $\phi$, all the terms proportional to trigonometric functions
+of $\phi$ in the above expression must vanish. This is the case if and only if $\epsilon_{xx} = \epsilon_{yy}$, $\epsilon_{xy} = -\epsilon_{yx}$ and
+$\epsilon_{xz} = \epsilon_{yz} = \epsilon_{zx} = \epsilon_{zy} = 0$. Thus, a permittivity tensor field having a locally constant Cartesian
+representation will be independent of $\phi$ after transformation to cylindrical coordinates if and only if it
+has the form
+\[
+\hat\epsilon^{(\mathrm{Cart})} = \begin{bmatrix} \epsilon_t & ig & 0 \\ -ig & \epsilon_t & 0 \\ 0 & 0 & \epsilon_z \end{bmatrix} \tag{5.38}
+\]
+(the imaginary unit has been introduced into the off-diagonal components purely for future convenience
+and for consistency with other parts of this manuscript). It is worth noting that from eq. (5.37) it follows
+that in this case $\hat\epsilon^{(\mathrm{cyl})} = \hat\epsilon^{(\mathrm{Cart})}$. Obviously, the above reasoning can be repeated for the permeability
+tensor $\hat\mu$.
+In this way we have shown that axisymmetric systems may not contain physical? materials whose
+permittivity or permeability tensors have a form other than (5.38).
+Statement of the problem We seek the (leaky) eigenmodes of an open axisymmetric cavity with
+the given permittivity $\hat\epsilon(\rho, z)$ and permeability $\hat\mu(\rho, z)$ (in the rest of this section, components of material
+property tensors will be assumed to be given in cylindrical coordinates unless mentioned otherwise), ful-
+filling Sommerfeld’s boundary conditions [60, p. 294] at infinity. Since it is not possible to discretise
+the whole space $\mathbb{R}^3$ with FEs, simulations will be done on the finite cylindrical domain
+\[
+\Omega' \equiv \{(\rho, \phi, z) \mid 0 \le \rho \le R \text{ and } 0 \le \phi < 2\pi \text{ and } Z_- \le z \le Z_+\}. \tag{5.39}
+\]
+? This conclusion does not apply to “numerical” media such as PMLs, which need not have piecewise-constant Cartesian
+representations of the permittivity and permeability tensors.
+5.3. Finite-element simulations of three-dimensional axisymmetric cavities 131
+In order to suppress spurious reflections on the boundaries of $\Omega'$, its surface will be coated with PMLs,
+treated numerically as special anisotropic media, whose nature will be specified later in this section. On
+the whole surface of $\Omega'$ perfect-electric-conductor boundary conditions will be imposed.
+Wave equation We shall now demonstrate that the independence of $\hat\epsilon$ and $\hat\mu$ from $\phi$ allows one to convert
+the vector wave equation for the electric field $\vec E$ in $\Omega'$ into an infinite set of decoupled equations for the
+restriction of $\vec E$ to a single meridional plane of $\Omega'$.
+Eliminating the magnetic field $\vec H$ from the time-harmonic source-free Maxwell’s equations (1.4a)–
+(1.4b), we get
+\[
+\vec\nabla \times [\hat\mu^{-1} \cdot (\vec\nabla \times \vec E)] = k_0^2\, \hat\epsilon\, \vec E, \tag{5.40}
+\]
+where $k_0 \equiv \omega/c$ is the free-space wave number. The electric field $\vec E$ can be expanded in a Fourier series
+with respect to $\phi$:
+\[
+\vec E(\rho, \phi, z) = \sum_{l \in \mathbb{Z}} \vec E_l(\rho, z)\, e^{il\phi}, \tag{5.41}
+\]
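+so that eq. (5.40) becomes
+\[
+\sum_l \vec\nabla \times \{[\hat\mu(\rho, z)]^{-1} \cdot [\vec\nabla \times \vec E_l(\rho, z)\, e^{il\phi}]\} = k_0^2 \sum_l \hat\epsilon(\rho, z)\, \vec E_l(\rho, z)\, e^{il\phi}. \tag{5.42}
+\]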
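+In cylindrical coordinates,
+\[
+\vec\nabla = \vec\nabla_t + \vec e_\phi\, \rho^{-1} \partial_\phi, \quad\text{where}\quad \vec\nabla_t \equiv \vec e_\rho\, \partial_\rho + \vec e_z\, \partial_z. \tag{5.43}
+\]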
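+Since all functions in eq. (5.42) depend on $\phi$ only through factors $e^{il\phi}$, differentiation with respect to $\phi$ reduces to
+multiplication by $il$. As a result, eq. (5.42) can be rewritten as
+\[
+\sum_l \vec\nabla_l \times \{[\hat\mu(\rho, z)]^{-1} \cdot [\vec\nabla_l \times \vec E_l(\rho, z)]\}\, e^{il\phi} = k_0^2 \sum_l \hat\epsilon(\rho, z)\, \vec E_l(\rho, z)\, e^{il\phi}, \tag{5.44}
+\]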
+where
+\[
+\vec\nabla_l \equiv \vec\nabla_t + \vec e_\phi\, il\rho^{-1}. \tag{5.45}
+\]
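+From the linear independence of the functions $e^{il\phi}$ ($l \in \mathbb{Z}$) on the interval $[0, 2\pi]$ it follows that eq. (5.44)
+is equivalent to a system of decoupled equations on individual Fourier coefficients $\vec E_l(\rho, z)$:
+\[
+\vec\nabla_l \times \{[\hat\mu(\rho, z)]^{-1} \cdot [\vec\nabla_l \times \vec E_l(\rho, z)]\} = k_0^2\, \hat\epsilon(\rho, z)\, \vec E_l(\rho, z) \quad \text{for each } l \in \mathbb{Z}. \tag{5.46}
+\]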
+Thus, the eigenmodes of an axisymmetric system can be classified according to their azimuthal order $l$
+and found by solving separately each of the equations (5.46) for the field $\vec E_l(\rho, z)$ defined on the 2D
+domain
+\[
+\Omega \equiv \{(\rho, z) \mid 0 \le \rho \le R \text{ and } Z_- \le z \le Z_+\}. \tag{5.47}
+\]
+Needless to say, this brings substantial savings in computational time in comparison to the solution of
+the original equation (5.40) defined on the 3D domain $\Omega'$. The geometry of the domain $\Omega$ is shown
+schematically in fig. 5.10.
+132 Chapter 5. Numerical methods
+z
+ 1 eEn
+ZC
+PML
+ 0  1
+˝
+R 
+PML
+Z 
+ 1
+Figure 5.10 Geometry of the domain $\Omega$. Regions filled with PMLs are hatched.
+Weak form The FE method is based on Galerkin’s technique, itself a representative of the class of
+weighted-residual methods for solving differential equations. In these methods, a generalised differential
+eigenvalue problem [like the one from eq. (5.46)] of the general form $\mathcal{A}u = \lambda\mathcal{B}u$, where $\mathcal{A}$ and $\mathcal{B}$ are
+differential operators, $u$ is the unknown function, and $\lambda$ is the eigenvalue, is converted into a system of
+algebraic linear equations by (i) expanding $u$ in a series of known basis functions $u_n$ and (ii) requiring
+that an appropriately defined inner product $(v_n, Ru)$ of a number of test functions $v_n$ with the residual
+$Ru \equiv \mathcal{A}u - \lambda\mathcal{B}u$ vanish. In Galerkin’s method the set of test functions is chosen to be identical
+with that of basis functions [199, section 3.1].
+Boundary conditions can be incorporated into the equation $(v_n, Ru) = 0$ using integration by parts.
+This leads to the weak form of a differential equation, in which the original equation and its associated
+boundary conditions are merged in a single formula.
+We shall now derive the weak form of eq. (5.46). We define the inner product in the usual way,
+\[
+(\vec v, \vec u) \equiv \iint_\Omega \vec v(\rho, z) \cdot \vec u(\rho, z)\, d\Omega. \tag{5.48}
+\]
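+The condition that the inner product of an arbitrary test function $\vec v$ with the residual of eq. (5.46) vanish
+then takes the form (henceforth we omit the subscript $l$ in $\vec E_l$)
+\[
+\iint_\Omega \vec v \cdot \{\vec\nabla_l \times [\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]\}\, d\Omega = k_0^2 \iint_\Omega \vec v \cdot \hat\epsilon\, \vec E\, d\Omega. \tag{5.49}
+\]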
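+It can be shown that the following integration-by-parts formula is valid:
+\[
+\iint_\Omega \vec v \cdot (\vec\nabla_l \times \vec u)\, d\Omega = \iint_\Omega (\vec\nabla_l \times \vec v) \cdot \vec u\, d\Omega - \oint_{\partial\Omega} (\vec v \times \vec u) \cdot \vec e_n\, dl; \tag{5.50}
+\]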
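+here, $\vec v$ and $\vec u$ are arbitrary sufficiently regular functions, $\partial\Omega$ is the boundary of $\Omega$, and $\vec e_n$ denotes the
+unit vector normal to $\partial\Omega$ and directed outwards. Applying this formula to eq. (5.49), we get
+\[
+\iint_\Omega (\vec\nabla_l \times \vec v) \cdot \hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)\, d\Omega - \oint_{\partial\Omega} \{\vec v \times [\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]\} \cdot \vec e_n\, dl = k_0^2 \iint_\Omega \vec v \cdot \hat\epsilon\, \vec E\, d\Omega. \tag{5.51}
+\]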
+Later in this subsection we shall use the boundary conditions to dispense with the contour integral in the
+above equation.
+5.3. Finite-element simulations of three-dimensional axisymmetric cavities 133
+Boundary conditions The contour $\partial\Omega$ can be divided into two parts: that lying on the $z$ axis, denoted
+henceforth $\Gamma_0$, and the rest, denoted $\Gamma_1$ (see fig. 5.10). The segment $\Gamma_1$ is a subset of the surface of the
+original 3D domain $\Omega'$. Therefore the boundary condition imposed on it has already been specified to
+be of the perfect-electric-conductor type. In contrast, the segment $\Gamma_0$ does not belong to the surface
+of $\Omega'$, and the boundary conditions on it have still to be determined. They will follow from the physical
+requirement that the limits $\lim_{\rho\to 0} \vec E(\rho, \phi, z)$ and $\lim_{\rho\to 0} \vec H(\rho, \phi, z)$ exist and be independent of $\phi$
+for all $z \in [Z_-, Z_+]$.
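+For an eigenmode of a given order $l$, $\vec E(\rho, \phi, z) = \vec E(\rho, z)\, e^{il\phi}$. Using eq. (5.36) and rewriting $\cos\phi$
+and $\sin\phi$ in terms of the exponential functions $e^{\pm i\phi}$, we obtain that
+$$E_x(\rho, \phi, z) = \frac{1}{2}\{[E_\rho(\rho, z) + iE_\phi(\rho, z)]\, e^{i(l+1)\phi} + [E_\rho(\rho, z) - iE_\phi(\rho, z)]\, e^{i(l-1)\phi}\}, \tag{5.52a}$$
+$$E_y(\rho, \phi, z) = \frac{1}{2i}\{[E_\rho(\rho, z) + iE_\phi(\rho, z)]\, e^{i(l+1)\phi} - [E_\rho(\rho, z) - iE_\phi(\rho, z)]\, e^{i(l-1)\phi}\}, \tag{5.52b}$$
+$$E_z(\rho, \phi, z) = E_z(\rho, z)\, e^{il\phi}. \tag{5.52c}$$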
+Thus the limits of these expressions with $\rho \to 0$ exist and are independent of $\phi$ only if
+for $l = 0$: (a) $E_\rho(0, z) = 0$ and (b) $E_\phi(0, z) = 0$; (5.53)
+for $|l| = 1$: (a) $E_\rho(0, z) + il E_\phi(0, z) = 0$ and (b) $E_z(0, z) = 0$; (5.54)
+for $|l| > 1$: (a) $E_\rho(0, z) = 0$, (b) $E_\phi(0, z) = 0$ and (c) $E_z(0, z) = 0$. (5.55)
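+Turning now to the magnetic field, from eq. (1.4a) we get
+$$\vec H(\rho, \phi, z) = [i\omega\mu_0\hat\mu(\rho, z)]^{-1} \cdot [\vec\nabla \times \vec E(\rho, \phi, z)] = [i\omega\mu_0\hat\mu(\rho, z)]^{-1} \cdot [\vec\nabla_l \times \vec E(\rho, z)]\, e^{il\phi}. \tag{5.56}$$
+Reasoning analogously as in the case of the electric field, we obtain the conditions
+for $l = 0$: (a) $[\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]_\rho(0, z) = 0$ and (b) $[\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]_\phi(0, z) = 0$; (5.57)
+for $|l| = 1$: (a) $[\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]_\rho(0, z) + il\,[\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]_\phi(0, z) = 0$ and
+(b) $[\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]_z(0, z) = 0$; (5.58)
+for $|l| > 1$: (a) $[\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]_\rho(0, z) = 0$, (b) $[\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]_\phi(0, z) = 0$ and
+(c) $[\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)]_z(0, z) = 0$. (5.59)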
+Finite-element expansions From now on we restrict our attention to the case $|l| \ge 1$. The derivations
+go slightly differently for modes with order $l = 0$, and such modes are less interesting for us, since
+they do not exhibit the twofold degeneracy required in a cavity forming part of a circulator. Following
+refs. 51, 196, 197 and 52, we introduce the following change of variables:
+EE  eE E C eE E = .il/ 1.eE E   EE 0t   z z   t/: (5.60)
+We expand the azimuthal component of EE into nodal FE basis functions u0n.; z/ (n = 1; 2; : : : ; N):
+XN
+E = E
+0
+nun; (5.61)
+n=1
+and the new field EE 0t, tangential to the meridional plane z, into curl-conforming vector FE basis func-
+tions uE0tn.; z/ (n = 1; 2; : : : ; Nt):
+E 0 XNtEt = E 0 0tnuEtn: (5.62)
+n=1
+134 Chapter 5. Numerical methods
+The coefficients $E_{\phi n}$ and $E'_{tn}$ are the unknowns to be determined. The restrictions of the functions
+$u'_{\phi n}$ and of both components of $\vec u'_{tn}$ to any element are polynomials in $\rho$ and $z$. The functions $u'_{\phi n}$ are
+continuous on $\Omega$, whereas $\vec u'_{tn}$ have the property that their tangential components are continuous across
+element borders; as a result, $\vec\nabla_t \times \vec u'_{tn}$ is finite everywhere.
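+Gathering together eqs. (5.60)–(5.62), we thus obtain the following FE expansion of the electric
+field $\vec E$,
+$$\vec E = [\vec e_\phi + (il)^{-1}\vec e_\rho]\, E_\phi - (il)^{-1}\rho\,\vec E'_t = \sum_{n=1}^{N_\phi} E_{\phi n}\, \vec u_{\phi n} + \sum_{n=1}^{N_t} E'_{tn}\, \vec u_{tn}, \tag{5.63}$$
+in terms of the azimuthal basis functions
+$$\vec u_{\phi n} \equiv [\vec e_\phi + (il)^{-1}\vec e_\rho]\, u'_{\phi n} \quad (n = 1, 2, \ldots, N_\phi) \tag{5.64}$$
+and the meridional basis functions
+$$\vec u_{tn} \equiv -(il)^{-1}\rho\,\vec u'_{tn} \quad (n = 1, 2, \ldots, N_t). \tag{5.65}$$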
+Imposition of boundary conditions We shall now demonstrate that the chosen form of FE expansions
+allows us to impose conditions (5.53) and (5.57) in a simple way, as well as to remove from the
+integrals in eq. (5.51) all singular weights, stemming from the presence of the term $\vec e_\phi\, il\rho^{-1}$ in definition
+(5.45) of $\vec\nabla_l$. We shall assume that close to the $z$ axis the tensor $\hat\mu$ has the gyrotropic form
+$$\hat\mu = \begin{bmatrix} \mu_t & i\mu_g & 0 \\ -i\mu_g & \mu_t & 0 \\ 0 & 0 & \mu_z \end{bmatrix}. \tag{5.66}$$
+As will be shown in section 5.3.3, this is the case even if PMLs are present.
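+We begin by expressing $E_\rho$, $E_z$ and all the components of $\vec\nabla_l \times \vec E$ in terms of $E_\phi$ and $\vec E'_t$. Using eq.
+(5.60), after some straightforward algebra we obtain
+$$E_\rho = (il)^{-1}(E_\phi - \rho E'_\rho), \tag{5.67a}$$
+$$E_z = -(il)^{-1}\rho E'_z, \tag{5.67b}$$
+$$(\vec\nabla_l \times \vec E)_\rho = -\partial_z E_\phi - E'_z, \tag{5.67c}$$
+$$(\vec\nabla_l \times \vec E)_\phi = (il)^{-1}[\partial_z E_\phi + E'_z - \rho(\partial_z E'_\rho - \partial_\rho E'_z)], \tag{5.67d}$$
+$$(\vec\nabla_l \times \vec E)_z = \partial_\rho E_\phi + E'_\rho. \tag{5.67e}$$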
+Owing to the regularity properties of the basis functions used to expand the fields $E_\phi$ and $\vec E'_t$, discussed
+above, the limits of expressions (5.67) with $\rho \to 0$ exist and are equal to
+$$E_\rho(0, z) = (il)^{-1} E_\phi(0, z), \tag{5.68a}$$
+$$E_z(0, z) = 0, \tag{5.68b}$$
+$$(\vec\nabla_l \times \vec E)_\rho(0, z) = -(\partial_z E_\phi)(0, z) - E'_z(0, z), \tag{5.68c}$$
+$$(\vec\nabla_l \times \vec E)_\phi(0, z) = (il)^{-1}[(\partial_z E_\phi)(0, z) + E'_z(0, z)], \tag{5.68d}$$
+$$(\vec\nabla_l \times \vec E)_z(0, z) = (\partial_\rho E_\phi)(0, z) + E'_\rho(0, z). \tag{5.68e}$$
+Let us now study the cases $|l| = 1$ and $|l| > 1$ in turn.
+For $|l| = 1$, conditions (5.54) on the electric field on the $z$ axis are satisfied automatically: the
+fulfilment of condition (5.54b) follows directly from eq. (5.68b), while that of condition (5.54a) is the
+5.3. Finite-element simulations of three-dimensional axisymmetric cavities 135
+consequence of eq. (5.68a) and the observation that $l = l^{-1}$ if $|l| = 1$. The satisfaction of condition
+(5.58a) also follows from eqs. (5.68c) and (5.68d), as can be verified by hand (the assumption that $\hat\mu$ is
+gyrotropic on the $z$ axis is crucial here). In contrast, condition (5.58b) is not met automatically, and it
+will need to be imposed weakly with the help of the contour-integral term in eq. (5.51), as will be demonstrated
+below.
+For $|l| > 1$, only condition (5.55c) is automatically fulfilled, by virtue of eq. (5.68b). To satisfy
+conditions (5.55a), (5.55b), (5.59a) and (5.59b), homogeneous Dirichlet boundary conditions on $E_\phi$ and
+$E'_z$ on $\Gamma_0$ must explicitly be imposed by removing from the series (5.63) the functions $\vec u_{\phi n}$ and $\vec u_{tn}$
+whose $\phi$ or $z$ components are nonzero on $\Gamma_0$. As in the case $|l| = 1$, the remaining condition (5.59c) will
+be imposed weakly.
+For all values of $l$, of course, the perfect-electric-conductor boundary conditions $\vec e_n \times \vec E = 0$ on $\Gamma_1$
+must also be imposed; this can be done in the manner described in the previous paragraph, by removing
+appropriate terms from expansion (5.63).
+We are now ready to tackle the contour integral from eq. (5.51). The integration path $\partial\Omega$ is the sum
+of $\Gamma_0$ and $\Gamma_1$; let us consider first the latter part of this contour. From the identity $(\vec a \times \vec b) \cdot \vec c = (\vec c \times \vec a) \cdot \vec b$,
+where $\vec a$, $\vec b$ and $\vec c$ are arbitrary vectors, we get
+Z Z
+fvE  ŒO 1  .rE EEl /g  eEn dl = .vE  eE n/  O 1  .rE l EE/ dl: (5.69)
+ 1  1
+But since in Galerkin's method the set of test functions is identical with that of basis functions and,
+as we have said above, the latter will be chosen so as to fulfil the perfect-electric-conductor boundary
+conditions on $\Gamma_1$, the cross product $\vec v \times \vec e_n$ will vanish on $\Gamma_1$ and this part of the integration path will
+bring no contribution to the integral. Integration over $\Gamma_0$ is more interesting. Using the aforementioned
+identity one more time, we convert the integral to the form
+Z Z
+fvE  ŒO 1  .rE l EE/g  eEn dl = vE  fŒO 1  .rE El E/  eEng dl: (5.70)
+ 0  0
+Since on $\Gamma_0$ the unit vector $\vec e_n = -\vec e_\rho$,
+Z Z Z
+fvE ŒO 1  .rE l EE/g  eEn dl =   ŒO 1  .rE l EE/ zv dlC ŒO 1  .rE El E/ vz dl: (5.71)
+ 0  0  0
+By conditions (5.58b) and (5.59c), for all $|l| \ge 1$ the $z$ component of $\hat\mu^{-1} \cdot (\vec\nabla_l \times \vec E)$ should vanish on $\Gamma_0$;
+hence, the first term on the right-hand side of eq. (5.71) will approach zero as the FE approximation of a
+given cavity eigenmode tends to the true solution. Therefore, we shall omit this term from the discretised
+equation (5.51). On the other hand, the second term will vanish because, as we have said above, the
+chosen FE expansions satisfy automatically the condition that $E_z = 0$ on $\Gamma_0$ [conditions (5.54b) and
+(5.55c)]; hence, $v_z$ will disappear on this part of the integration contour.
+In this way we have shown that the contour integral can be dropped from the weak form (5.51) of the
+vector wave equation of an axisymmetric system. We arrive thus at the final form of this equation:
+“ “
+.rE  vE/  O 1  .rE EE/ d˝ = k2 vEl l 0  O EE d˝: (5.72)
+˝ ˝
+Conversion into algebraic eigenvalue problem In order to convert eq. (5.72) into a system of
+algebraic equations, we write it separately for each test function vE = uEn (n = 1; 2; : : : ; N) and vE = uEtn
+136 Chapter 5. Numerical methods
+($n = 1, 2, \ldots, N_t$), substituting for $\vec E$ expansion (5.63). We assume the cylindrical representation of the
+permittivity tensor to have the form
+$$\hat\epsilon = \begin{bmatrix} \epsilon_\rho & i\epsilon_g & 0 \\ -i\epsilon_g & \epsilon_\phi & 0 \\ 0 & 0 & \epsilon_z \end{bmatrix}, \tag{5.73}$$
+and the permeability tensor to be diagonal,
+$$\hat\mu = \begin{bmatrix} \mu_\rho & 0 & 0 \\ 0 & \mu_\phi & 0 \\ 0 & 0 & \mu_z \end{bmatrix}, \tag{5.74}$$
+with the additional constraint that $\mu_\rho = \mu_\phi$ close to the $z$ axis, which is necessary for the boundary con-
+ditions on that axis to be met.? The reader will certainly have noted that we have let the tensors $\hat\epsilon$ and $\hat\mu$
+take a more general form than the gyrotropic one from eq. (5.38). This is because we allow for the pres-
+ence of PMLs, whose material properties need not have a piecewise-constant Cartesian representation.
+After some algebra, we obta"in the following generalised eigenvalueO O #" E # " O O #
+p"roble#m:
+A At E E 2 B Bt E
+O O NE 0 = k0 O O NE 0 ; (5.75)At Att EN Bt t Btt EN t
+where $\underline{E}_\phi$ and $\underline{E}'_t$ denote the column vectors of coefficients $E_{\phi n}$ and $E'_{tn}$, respectively (the underbars
+have been added to distinguish these symbols from those denoting components of $\vec E$), whereas the entries
+of matrices $\hat A_{\alpha\beta}$ and $\hat B_{\alpha\beta}$ ($\alpha, \beta = \phi, t$) are given by
+.AO / = . 1@ u0 @ u0 C  1@ u0 @ u0 C l 2 1@ u0 @ u0 mn   z z z z /  d dz; (5.76a)
+“ z m n  m n  m n˝
+.AO / = f 1@ u0 u0 C  1@ u0 u0t mn z  m n  z m zn
+˝
+C l 2 1@ u0 Œu0   .rE  uE0 z m zn t tn/zg  d dz; (5.76b)
+.AOt/mn =“.AOt/nm; (5.76c)
+.AO / = f 1u0 u0 C  1u0 u0tt mn z m n  zm zn
+˝
+“C l 2 1 0 E 0 0 E 0 Œuzm   .rt  uEtm/zŒuzn   .rt  uEtn/zg  d dz; (5.76d)
+.BO / = Œ.l 2   2l 1 mn  g C /u0 u0   d dz; (5.76e)
+“ m n˝
+.BO / = Œ. l 2 C l 1 /u0 u0  2t mn  g m n d dz; (5.76f)
+˝
+.BOt/mn = .“BOt/nm; (5.76g)
+.BO / = l 2. u0 u0 C  u0 u0 / 3tt mn  m n z zm zn d dz: (5.76h)
+˝
+In these formulas $u'_{\rho n}$ and $u'_{zn}$ denote the $\rho$ and $z$ components of the basis function $\vec u'_{tn}$. It has been
+assumed that all the functions $u'_{\phi n}$ and $\vec u'_{tn}$ are real-valued.
+? It is equally possible to handle the slightly more general case with  =   ¤ 0, at the cost of more complicated
+formulas.
+5.3. Finite-element simulations of three-dimensional axisymmetric cavities 137
+5.3.3 Numerical implementation
+Software We have implemented the method presented in the previous subsection using the Hermes
+C++ library [55, 56], which significantly facilitates the development of FE-method-based codes. First,
+it provides ready-made implementations of commonly used classes of FEs, including standard nodal
+FEs and vector curl-conforming FEs, up to the polynomial order 10. Both triangular and quadrilateral,
+recti- and curvilinear elements are available. Second, the library completely automatises the matrix
+assembly, allowing also to impose Dirichlet and Neumann boundary conditions on selected portions
+of the computational domain’s boundary. In principle, a user of Hermes needs only to write functions
+calculating the integrals occurring in the weak form of the differential equation at hand and to specify
+the geometry of the computational domain along with the boundary conditions.
+Meshing A characteristic feature of axisymmetric cavities produced by etching multilayer structures
+is that the material interfaces in any meridional plane are almost always parallel to the $\rho$ or $z$ axis. This
+is the case with all the structures studied in section 4.6. Therefore we have meshed the domain $\Omega$ with
+rectangular FEs with sides parallel to $\vec e_\rho$ and $\vec e_z$. The process of mesh generation for a typical cavity goes
+as follows. In the first step, $\Omega$ is divided into as many conforming elements as are necessary to ensure that
+each interface between two different materials coincides with an interelemental boundary. The elements
+created in this way are subsequently subdivided into smaller ones with side lengths approximately equal
+to a predefined constant $h_\mathrm{ideal}$. If desired, the resulting mesh is further uniformly refined by splitting
+each element into quarters. This step can be repeated as many times as necessary.
+FE expansions The unknown fields $E_\phi$ and $\vec E'_t$ are expanded into hierarchical polynomial bases pro-
+vided by Hermes. The expansion order $p$, defined as the maximum degree of the polynomials included
+in these expansions, is taken to be the same in all elements.
+Quadratures All the matrix entries (5.76) are calculated with Gauss-Legendre quadratures. In ele-
+ments containing materials with constant $\hat\epsilon$ and $\hat\mu$, we employ quadratures of the minimum order neces-
+sary to ensure their exactness (for the given expansion order $p$). In elements containing PMLs, whose
+material properties depend on the position in a non-polynomial way (see below), the quadrature order is
+chosen as greater by ten than that which would ensure exact integration for constant $\hat\epsilon$ and $\hat\mu$.
+Eigenvalue problem solving To solve the complex sparse non-symmetric generalised eigenvalue
+problem (5.75), we have used the Krylov-Schur iterative sparse eigenvalue solver implemented in the
+SLEPc library [57–59]. Hermes provides interfaces to several popular sparse linear equation solvers;
+unfortunately, at present it does not offer integration with any eigenvalue solvers. Therefore we have
+written a custom interface between Hermes and SLEPc.
+The vector wave equation (5.40) incorporates Gauss's law $\vec\nabla \cdot (\hat\epsilon\vec E) = 0$, but only if $k_0 \ne 0$ [200]. As
+a result, eq. (5.75), derived from (5.40), possesses a large cluster of spurious static solutions that do not
+obey Gauss’s law. Therefore even if the lowest-frequency eigenmodes of a given cavity are desired, they
+cannot be found by using an iterative eigenvalue solver to find a few lowest-magnitude eigenvalues of
+(5.75). Rather, a shift-and-invert transformation of (5.75) must be used to bring the part of its spectrum
+closest to a prescribed shift  into the neighbourhood of zero, so that the eigenmodes belonging to this
+part of the spectrum may be found by the iterative algorithm [59]. Such spectral transformations are
+handled transparently by SLEPc.
+It is possible to modify the bases used for field expansions so as to eliminate altogether the spuri-
+ous static solutions [201]. Another possibility consists in modifying an iterative eigenvalue solver so
+as to prevent it from converging to a solution violating Gauss’s law. This technique has recently been
+demonstrated by Venkatarayalu [52]. Although these approaches probably improve the efficiency of
+138 Chapter 5. Numerical methods
+z
+ 1
+ZC
+PML dPML
+ 0 dsup  1
+dsep dPML
+R
+d sub
+PML dPML
+Z 
+ 1
+Figure 5.11 Geometry of an example domain ˝. Darker regions have larger permittivity. PMLs are hatched.
+calculations—in particular, a sparse matrix inversion required by a shift-and-invert transformation is
+avoided—their implementation is quite non-trivial. We have therefore stuck to shift-and-invert transfor-
+mations, which we found to work very reliably.
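+Perfectly matched layers As mentioned in the previous subsection, to suppress spurious reflections
+due to the finite size of the computational domain, the boundary $\Gamma_1$ is coated from inside by PMLs
+of thickness $d_\mathrm{PML}$, as shown in fig. 5.11. We use standard PMLs adapted for cylindrical coordinates,
+which can be interpreted as anisotropic materials with diagonal permittivity and permeability tensors $\hat\epsilon = \epsilon\hat\Lambda$ and $\hat\mu = \mu\hat\Lambda$,
+where $\epsilon$ and $\mu$ are the material parameters of the “real” media adjacent to PMLs and the diagonal tensor
+$\hat\Lambda \equiv \mathrm{diag}(\Lambda_\rho, \Lambda_\phi, \Lambda_z)$ is responsible for the absorbing properties of the PML. Its elements are given by
+[51, 54]
+$$\Lambda_\rho \equiv \frac{S_z\tilde\rho}{S_\rho\,\rho}, \qquad \Lambda_\phi \equiv \frac{S_z S_\rho\,\rho}{\tilde\rho} \qquad\text{and}\qquad \Lambda_z \equiv \frac{S_\rho\tilde\rho}{\rho\, S_z}, \tag{5.77}$$
+where
+$$S_\rho(\rho) \equiv 1 + i s_\mathrm{PML}\left[\frac{U(\rho - (R - d_\mathrm{PML}))}{d_\mathrm{PML}}\right]^2, \tag{5.78a}$$
+$$S_z(z) \equiv 1 + i s_\mathrm{PML}\left[\frac{U((Z_- + d_\mathrm{PML}) - z)}{d_\mathrm{PML}}\right]^2 + i s_\mathrm{PML}\left[\frac{U(z - (Z_+ - d_\mathrm{PML}))}{d_\mathrm{PML}}\right]^2, \tag{5.78b}$$
+$$\tilde\rho(\rho) \equiv \rho + i s_\mathrm{PML}\,\frac{[U(\rho - (R - d_\mathrm{PML}))]^3}{3 d_\mathrm{PML}^2} \tag{5.78c}$$
+and $U(x)$ is $x$ if $x > 0$ and zero otherwise. The real parameter $s_\mathrm{PML}$ is called the PML strength. It is
+worth noting that for $\rho \le R - d_\mathrm{PML}$ we have $S_\rho(\rho) = \tilde\rho(\rho)/\rho = 1$; hence, $\Lambda_\rho = \Lambda_\phi = S_z$, in accord with
+our earlier assumption that the tensor $\hat\mu$ should be gyrotropic close to the $z$ axis.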
+5.3.4 Evaluation of accuracy
+The accuracy of calculations made with the proposed technique is affected by a number of factors, which
+can be divided into two groups. The first of them includes the parameters of the FE expansion itself:
+• typical element size $h$,
+• expansion order $p$.
+5.3. Finite-element simulations of three-dimensional axisymmetric cavities 139
+# rin (nm) rout (nm) # rin (nm) rout (nm)
+1 1236 1443 11 4618 4765
+2 1656 1828 12 4933 5079
+3 2019 2181 13 5246 5392
+4 2363 2519 14 5559 5705
+5 2696 2849 15 5872 6017
+6 3023 3174 16 6184 6329
+7 3346 3496 17 6495 6640
+8 3667 3816 18 6806 6951
+9 3986 4134 19 7117 7262
+10 4303 4450 20 7428 7572
+Table 5.1 Radii of the high-index rings of the G4-type cavity used to test the accuracy of calculations. The
+symbols rin and rout denote the inner and outer radius of a ring, respectively.
+nref p C  
+0 1 1:25199C 0:00612i 1:25194C 0:00610i
+0 2 1:24329C 0:00367i 1:24022C 0:00419i
+0 3 1:25691C 0:00340i 1:25384C 0:00387i
+0 4 1:26034C 0:00333i 1:25728C 0:00379i
+1 1 1:25900C 0:00362i 1:25597C 0:00411i
+1 2 1:26133C 0:00333i 1:25827C 0:00378i
+1 3 1:26148C 0:00331i 1:25842C 0:00376i
+2 1 1:26145C 0:00331i 1:25839C 0:00376i
+2 2 1:26149C 0:00331i 1:25843C 0:00376i
+Table 5.2 Influence of the number of mesh refinements, nref, and the expansion order p on the calculated values
+of the wavelengths ˙ of the counter-rotating modes of the cavity described in the text. The remaining parameters
+were chosen as dsub = dsup = 600 nm, dsep = dPML = 500 nm and sPML = 6.
+The second is formed by the domain truncation parameters:
+• substrate thickness $d_\mathrm{sub}$,
+• superstrate thickness $d_\mathrm{sup}$,
+• distance from the outermost inhomogeneity in the multilayer to the inner boundary of the radial
+PML, $d_\mathrm{sep}$,
+• PML thickness, $d_\mathrm{PML}$,
+• PML strength, $s_\mathrm{PML}$.
+In fig. 5.11 graphical definitions of the first four items from the above list are shown.
+To determine the values of the above parameters required to get a reasonable accuracy, we have
+studied the influence of their variation on the calculated values of the wavelengths $\lambda_+$ and $\lambda_-$ of the
+modes with azimuthal order $l = 10$ and $-10$ of a particular G4-type cavity (see section 4.6) containing
+20 high-index rings, whose radii are listed in table 5.1.
+We began by testing the dependence of $\lambda_\pm$ on $h$ and $p$. The former was varied as follows: first, in the
+way described in subsection 5.3.3, we generated an initial mesh composed of rectangular elements with
+side lengths roughly equal to $h_\mathrm{ideal} = 150$ nm, and subsequently we refined it uniformly $n_\mathrm{ref}$ times. Table
+5.2 lists the values of $\lambda_\pm$ obtained for a number of combinations $(n_\mathrm{ref}, p)$; the values of the remaining
+parameters are specified in the caption of that table. Clearly, at least one level of refinement is necessary
+to get accurate results. This is probably related to the occurrence of field singularities at the edges of
+140 Chapter 5. Numerical methods
+$d_\mathrm{sub} = d_\mathrm{sup}$ $\lambda_+$ $\lambda_-$
+0.1 1.26135 + 0.00311i 1.25831 + 0.00354i
+0.2 1.26146 + 0.00319i 1.25842 + 0.00364i
+0.3 1.26150 + 0.00325i 1.25845 + 0.00370i
+0.4 1.26150 + 0.00329i 1.25845 + 0.00374i
+0.5 1.26150 + 0.00330i 1.25844 + 0.00376i
+0.6 1.26149 + 0.00331i 1.25843 + 0.00376i
+0.7 1.26148 + 0.00331i 1.25843 + 0.00376i
+0.8 1.26148 + 0.00331i 1.25843 + 0.00376i
+0.9 1.26148 + 0.00331i 1.25842 + 0.00376i
+1.0 1.26148 + 0.00331i 1.25842 + 0.00376i
+Table 5.3 Influence of the substrate and superstrate thicknesses, $d_\mathrm{sub}$ and $d_\mathrm{sup}$ (taken equal to each other) on
+the calculated values of the wavelengths $\lambda_\pm$ of the counter-rotating modes of the cavity described in the text. The
+remaining parameters were chosen as $n_\mathrm{ref} = 1$, $p = 3$, $d_\mathrm{sep} = d_\mathrm{PML} = 500$ nm and $s_\mathrm{PML} = 6$.
+rings; these singularities can be clearly seen on plots of the meridional components ofEE. It is well known
+[202, section 3.3] that the convergence of a FE expansion can be accelerated by an additional refinement
+of the elements at whose corners singularities occur.
+In any case, the data in table 5.2 show that the wavelengths obtained for $(n_\mathrm{ref}, p) = (1, 3)$, $(2, 1)$
+and $(2, 2)$ differ only in the sixth significant digit. Therefore, one can expect them to have absolute
+accuracy of at least 0.1 nm. This is enough for the purposes of the evaluation of the wavelength splitting
+$\lambda_+ - \lambda_-$ between the counter-rotating modes, which is typically on the level of 2–3 nm. For the
+remaining calculations we fixed $n_\mathrm{ref} = 1$ and $p = 3$.
+We studied next the sensitivity of $\lambda_\pm$ to the changes of $d_\mathrm{sub}$ and $d_\mathrm{sup}$, for simplicity taking them
+to be equal. The results, listed in table 5.3, indicate that the influence of these parameters is negligible
+($\lambda_\pm$ does not change by more than 0.03 nm) as soon as they are chosen larger than 100 nm. We decided
+therefore to stay with the originally assigned values, $d_\mathrm{sub} = d_\mathrm{sup} = 600$ nm. We have also calculated $\lambda_\pm$
+as a function of $d_\mathrm{sep}$ ranging from 100 nm to 800 nm, and found all the obtained values to be identical to
+six significant digits. In future calculations we continue to take $d_\mathrm{sep} = 500$ nm.
+Lastly, we evaluated the dependence of $\lambda_\pm$ on the PML parameters, $d_\mathrm{PML}$ and $s_\mathrm{PML}$. We made two
+series of calculations, in which the PML strength was fixed to 6 and 12, respectively, while its thickness
+was varied from 100 to 800 nm. The results are given in table 5.4. Clearly, for both PML strengths the
+wavelengths $\lambda_\pm$ converge quickly to practically the same values ($\pm 0.01$ nm).
+To sum up, the parameters related to the truncation of $\Omega$ have been found to have little effect on the results
+of calculations. Thus, one can be reasonably confident that the data presented in section 4.6, which were
+obtained with $n_\mathrm{ref} = 1$, $p = 3$, $d_\mathrm{sub} = d_\mathrm{sup} = 600$ nm, $d_\mathrm{sep} = d_\mathrm{PML} = 500$ nm and $s_\mathrm{PML} = 6$, are
+accurate to about $\pm 0.05$ nm, which corresponds to a relative error of $4 \times 10^{-5}$.
+5.3. Finite-element simulations of three-dimensional axisymmetric cavities 141
+$s_\mathrm{PML} = 6$ $s_\mathrm{PML} = 12$
+$d_\mathrm{PML}$ $\lambda_+$ $\lambda_-$ $\lambda_+$ $\lambda_-$
+0.1 1.25945 + 0.00388i 1.25617 + 0.00423i 1.26114 + 0.00439i 1.25796 + 0.00488i
+0.2 1.26107 + 0.00385i 1.25793 + 0.00430i 1.26163 + 0.00331i 1.25858 + 0.00378i
+0.3 1.26148 + 0.00350i 1.25841 + 0.00396i 1.26147 + 0.00330i 1.25842 + 0.00375i
+0.4 1.26151 + 0.00334i 1.25845 + 0.00380i 1.26148 + 0.00330i 1.25842 + 0.00376i
+0.5 1.26149 + 0.00331i 1.25843 + 0.00376i 1.26148 + 0.00331i 1.25842 + 0.00376i
+0.6 1.26148 + 0.00331i 1.25843 + 0.00376i 1.26148 + 0.00331i 1.25842 + 0.00376i
+0.7 1.26148 + 0.00331i 1.25843 + 0.00376i 1.26148 + 0.00331i 1.25843 + 0.00376i
+0.8 1.26148 + 0.00331i 1.25842 + 0.00376i 1.26148 + 0.00331i 1.25843 + 0.00376i
+Table 5.4 Influence of the PML thickness $d_\mathrm{PML}$ and PML strength $s_\mathrm{PML}$ on the calculated values of the wave-
+lengths $\lambda_\pm$ of the counter-rotating modes of the cavity described in the text. The remaining parameters were chosen
+as $n_\mathrm{ref} = 1$, $p = 3$, $d_\mathrm{sub} = d_\mathrm{sup} = 600$ nm and $d_\mathrm{sep} = 500$ nm.
+
+Chapter 6
+Conclusions and perspectives
+The work whose results have been presented in this thesis encompasses a fairly wide range of topics,
+concerning mostly, but not exclusively, those related to PCs. Here we attempt to summarise these results,
+putting them in perspective, highlighting those we find the most important, and offering some ideas on
+future work.
+In chapter 2, the most theoretical one in this thesis, we formulated an effective-medium model of
+2D PCs. Using this model, we conducted an in-depth study of the validity of the effective-medium
+description of PCs exhibiting the negative-refraction effect. We believe this to have been the first analysis
+encompassing both the propagative and the evanescent region and not limited to at most a few discrete
+incidence angles. We think we provided convincing arguments that the effective-medium approximation
+of PCs with negative refraction is too simplistic and, therefore, such PCs cannot be used as a drop-in
+replacement of homogeneous negative-index media.
+The rest of the manuscript was more device-oriented. In chapter 3 we presented an algorithm for the
+design of AR gratings for PCs and showed its applicability to certain specific PC components. At the
+same time, we strived to be explicit about its limitations, which stem from its reliance on a number of
+approximations.
+It needs to be stressed that the possibilities offered by the numerical shape optimisation procedure,
+which is the last step of the proposed algorithm, have not been exploited in full in the examples presented
+in section 3.4. For instance, in the case of a flat lens, it is not sufficient that the device pass (almost) all
+the incident energy; creation of a high-quality image requires also that the waves incident at different
+angles arrive on the image plane with appropriate phases. Thus, it might be more judicious to formulate
+the objective function (to be minimised) in terms of the amplitudes and phases of the transmitted waves
+rather than the reflected ones. This would also allow one to optimise the transmission of the evanescent
+waves, and hence, possibly, to overcome the diffraction limit.
+In chapter 4 we reported on our work on magneto-optical circulators. The crucial step was the
+idea of studying closely the class of resonant cavities having the rotational symmetry. It led to the
+formulation of a novel design principle for uniformly magnetised, and therefore manufacturable, cavities
+that nonetheless exhibit a substantial mode frequency splitting. We then initially pursued the beaten
+path of PC-based circulator designs. It was M. Vanwolleghem (Institut d’Electronique Fondamentale,
+Orsay, France) who first suggested testing simpler systems based on uniform waveguides. Despite initial
+problems with securing a sufficient degree of coupling between such waveguides and the central cavity (it
+was not possible to use side-coupling owing to an extreme phase mismatch between the waveguide and
+cavity modes), we finally succeeded by employing butt-coupling instead of side-coupling and optimising
+the shape of the waveguide slot.
+As we have remarked in section 4.5.4, the circulator designed on the basis of 2D calculations did
+not fare well in experiment owing to excessive out-of-plane losses. In March 2010 it was therefore
+deemed necessary to turn to 3D simulations. Good progress has already been made; in particular, at
+143
+144 Chapter 6. Conclusions and perspectives
+the end of section 4.6.2 we presented a 3D cavity with markedly reduced radiation losses. To arrive at
+an experimental demonstration of a working circulator, however, further work is still necessary. The
+optimisation should be repeated using the exact value of the refractive index of the potential coating
+material, silicon nitride. More importantly, we do not understand yet the mechanism for the improvement
+of the mode confinement provided by the optimised cavity. A Bloch-mode-based theory might be able
+to explain this effect. We also hope that it will lead to successful designs—no longer based on the
+effective-index approximation—of uncoated cavities, which should have smaller footprint than coated
+ones, thanks to stronger in-plane mode localisation.
+Even if a satisfactory 3D model of axisymmetric cavities is established in future, some numerical
+optimisation of their geometry may still be necessary, or at least desirable. It is well known that gradient-
+based optimisation techniques are in general more efficient than derivative-free methods, such as the
+NEWUOA algorithm used thus far. It should be quite possible to calculate the derivative of the frequency
+splitting ! of a given cavity over the radius of any particular ring, symbolically denoted r here. The
+derivative of the eigenvalue k20 of the problem eq. (5.75) over r is simple to calculate, at least assuming
+that there are no repeated eigenvalues:
+2 @k @AO @BO 0 = yE    k20  xE; (6.1)@r @r @r
+where xE and yE are the right and left eigenvectors corresponding to k2 and normalised so that yE0 BO xE = 1.
+(See refs. 203 and 204 for a review on the computation of eigenvalue derivatives.) The derivatives of AO
+and BO over r can be evaluated from the explicit formulas (5.76) for their entries.
+An optimised cavity will eventually need to be integrated with the input and output waveguides.
+Which numerical method will be most suitable for the simulation of the complete 3D system is not clear
+yet; some views on this matter have been offered in the conclusions to chapter 4.
+Finally, as noted in section 4.1.3, Yu et al. [155] have recently proposed theoretically an isolator based
+on time-dependent refractive-index modulation. In the structure presented in their article, introduction of
+a boundary separating the modulated and unmodulated parts of the waveguides is needed; this requires
+a precise alignment of the electric field enforcing the modification of the refractive index. It might be
+possible to employ the ideas developed in chapter 4, and in particular the design rule from section 4.3, to
+dispense with the necessity of introducing domains free from the modulating field.
+Bibliography
+[1] R. Nagarajan, C. Joyner, J. Schneider, R.P., J. Bostak, T. Butrie, A. Dentai, V. Dominic, P. Evans,
+M. Kato, M. Kauffman, et al., J. Sel. Top. Quant. Electron. 11, 50 (2005).
+[2] R. Nagarajan, M. Kato, J. Pleumeekers, P. Evans, D. Lambert, A. Chen, V. Dominic, A. Mathur,
+P. Chavarkar, M. Missey, et al., J. Opt. Netw. 6, 102 (2007).
+[3] S. C. Nicholes, M. L. Mašanovic´, B. Jevremovic´, E. Lively, L. A. Coldren, and D. J. Blumenthal,
+J. Lightwave Technol. 28, 641 (2010).
+[4] Infinera’s 400 Gb/s PIC sets new record for integration, http://www.infinera.com/j7/servlet/
+NewsItem?newsItemID=150.
+[5] W. A. Harrison, Solid state theory (Dover, New York, 1980).
+[6] E. Ozbay, Science 311, 189 (2006).
+[7] R. G. Hunsperger, Integrated optics: theory and technology (Springer, New York, 2009).
+[8] E. Yablonovitch, Phys. Rev. Lett. 58, 2059 (1987).
+[9] S. John, Phys. Rev. Lett. 58, 2486 (1987).
+[10] R. D. Meade, A. Devenyi, J. D. Joannopoulos, O. L. Alerhand, D. A. Smith, and K. Kash, J. Appl.
+Phys. 75, 4753 (1994).
+[11] A. Mekis, J. C. Chen, I. Kurland, S. Fan, P. R. Villeneuve, and J. D. Joannopoulos, Phys. Rev.
+Lett. 77, 3787 (1996).
+[12] K. Busch, G. von Freymann, S. Linden, S. Mingaleev, L. Tkeshelashvili, and M. Wegener, Phys.
+Rep. 444, 101 (2007).
+[13] B. Gralak, S. Enoch, and G. Tayeb, in Metamaterials: physics and engineering explorations,
+edited by N. Engheta and R. W. Ziolkowski (Wiley, New York, 2006), chap. 10, pp. 261–283.
+[14] B. Gralak, S. Enoch, and G. Tayeb, J. Opt. Soc. Am. A 17, 1012 (2000).
+[15] H. Kosaka, T. Kawashima, A. Tomita, M. Notomi, T. Tamamura, T. Sato, and S. Kawakami, Appl.
+Phys. Lett. 74, 1212 (1999).
+[16] H. Kosaka, T. Kawashima, A. Tomita, M. Notomi, T. Tamamura, T. Sato, and S. Kawakami, Phys.
+Rev. B 58, R10096 (1998).
+[17] J. B. Pendry, Phys. Rev. Lett. 85, 3966 (2000).
+145
+146 BIBLIOGRAPHY
+[18] N. Fabre, L. Lalouat, B. Cluzel, X. Mélique, D. Lippens, F. de Fornel, and O. Vanbésien, Phys.
+Rev. Lett. 101, 073901 (2008).
+[19] J. Amet, F. I. Baida, G. W. Burr, and M. Bernal, Photonics Nanostruct. Fundam. Appl. 6, 47
+(2008).
+[20] V. G. Veselago, Sov. Phys. Usp. 10, 509 (1968).
+[21] T. Decoopman, G. Tayeb, S. Enoch, D. Maystre, and B. Gralak, Phys. Rev. Lett. 97, 073905
+(2006).
+[22] J. Ushida, M. Tokushima, M. Shirane, A. Gomyo, and H. Yamada, Phys. Rev. B 68, 155115
+(2003).
+[23] A. Efros and A. Pokrovsky, Solid State Commun. 129, 643 (2004).
+[24] R. Biswas, Z. Y. Li, and K. M. Ho, Appl. Phys. Lett. 84, 1254 (2004).
+[25] B. Momeni, A. Asghar Eftekhar, and A. Adibi, Opt. Lett. 32, 778 (2007).
+[26] Z. Lu and D. W. Prather, Opt. Express 15, 8340 (2007).
+[27] R. Pierre and B. Gralak, J. Mod. Opt. 55, 1759 (2008).
+[28] B. Momeni, M. Badieirostami, and A. Adibi, J. Opt. Soc. Am. B 24, 2957 (2007).
+[29] Y. Wu, J. Li, Z.-Q. Zhang, and C. T. Chan, Phys. Rev. B 74, 085111 (2006).
+[30] V. Yannopapas and A. Moroz, J. Phys. Cond. Mat. 17, 3717 (2005).
+[31] V. Yannopapas and N. V. Vitanov, Phys. Rev. B 74, 193304 (2006).
+[32] V. Yannopapas, Phys. Rev. B 75, 035112 (2007).
+[33] G. Scherrer, M. Hofman, W. Śmigaj, B. Gralak, X. Mélique, O. Vanbésien, D. Lippens, C. Dumas,
+B. Cluzel, and F. de Fornel, Appl. Phys. Lett. 97, 071119 (2010).
+[34] Z. Wang and S. Fan, Appl. Phys. B 81, 369 (2005).
+[35] H. Dötsch, N. Bahlmann, O. Zhuromskyy, M. Hammer, L. Wilkens, R. Gerhardt, P. Hertel, and
+A. F. Popkov, J. Opt. Soc. Am. B 22, 240 (2005).
+[36] D. R. Goff, Fiber optic reference guide (Focal Press, Amsterdam, 2002).
+[37] Z. Wang and S. Fan, Opt. Lett. 30, 1989 (2005).
+[38] D. Felbacq, G. Tayeb, and D. Maystre, J. Opt. Soc. Am. A 11, 2526 (1994).
+[39] G. Tayeb and D. Maystre, J. Opt. Soc. Am. A 14, 3323 (1997).
+[40] D. Maystre, S. Enoch, and G. Tayeb, in Electromagnetic theory and applications for photonic
+crystals, edited by K. Yasumoto (CRC Press, Boca Raton, 2005), chap. 1.
+[41] N. Stefanou, V. Karathanos, and A. Modinos, J. Phys. Cond. Mat. 4, 7389 (1992).
+[42] N. Stefanou, V. Yannopapas, and A. Modinos, Comp. Phys. Commun. 113, 49 (1998).
+BIBLIOGRAPHY 147
+[43] N. Stefanou, V. Yannopapas, and A. Modinos, Comp. Phys. Commun. 132, 189 (2000).
+[44] N. A. Nicorovici, R. C. McPhedran, and L. C. Botten, Phys. Rev. E 52, 1135 (1995).
+[45] S. K. Chin, N. A. Nicorovici, and R. C. McPhedran, Phys. Rev. E 49, 4590 (1994).
+[46] K. Ohtaka and Y. Tanabe, J. Phys. Soc. Jpn. 65, 2265 (1996).
+[47] A. Moroz, Phys. Rev. B 51, 2068 (1995).
+[48] R. Pierre, Ph.D. thesis, Institut Fresnel, Marseille (2008).
+[49] J. Yuan and Y. Y. Lu, J. Opt. Soc. Am. A 23, 3217 (2006).
+[50] Y. Huang and Y. Y. Lu, J. Lightwave Technol. 24, 3448 (2006).
+[51] A. D. Greenwood and J. Jin, IEEE Trans. Antennas Propag. 47, 620 (1999).
+[52] N. V. Venkatarayalu, Int. J. Numer. Model. 23, 231 (2010), ISSN 0894-3370.
+[53] J. Jin, The finite element method in electromagnetics (Wiley, New York, 2002).
+[54] F. Teixeira and W. Chew, IEEE Microw. Guided Wave Lett. 7, 371 (1997), ISSN 1051-8207.
+[55] Hermes – higher-order modular finite element system (user’s guide), http://hpfem.org (2010).
+[56] P. Solin, Partial differential equations and the finite element method (Wiley, 2005).
+[57] V. Hernandez, J. E. Roman, and V. Vidal, ACM Trans. Math. Software 31, 351 (2005).
+[58] V. Hernandez, J. E. Roman, E. Romero, A. Tomas, and V. Vidal, http://www.grycap.upv.es/slepc
+(2009).
+[59] V. Hernandez, J. E. Roman, E. Romero, A. Tomas, and V. Vidal, SLEPc Users Manual (2009).
+[60] J. G. Van Bladel, Electromagnetic fields (Wiley, 2007).
+[61] J. D. Jackson, Classical electrodynamics (Wiley, New York, 1998).
+[62] W. Śmigaj and B. Gralak, Phys. Rev. B 77, 235445 (2008).
+[63] W. Śmigaj and B. Gralak, Proc. SPIE 6987, 698726 (2008).
+[64] C. Giacovazzo, ed., Fundamentals of crystallography (Oxford University Press, Oxford, 1992).
+[65] C. G. Someda, Electromagnetic waves (Chapman & Hall, London, 1998).
+[66] S. Boscolo, C. Conti, M. Midrio, and C. G. Someda, J. Lightwave Technol. 20, 304 (2002).
+[67] P. Kuchment, Floquet theory for partial differential equations (Birkhäuser Verlag, Basel, 1993).
+[68] R. Petit, in Electromagnetic theory of gratings, edited by R. Petit (Springer, Berlin, 1980), chap. 1,
+pp. 1–52.
+[69] M. Nevière and E. Popov, Light propagation in periodic media. Differential theory and design
+(Marcel Dekker, New York, 2002).
+[70] Z.-Y. Li and K.-M. Ho, Phys. Rev. B 68, 155101 (2003).
+148 BIBLIOGRAPHY
+[71] L. C. Botten, T. P. White, A. A. Asatryan, T. N. Langtry, C. M. de Sterke, and R. C. McPhedran,
+Phys. Rev. E 70, 056606 (2004).
+[72] E. Istrate, A. A. Green, and E. H. Sargent, Phys. Rev. B 71, 195122 (2005).
+[73] L. Li, J. Opt. Soc. Am. A 13, 1024 (1996).
+[74] P. Vincent, in Electromagnetic theory of gratings, edited by R. Petit (Springer, Berlin, 1980),
+chap. 4, pp. 101–122.
+[75] E. Popov and B. Bozhkov, Appl. Opt. 39, 4926 (2000).
+[76] W. Śmigaj, Master’s thesis, Faculty of Physics, Adam Mickiewicz University in Poznań (2007).
+[77] M. Plihal and A. A. Maradudin, Phys. Rev. B 44, 8565 (1991).
+[78] J. F. Cornwell, Group theory and electronic energy bands in solids (North-Holland, Amsterdam,
+1969).
+[79] K. Sakoda, Optical properties of photonic crystals (Springer, Berlin, 2001).
+[80] M. Tinkham, Group theory and quantum mechanics (McGraw-Hill, New York, 1964).
+[81] Y.-C. Chang, Phys. Rev. B 25, 605 (1982).
+[82] T. Koschny, P. Markoš, D. R. Smith, and C. M. Soukoulis, Phys. Rev. E 68, 065602(R) (2003).
+[83] D. Seetharamdoo, R. Sauleau, K. Mahdjoubi, and A.-C. Tarot, J. Appl. Phys. 98, 3505 (2005).
+[84] T. Koschny, P. Markoš, E. N. Economou, D. R. Smith, D. C. Vier, and C. M. Soukoulis, Phys.
+Rev. B 71, 245105 (2005).
+[85] R. Liu, T. J. Cui, D. Huang, B. Zhao, and D. R. Smith, Phys. Rev. E 76, 026606 (2007).
+[86] K. F. Riley, M. P. Hobson, and S. J. Bence, Mathematical Methods for Physics and Engineering
+(Cambridge University Press, Cambridge, 2006).
+[87] J. A. Dobrowolski, D. Poitras, P. Ma, H. Vakil, and M. Acree, Appl. Opt. 41, 3075 (2002).
+[88] E. B. Grann and M. G. Moharam, J. Opt. Soc. Am. A 13, 988 (1996).
+[89] H. A. Macleod, Thin-film optical filters (Institute of Physics, Bristol, 2001).
+[90] S. J. Orfanidis, Electromagnetic waves and antennas, http://www.ece.rutgers.edu/~orfanidi/ewa
+(2008).
+[91] D. H. Raguin and G. M. Morris, Appl. Opt. 32, 1154 (1993).
+[92] D. H. Raguin and G. M. Morris, Appl. Opt. 32, 2582 (1993).
+[93] R. Bräuer and O. Bryngdahl, Appl. Opt. 33, 7875 (1994).
+[94] H. Kikuta, H. Toyota, and W. Yu, Opt. Rev. 10, 63 (2003).
+[95] S. Xiao, M. Qiu, Z. Ruan, and S. He, Appl. Phys. Lett. 85, 4269 (2004).
+[96] L. C. Botten, T. P. White, C. M. de Sterke, and R. C. McPhedran, Phys. Rev. E 74, 026603 (2006).
+BIBLIOGRAPHY 149
+[97] Z. Li, E. Ozbay, H. Chen, J. Chen, F. Yang, and H. Zheng, J. Phys. D 40, 5873 (2007).
+[98] S.-G. Lee, J.-S. Choi, J.-E. Kim, H.-Y. Park, and C.-S. Kee, Opt. Express 16, 4270 (2008).
+[99] J.-M. Park, S.-G. Lee, H. Y. Park, J.-E. Kim, and M.-H. Lee, J. Opt. Soc. Am. B 26, 1967 (2009).
+[100] Y. Jin and S. He, Phys. Lett. A 360, 461 (2007).
+[101] B. Zhang and M. Y. Li, Eur. Phys. J. D 45, 321 (2007).
+[102] T. Baba and D. Ohsaki, Jpn. J. Appl. Phys. 40, 5920 (2001).
+[103] T. Baba, T. Matsumoto, and M. Echizen, Opt. Express 12, 4608 (2004).
+[104] T. Matsumoto, S. Fujita, and T. Baba, Opt. Express 13, 10768 (2005).
+[105] T. Matsumoto, K. Eom, and T. Baba, Opt. Lett. 31, 2786 (2006).
+[106] F. J. Lawrence, L. C. Botten, K. B. Dossou, and C. M. de Sterke, Appl. Phys. Lett. 93, 121114
+(2008).
+[107] F. J. Lawrence, L. C. Botten, K. B. Dossou, C. M. de Sterke, and R. C. McPhedran, Phys. Rev. A
+80, 023826 (2009).
+[108] J. Witzens, M. Hochberg, T. Baehr-Jones, and A. Scherer, Phys. Rev. E 69, 046609 (2004).
+[109] B. Momeni and A. Adibi, Appl. Phys. Lett. 87, 171104 (2005).
+[110] W. H. Press, B. P. Flannery, S. A. Teukolsky, and W. T. Vetterling, Numerical recipes in C (Cam-
+bridge University Press, 1992).
+[111] W. Śmigaj, B. Gralak, R. Pierre, and G. Tayeb, in SPP4 Surface Plasmon Photonics Conference
+(2009).
+[112] W. Śmigaj, B. Gralak, R. Pierre, and G. Tayeb, Opt. Lett. 34, 3532 (2009).
+[113] D. W. Prather, S. Shi, J. Murakowski, G. J. Schneider, A. Sharkawy, C. Chen, B. L. Miao, and
+R. Martin, J. Phys. D 40, 2635 (2007).
+[114] S. G. Johnson, M. Ibanescu, M. A. Skorobogatiy, O. Weisberg, J. D. Joannopoulos, and Y. Fink,
+Phys. Rev. E 65, 066611 (2002).
+[115] M. Vanwolleghem, X. Checoury, W. Śmigaj, B. Gralak, L. Magdenko, K. Postava, B. Dagens,
+P. Beauvillain, and J.-M. Lourtioz, Phys. Rev. B 80, 121102(R) (2009).
+[116] R. E. Collin, Foundations for microwave engineering (Wiley-IEEE, New York, 2001).
+[117] D. M. Pozar, Microwave engineering (Wiley, New York, 1998).
+[118] F. Olyslager, Electromagnetic waveguides and transmission lines (Oxford University Press, Ox-
+ford, 1999).
+[119] D. D. Stancil and A. Prabhakar, Spin waves. Theory and applications (Springer, New York, 2009).
+[120] Y. Shoji and T. Mizumoto, Opt. Express 15, 13446 (2007).
+150 BIBLIOGRAPHY
+[121] M. Vanwolleghem, private communication (2009).
+[122] B. Vertruyen, R. Cloots, J. S. Abell, T. J. Jackson, R. C. da Silva, E. Popova, and N. Keller, Phys.
+Rev. B 78, 094429 (2008).
+[123] H. Takeda and S. John, Phys. Rev. A 78, 023804 (pages 15) (2008).
+[124] J. Lettieri, V. Vaithyanathan, S. K. Eah, J. Stephens, V. Sih, D. D. Awschalom, J. Levy, and D. G.
+Schlom, Appl. Phys. Lett. 83, 975 (2003).
+[125] M. J. Steel, M. Levy, and R. M. Osgood, J. Lightwave Technol. 18, 1297 (2000).
+[126] A. Figotin and I. Vitebsky, Phys. Rev. E 63, 066609 (2001).
+[127] Z. Yu, Z. Wang, and S. Fan, Appl. Phys. Lett. 90, 121133 (2007).
+[128] A. B. Khanikaev and M. J. Steel, Opt. Express 17, 5265 (2009).
+[129] R. Wolfe, V. J. Fratello, and M. M. Powell, J. Appl. Phys. 63, 3099 (1988).
+[130] R. Wolfe, R. A. Lieberman, V. J. Fratello, R. E. Scotti, and N. Kopylov, Appl. Phys. Lett. 56, 426
+(1990).
+[131] H. Dammann, E. Pross, G. Rabe, and W. Tolksdorf, Appl. Phys. Lett. 56, 1302 (1990).
+[132] F. Auracher and H. H. Witte, Opt. Commun. 13, 435 (1975).
+[133] J. Fujita, M. Levy, R. M. Osgood, L. Wilkens, and H. Dötsch, Appl. Phys. Lett. 76, 2158 (2000).
+[134] N. Kono and M. Koshiba, Opt. Express 13, 9155 (2005).
+[135] O. Zhuromskyy, M. Lohmeyer, N. Bahlmann, P. Hertel, H. Dötsch, and A. F. Popkov, Opt. Quan-
+tum Electron. 32, 885 (2000).
+[136] N. Bahlmann, M. Lohmeyer, O. Zhuromskyy, H. Dötsch, and P. Hertel, Opt. Commun. 161, 330
+(1999).
+[137] N. Kono and Y. Tsuji, J. Lightwave Technol. 22, 1741 (2004).
+[138] W. Zaets and K. Ando, IEEE Photon. Technol. Lett. 11 (1999).
+[139] M. Takenaka and Y. Nakano, in Proceedings of the 11th International Conference on Indium
+Phosphide and Related Materials (1999), pp. 289–292.
+[140] M. Vanwolleghem, W. Van Parys, D. Van Thourhout, R. Baets, F. Lelarge, O. Gauthier-Lafaye,
+B. Thedrez, R. Wirix-Speetjens, and L. Lagae, Appl. Phys. Lett. 85, 3980 (2004).
+[141] W. Van Parys, B. Moeyersoon, D. Van Thourhout, R. Baets, M. Vanwolleghem, B. Dagens, J. De-
+cobert, O. Le Gouezigou, D. Make, R. Vanheertum, et al., Appl. Phys. Lett. 88 (2006).
+[142] T. Amemiya, H. Shimizu, M. Yokoyama, P. N. Hai, M. Tanaka, and Y. Nakano, Appl. Opt. 46,
+5784 (2007).
+[143] H. Hemme, H. Dötsch, and P. Hertel, Appl. Opt. 29, 2741 (1990).
+[144] L. Tang, S. M. Drezdzon, and T. Yoshie, Opt. Express 16, 16202 (2008).
+BIBLIOGRAPHY 151
+[145] S. M. Drezdzon and T. Yoshie, Opt. Express 17, 9276 (2009).
+[146] Z. Wang, Y. D. Chong, J. D. Joannopoulos, and M. Soljačić, Phys. Rev. Lett. 100, 013905 (2008).
+[147] Z. Wang, Y. Chong, J. D. Joannopoulos, and M. Soljačić, Nature 461, 772 (2009).
+[148] W. Śmigaj, J. Romero-Vivas, B. Gralak, L. Magdenko, B. Dagens, and M. Vanwolleghem, Opt.
+Lett. 35, 568 (2010).
+[149] W. Suh, Z. Wang, and S. Fan, IEEE J. Quantum Electron. 40, 1511 (2004).
+[150] Z. Wang and S. Fan, Photonics Nanostruct. Fundam. Appl. 4, 132 (2006).
+[151] N. Kono and M. Koshiba, in Integrated Photonics Research and Applications/Nanophotonics
+(OSA, 2006), p. IMD3.
+[152] N. Kono, K. Kakihara, K. Saitoh, and M. Koshiba, Opt. Express 15, 7737 (2007).
+[153] K. Gallo, G. Assanto, K. R. Parameswaran, and M. M. Fejer, Applied Physics Letters 79, 314
+(2001).
+[154] Z. Yu and S. Fan, Nat. Photonics 3, 91 (2009).
+[155] Z. Yu, G. Veronis, Z. Wang, and S. Fan, Phys. Rev. Lett. 100, 023902 (2008).
+[156] J. D. Joannopoulos, S. G. Johnson, J. N. Winn, and R. D. Meade, Photonic crystals (Princeton
+University Press, Princeton, 2008).
+[157] J. Scheuer, J. Opt. Soc. Am. B 24, 2178 (2007).
+[158] Abramowitz, M. and Stegun, I. A., ed., Handbook of mathematical functions (Dover, New York,
+1970).
+[159] S. Mazoyer, J. P. Hugonin, and P. Lalanne, Phys. Rev. Lett. 103, 063903 (2009).
+[160] W. Śmigaj, J. Opt. Soc. Am. A 24, 3309 (2007).
+[161] Comsol Multiphysics, version 3.5a, RF module user’s guide (2008).
+[162] Y. Tsuji and M. Koshiba, J. Lightwave Technol. 20, 463 (2002).
+[163] L. Magdenko, E. Popova, M. Vanwolleghem, C. Pang, F. Fortuna, T. Maroutian, P. Beauvillain,
+N. Keller, and B. Dagens, Wafer-scale fabrication of magneto-photonic structures in Bismuth Iron
+Garnet thin film, to appear in Microelectron. Eng. (2010).
+[164] M. Hammer and O. V. Ivanova, Opt. Quantum Electron. 41, 267 (2009).
+[165] A. Hessel, in Antenna theory, edited by R. E. Collin and F. J. Zucker (McGraw-Hill, New York,
+1969), vol. 2, chap. 19.
+[166] P. Lalanne, C. Sauvan, and J. P. Hugonin, Laser Photonics Rev. 2, 514 (2008).
+[167] P. Lalanne and J. P. Hugonin, IEEE J. Quantum Electron. 39, 1430 (2003).
+[168] C. Sauvan, G. Lecamp, P. Lalanne, and J. P. Hugonin, Opt. Express 13, 245 (2005).
+152 BIBLIOGRAPHY
+[169] A. Kitagawa and J. Sakai, Phys. Rev. A 80, 033802 (2009).
+[170] K. Srinivasan and O. Painter, Opt. Express 11, 579 (2003).
+[171] K. Srinivasan and O. Painter, Opt. Express 10, 670 (2002).
+[172] D. Englund, I. Fushman, and J. Vučković, Opt. Express 13, 5961 (2005).
+[173] Y. Akahane, T. Asano, B. Song, and S. Noda, Nature 425, 944 (2003).
+[174] E. V. Jull, Aperture antennas and diffraction theory (Peter Peregrinus Ltd., New York, 1981).
+[175] C. Balanis, Antenna theory, analysis and design (Wiley, New York, 1997).
+[176] R. Piessens, in Transforms and applications handbook, edited by A. D. Poularikas (CRC, Boca
+Raton, 2000), chap. 9.
+[177] M. Powell, in Large-scale nonlinear optimization, edited by G. Di Pillo and M. Roma (Springer,
+2006), pp. 255–297.
+[178] L. C. Andreani and D. Gerace, Phys. Rev. B 73, 235114 (2006).
+[179] D. Maystre and M. Cadilhac, Journal of Mathematical Physics 26, 2201 (1985).
+[180] D. Maystre, P. Electromagn. Res. 57, 55 (2006).
+[181] I. N. Vekua, New methods for solving elliptic equations (North-Holland, Amsterdam, 1967).
+[182] O. Christensen, An introduction to frames and Riesz bases (Birkhäuser, Boston, 2003).
+[183] J. S. Hesthaven, S. Gottlieb, and D. Gottlieb, Spectral methods for time-dependent problems (Cam-
+bridge University Press, Cambridge, 2007).
+[184] F. Tisseur and K. Meerbergen, SIAM Rev. 43, 235 (2001), ISSN 0036-1445.
+[185] R. C. Ward, SIAM J. Sci. Stat. Comput. 2, 141 (1981).
+[186] E. Anderson, Z. Bai, C. Bischof, S. Blackford, J. Demmel, J. Dongarra, J. Du Croz, A. Greenbaum,
+S. Hammarling, A. McKenney, et al., LAPACK users’ guide (SIAM, Philadelphia, 1999).
+[187] MATLAB 7 function reference, release 2010a, http://www.mathworks.com (2010).
+[188] MIT Photonic Bands (MPB), http://ab-initio.mit.edu/mpb (2003).
+[189] T. Betcke, SIAM J. Matrix Anal. Appl. 30, 1320 (2008).
+[190] M. A. Morgan, S. Chang, and K. K. Mei, IEEE Trans. Antennas Propag. 25, 413 (1977).
+[191] M. A. Morgan and K. K. Mei, IEEE Trans. Antennas Propag. 27, 202 (1979).
+[192] J. Lee, G. M. Wilkins, and R. Mitra, IEEE Transactions on Microwave Theory Techniques 41,
+1981 (1993).
+[193] O. Chinellato, Ph.D. thesis, Swiss Federal Institute of Technology, Zürich (2005).
+[194] O. Chinellato, P. Arbenz, M. Streiff, and A. Witzig, Future Gener. Comput. Syst. 21, 1263 (2005).
+BIBLIOGRAPHY 153
+[195] R. Hiptmair and P. D. Ledger, Int. J. Numer. Meth. Engng 62, 1652 (2005).
+[196] M. Wong, M. Prak, and V. Hanna, in IEEE MTT-S Dig. (1995), pp. 285–288.
+[197] P. Lacoste and Y. Gay, in Mathematical and numerical aspects of wave propagation phenomena
+(SIAM, 1991), pp. 746–749, cited after ref. 196.
+[198] A. D. Greenwood and J. Jin, IEEE Trans. Antennas Propag. 47, 1260 (1999).
+[199] J. P. Boyd, Chebyshev and Fourier spectral methods (Dover, New York, 2000).
+[200] D. Sun, J. Manges, X. Yuan, and Z. Cendes, IEEE Antennas Propag. Mag. 37, 12 (1995).
+[201] I. Munteanu, ICS Newslett. 9, 10 (2002).
+[202] C. Schwab, p- and hp- finite element methods: theory and applications in solid and fluid mechan-
+ics (Oxford University Press, Oxford, 1998).
+[203] Z. Xu and B. Wu, Int. J. Numer. Meth. Engng 75, 945 (2008).
+[204] N. P. van der Aa, H. G. Ter Morsche, and R. R. M. Mattheij, Electron. J. Lin. Algebra 16, 300
+(2007).
+
+
+Conception et modélisation numérique
+de composants optiques en nanophotonique intégrée
+Résumé Cette thèse est consacrée à la conception et l’analyse théorique de différents composants en
+optique intégrée.
+Nous présentons un modèle de milieu effectif pour les cristaux photoniques (CPs) 2D qui rend
+compte des effets de surface, puis un algorithme pour la conception de réseaux antiréfléchissants grand-
+angle pour ces CPs. Ces réseaux permettent d’améliorer significativement la transmission à travers une
+lentille plate d’indice négatif.
+Nous proposons une nouvelle génération de circulateurs magnétooptiques compacts, fonctionnant
+dans un champ magnétique extérieur uniforme et constitués d’une cavité résonnante en anneaux circu-
+laires couplée directement à des guides d’ondes standards.
+Nous généralisons la méthode multipolaire 2D aux matériaux gyrotropiques et la formulons sans
+« lattice sums » pour les structures périodiques. Enfin, nous décrivons en détail la méthode des éléments
+finis pour le calcul des modes propres des cavités 3D en anneaux circulaires et matériaux gyrotropiques.
+Mots clés cristaux photoniques, composants magnétooptiques, théories du milieu effectif, réseaux
+antiréfléchissants, méthodes numériques, optique intégrée.
+Design and numerical modelling of integrated optical components
+Abstract This thesis is devoted to the design and theoretical and numerical analysis of a number of
+photonic crystal (PC) components. In its first part we study the influence of the surface structure of
+two-dimensional (2D) PCs on their optical properties. We formulate an effective-medium model of
+such PCs, able to reproduce the commonly observed strong dependence of their effective parameters
+on the position of their truncation plane. We then develop an algorithm for the design of compact
+wide-angle antireflection gratings for 2D PCs and show them to improve significantly the transmission
+through a PC flat lens.
+In the second part of the manuscript we introduce a new approach to the design of resonant cavities
+to be used in compact magneto-optical circulators. In contrast to structures proposed previously, they
+are devoid of oppositely-polarised magnetic domains, which significantly facilitates their fabrication. We
+show that these cavities need not be embedded in PCs, but can be coupled directly with standard rib
+waveguides.
+Some numerical techniques developed in the course of this thesis are presented in the last part
+of the manuscript. We extend the multiple-scattering method to the case of gyrotropic materials and
+introduce a straightforward and extremely accurate method for the calculation of band structures of
+2D PCs composed of circular cylinders, based on Fourier-Bessel expansions. Finally, we describe the
+implementation of the finite-element method for the calculation of eigenmodes of open, axisymmetric,
+three-dimensional cavities containing gyrotropic materials.
+Keywords photonic crystals, magneto-optical devices, effective-medium theory, antireflection gratings,
+numerical methods, integrated optics.
+Laboratoire d’accueil Équipe CLARTE, Institut Fresnel, Campus de Saint Jérôme,
+avenue Escadrille Normandie-Niemen, 13397 Marseille Cedex 20
+Formation doctorale physique théorique et mathématique
diff --git a/examples/theses/these_archivage_2903871_-_ziyadeh_-_optimise.pdf b/examples/theses/these_archivage_2903871_-_ziyadeh_-_optimise.pdf
new file mode 100644
index 00000000..a5cf3014
Binary files /dev/null and b/examples/theses/these_archivage_2903871_-_ziyadeh_-_optimise.pdf differ
diff --git a/examples/theses/these_archivage_3274485.pdf b/examples/theses/these_archivage_3274485.pdf
new file mode 100644
index 00000000..c929fcf9
Binary files /dev/null and b/examples/theses/these_archivage_3274485.pdf differ
diff --git a/pom.xml b/pom.xml
index 39be6284..3e59f66e 100644
--- a/pom.xml
+++ b/pom.xml
@@ -214,25 +214,11 @@
 			<artifactId>gson</artifactId>
 			<version>2.3.1</version>
 		</dependency>
-<!--
-		<dependency>
-			<groupId>com.google.guava</groupId>
-			<artifactId>guava</artifactId>
-			<version>${guava.version}</version>
-		</dependency>
--->
 		<dependency>
 			<groupId>org.xml-cml</groupId>
 			<artifactId>svg2xml</artifactId>
 			<version>0.1-SNAPSHOT</version>
 		</dependency>
-		<!-- 
-		<dependency>
-			<groupId>org.xml-cml</groupId>
-			<artifactId>svgbuilder</artifactId>
-			<version>0.1-SNAPSHOT</version>
-		</dependency>
-		-->
 		
 		<!--  to avoid Xerces Hell? 
 		http://stackoverflow.com/questions/17777821/maven-dependency-conflict-org-w3c-dom-elementtraversal
diff --git a/src/main/java/org/xmlcml/norma/InputFormat.java b/src/main/java/org/xmlcml/norma/InputFormat.java
index 255ffa49..049f53a8 100644
--- a/src/main/java/org/xmlcml/norma/InputFormat.java
+++ b/src/main/java/org/xmlcml/norma/InputFormat.java
@@ -11,6 +11,7 @@
 public enum InputFormat {
 	DOC,
 	DOCX,
+	HOCR,
 	HTML,
 	LATEX,
 	PDF,
@@ -45,6 +46,11 @@ public static InputFormat getInputFormat(String inputName) {
+		// HOCR is tested before HTML because ".hocr.html" names also end in an HTML suffix.
+		// NOTE(review): assumes is(InputFormat.HTML, ...) matches on the ".html" suffix -- confirm.
+		if (is(InputFormat.HOCR, inputName) || inputName.endsWith(".hocr.html")) {
+			return InputFormat.HOCR;
+		}
 		if (is(InputFormat.HTML, inputName) || inputName.endsWith(".htm")) {
 			return InputFormat.HTML;
 		}
 		if (is(InputFormat.SVG, inputName)) {
 			return InputFormat.SVG;
 		}
diff --git a/src/main/java/org/xmlcml/norma/NormaArgProcessor.java b/src/main/java/org/xmlcml/norma/NormaArgProcessor.java
index 1f51f1c0..987328bc 100755
--- a/src/main/java/org/xmlcml/norma/NormaArgProcessor.java
+++ b/src/main/java/org/xmlcml/norma/NormaArgProcessor.java
@@ -190,7 +190,9 @@ public void outputMethod(ArgumentOption option) {
 
 	private void outputSpecifiedFormat() {
 		getOrCreateNormaTransformer();
-		currentCMDir.writeFile(normaTransformer.outputTxt, CMDir.FULLTEXT_PDF_TXT);
+		if (normaTransformer.outputTxt != null) {
+			currentCMDir.writeFile(normaTransformer.outputTxt, CMDir.FULLTEXT_PDF_TXT);
+		}
 		if (normaTransformer.htmlElement != null) {
 			currentCMDir.writeFile(normaTransformer.htmlElement.toXML(), CMDir.FULLTEXT_HTML);
 		}
@@ -225,20 +227,19 @@ File checkAndGetInputFile(CMDir cmDir) {
 	private void createCMDirListFromInputList() {
 		// proceed unless there is a single reserved file for input
 		if (CMDir.isNonEmptyNonReservedInputList(inputList)) {
-//			if (output != null) {
-				LOG.debug("CREATING CMDir FROM INPUT:"+inputList);
-				getOrCreateOutputDirectory();
-				ensureCMDirList();
-				createNewCMDirsAndAddToList();
-//			}
+			LOG.trace("CREATING CMDir FROM INPUT:"+inputList);
+			// this actually creates directory
+			getOrCreateOutputDirectory();
+			ensureCMDirList();
+			createNewCMDirsAndCopyOriginalFilesAndAddToList();
 		}
 	}
 
-	private void createNewCMDirsAndAddToList() {
+	private void createNewCMDirsAndCopyOriginalFilesAndAddToList() {
 		ensureCMDirList();
 		for (String filename : inputList) {
 			try {
-				CMDir cmDir = createCMDir(filename);
+				CMDir cmDir = createCMDirAndCopyFileOrMakeSubDirectory(filename);
 				if (cmDir != null) {
 					cmDirList.add(cmDir);
 				}
@@ -248,7 +249,7 @@ private void createNewCMDirsAndAddToList() {
 		}
 	}
 
-	private CMDir createCMDir(String filename) throws IOException {
+	private CMDir createCMDirAndCopyFileOrMakeSubDirectory(String filename) throws IOException {
 		CMDir cmDir = null;
 		File file = new File(filename);
 		if (file.isDirectory()) {
@@ -260,20 +261,81 @@ private CMDir createCMDir(String filename) throws IOException {
 					LOG.error(name+" is reserved for CMDir: (check that inputs are not already in a CMDir) "+file.getAbsolutePath());
 				}
 				String cmFilename = CMDir.getCMDirReservedFilenameForExtension(name);
-				String dirName = FilenameUtils.removeExtension(name);
-				File cmDirFile = new File(output, dirName);
-				cmDir = new CMDir(cmDirFile);
-				cmDir.createDirectory(cmDirFile, false);
-				File destFile = cmDir.getReservedFile(cmFilename);
-				if (destFile != null) {
-					FileUtils.copyFile(file, destFile);
-					LOG.trace("CMD "+cmFilename+"; "+cmDirFile);
+				if (cmFilename == null) {
+					// the lookup returned no reserved name for this file, so no CMDir is made
+					LOG.error("Cannot create CMDir from this type of file: "+name);
+					return null;
+				}
+				LOG.trace("Reserved filename: "+cmFilename);
+				// the CMDir itself is needed whichever kind of reserved name we got
+				cmDir = makeCMDir(name);
+				if (CMDir.isReservedDirectory(cmFilename)) {
+					// reserved subdirectory: the file keeps its own name inside it
+					ensureReservedDirectoryAndCopyFile(cmDir, cmFilename, filename);
+				} else {
+					// single reserved file: copy the input under the reserved name
+					File destFile = cmDir.getReservedFile(cmFilename);
+					if (destFile != null) {
+						FileUtils.copyFile(file, destFile);
+					}
 				}
 			}
 		}
 		return cmDir;
 	}
 
+	/** Creates the CMDir named after {@code name} with its extension removed.
+	 *
+	 * @param name file name (with extension) from which the CMDir name is derived
+	 * @return the CMDir returned by {@link #createCMDir(String)}
+	 */
+	private CMDir makeCMDir(String name) {
+		String dirName = FilenameUtils.removeExtension(name);
+		return createCMDir(dirName);
+	}
+
+	/** Makes the reserved subdirectory inside a CMDir and copies the input file into it,
+	 * keeping the file's own name.
+	 *
+	 * @param cmDir CMDir that will hold the reserved subdirectory
+	 * @param reservedFilename name of the reserved subdirectory
+	 * @param filename path of the file to copy
+	 * @throws RuntimeException wrapping the IOException if the directory cannot be made
+	 *         or the file cannot be copied
+	 */
+	private void ensureReservedDirectoryAndCopyFile(CMDir cmDir, String reservedFilename, String filename) {
+		File reservedDir = new File(cmDir.getDirectory(), reservedFilename);
+		LOG.trace("Res "+reservedDir.getAbsolutePath());
+		File orig = new File(filename);
+		LOG.trace("Orig: "+orig.getAbsolutePath());
+		try {
+			FileUtils.forceMkdir(reservedDir);
+		} catch (IOException e) {
+			// message text is unchanged; the cause is chained so the stack trace survives
+			throw new RuntimeException("Cannot make directory: "+reservedFilename+" "+e, e);
+		}
+		String name = FilenameUtils.getName(filename);
+		try {
+			FileUtils.copyFile(orig, new File(reservedDir, name));
+		} catch (IOException e) {
+			throw new RuntimeException("Cannot copy file: "+filename+" to "+reservedDir+" / "+e, e);
+		}
+		LOG.debug("created "+name+" in "+reservedDir);
+	}
+
+	/** Creates a CMDir as a child of the {@code output} directory.
+	 *
+	 * @param dirName name of the CMDir directory under {@code output}
+	 * @return the new CMDir
+	 */
+	private CMDir createCMDir(String dirName) {
+		File cmDirFile = new File(output, dirName);
+		CMDir cmDir = new CMDir(cmDirFile);
+		// NOTE(review): meaning of the boolean flag is not visible here -- confirm in CMDir
+		cmDir.createDirectory(cmDirFile, false);
+		return cmDir;
+	}
+
 	private void getOrCreateOutputDirectory() {
 		if (output != null) {
 			File outputDir = new File(output);
diff --git a/src/main/java/org/xmlcml/norma/input/InputReader.java b/src/main/java/org/xmlcml/norma/input/InputReader.java
index 6d3ce8db..5e5a7f7d 100644
--- a/src/main/java/org/xmlcml/norma/input/InputReader.java
+++ b/src/main/java/org/xmlcml/norma/input/InputReader.java
@@ -8,6 +8,7 @@
 import org.xmlcml.norma.InputFormat;
 import org.xmlcml.norma.RawInput;
 import org.xmlcml.norma.input.html.HtmlReader;
+import org.xmlcml.norma.input.ocr.HOCRReader;
 
 public class InputReader {
 
@@ -19,6 +20,8 @@ public static InputReader createReader(InputFormat type) {
 			LOG.debug("no input type");
 		} else if (type.equals(InputFormat.HTML)) {
 			reader = new HtmlReader();
+		} else if (type.equals(InputFormat.HOCR)) {
+			reader = new HOCRReader();
 		} else {
 			throw new RuntimeException("Unknown/unsupported input type: "+type);
 		}
diff --git a/src/test/java/org/xmlcml/norma/InputTest.java b/src/test/java/org/xmlcml/norma/InputTest.java
index aa0704a8..050931d9 100644
--- a/src/test/java/org/xmlcml/norma/InputTest.java
+++ b/src/test/java/org/xmlcml/norma/InputTest.java
@@ -109,6 +109,11 @@ public void testInputDirectory() {
 	}
 	
 	/** creates single `CMDir` directory
+	 * 
+	 * // SHOWCASE
+	 * Reads isolated XML file, creates a CMDir from the name and copies XML file to
+	 * fulltext.xml
+	 * 
 	 * 
 	 */
 	@Test
@@ -120,6 +125,7 @@ public void testMakeSingleQuickscrape() {
 				new File(Fixtures.TEST_MISC_DIR, "mdpi-04-00932.xml").toString(),
 				"-o", cmDir.toString()
 		};
+		// constructing the arg processor makes the CMDir, copies the input file into it and renames the copy
 		DefaultArgProcessor argProcessor = new NormaArgProcessor(args);
 		List<String> inputList = argProcessor.getInputList();
 		Assert.assertEquals("inputList", 1, inputList.size());
diff --git a/src/test/java/org/xmlcml/norma/Prototypes.java b/src/test/java/org/xmlcml/norma/Prototypes.java
index 88dec783..062939eb 100644
--- a/src/test/java/org/xmlcml/norma/Prototypes.java
+++ b/src/test/java/org/xmlcml/norma/Prototypes.java
@@ -1,12 +1,22 @@
 package org.xmlcml.norma;
 
+import org.apache.log4j.Level;
+import org.apache.log4j.Logger;
+
 public class Prototypes {
 
+	
+	private static final Logger LOG = Logger.getLogger(Prototypes.class);
+	static {
+		LOG.setLevel(Level.DEBUG);
+	}
+	
 	public static void main(String[] args) {
 //		runHalThesis1();
 //		runHalThesis2();
 //		runHalThesis3();
-		runHalManyThesis();
+//		runHalManyThesis();
+		runImages();
 	}
 
 	private static void runHalThesis1() {
@@ -31,8 +41,34 @@ private static void runHalManyThesis() {
 		createPDFTXT("smigaj");
 		createPDFTXT("TH2013PEST1177");
 	}
+
+	/** Runs {@link #createImageDir} on the {@code peterijsem/sourceimages/small} PNG images. */
+	private static void runImages() {
+		createImageDir("peterijsem/sourceimages/small", "examples/ijsem/small", "png");
+	}
+
+	/** Builds a Norma command line that reads {@code imagedir}, lists the given image
+	 * types after {@code -e} and writes to {@code cmdir}, then runs it.
+	 *
+	 * @param imagedir value passed after {@code -i}
+	 * @param cmdir value passed after {@code -o}
+	 * @param imageTypes values listed after {@code -e}
+	 */
+	private static void createImageDir(String imagedir, String cmdir, String ... imageTypes) {
+		StringBuilder extensions = new StringBuilder(" -e ");
+		for (String imageType : imageTypes) {
+			extensions.append(" ").append(imageType).append(" ");
+		}
+		String cmd = "-i "+imagedir+extensions+" -o "+cmdir;
+		LOG.debug(cmd);
+		new Norma().run(cmd);
+//			new Norma().run("-q "+imagedir+root+" -i fulltext.pdf -o fulltext.pdf.txt --xsl pdf2txt");
+	}
 
+	/** Creates a new CMDir from the named thesis PDF (copied to "fulltext.pdf"),
+	 * then runs the pdf2txt conversion of that copy into "fulltext.pdf.txt".
+	 */
 	private static void createPDFTXT(String name) {
 		new Norma().run("-i examples/theses/"+name+".pdf -o examples/theses/");
 		new Norma().run("-q examples/theses/"+name+" -i fulltext.pdf -o fulltext.pdf.txt --xsl pdf2txt");
 	}
diff --git a/src/test/java/org/xmlcml/norma/json/CatalogEntryTest.java b/src/test/java/org/xmlcml/norma/json/CatalogEntryTest.java
index 5258cc19..b7127afb 100644
--- a/src/test/java/org/xmlcml/norma/json/CatalogEntryTest.java
+++ b/src/test/java/org/xmlcml/norma/json/CatalogEntryTest.java
@@ -136,7 +136,7 @@ public class CatalogEntryTest {
 	    "Scott R. Woodward",
 	    "Antonio Salas",
 	    "Antonio Torroni",
-	    "Hans-J\u00fcrgen Bandelt"],
+	    "Hans-Jürgen Bandelt"], // ISOLATIN character
 	    "title": "The Phylogeny of the Four Pan-American MtDNA Haplogroups: Implications for Evolutionary and Disease Studies",
 	    "firstpage": "e1764",
 	    "id": "b11a6a6453b24ecb9313f9eec27501c4",
@@ -210,6 +210,7 @@ public void testCompleteCatalog() throws IOException {
 	    CatalogEntry catalogEntry = CatalogEntry.createCatalogEntry(jsonObject);
 	    Assert.assertEquals("took", 2, catalogEntry.getTook().intValue());
 	    Assert.assertFalse("timed_out", catalogEntry.getTimed_out());
+	    // the expected string contains an ISO-Latin character ("ü" in "Hans-Jürgen"); ignore this for the present
 	    Assert.assertEquals("hit", "[0.75475913 / 54d58c9da5c44dfd9c5313107ade2152 /  / 10.1371/journal.pone.0102272 / 2014-12-01 0620 / PLOS ONE: an inclusive, peer-reviewed, open-access resource from the PUBLIC LIBRARY OF SCIENCE. Reports of well-performed scientific studies from all disciplines freely available to the whole world. / [The PLOS ONE Staff] / e102272 / 54d58c9da5c44dfd9c5313107ade2152 / 9 / /article/fetchObjectAttachment.action?uri=info%3Adoi%2F10.1371%2Fjournal.pone.0102272&representation=XML / 2014-12-01 0616 / 2014/7/2 / 7 / http://dx.plos.org/10.1371/journal.pone.0102272.pdf / contentmine / , 0.7116731 / 0d84b65dd0f044ab9f6a5e430104315d /  / 10.1371/journal.pone.0070048 / 2014-12-29 1902 / PLOS ONE: an inclusive, peer-reviewed, open-access resource from the PUBLIC LIBRARY OF SCIENCE. Reports of well-performed scientific studies from all disciplines freely available to the whole world. / [Angelina R. Sutin, Antonio Terracciano] / e70048 / 0d84b65dd0f044ab9f6a5e430104315d / 8 / null / 2014-12-29 1902 / 2013/7/24 / 7 / http://dx.plos.org/10.1371/journal.pone.0070048.pdf / contentmine / , 0.6614297 / f53f4ee866964ab08417720ed500e72d /  / 10.1371/journal.pbio.1001934 / 2014-12-01 1929 / PLOS Biology is an open-access, peer-reviewed journal that features works of exceptional significance in all areas of biological science, from molecules to ecosystems, including works at the interface with other disciplines. / [Johan J. Bolhuis, Ian Tattersall, Noam Chomsky, Robert C. Berwick] / e1001934 / f53f4ee866964ab08417720ed500e72d / 12 / null / 2014-12-01 1929 / 2014/8/26 / 8 / http://dx.plos.org/10.1371/journal.pbio.1001934.pdf / contentmine / , 0.6614297 / d66cb9ce42ab40c68fbd6d8d548e267c /  / 10.1371/journal.pone.0053095 / 2014-12-07 1523 / PLOS ONE: an inclusive, peer-reviewed, open-access resource from the PUBLIC LIBRARY OF SCIENCE. Reports of well-performed scientific studies from all disciplines freely available to the whole world. 
/ [Mahendra Piraveenan, Mikhail Prokopenko, Liaquat Hossain] / e53095 / d66cb9ce42ab40c68fbd6d8d548e267c / 8 / null / 2014-12-07 1523 / 2013/1/22 / 1 / http://dx.plos.org/10.1371/journal.pone.0053095.pdf / contentmine / , 0.6227139 / 2cd1ac54443e463bb1f385febae2ea94 /  / 10.1371/journal.pone.0105948 / 2014-12-01 1926 / PLOS ONE: an inclusive, peer-reviewed, open-access resource from the PUBLIC LIBRARY OF SCIENCE. Reports of well-performed scientific studies from all disciplines freely available to the whole world. / [Richard D. Norris, James M. Norris, Ralph D. Lorenz, Jib Ray, Brian Jackson] / e105948 / 2cd1ac54443e463bb1f385febae2ea94 / 9 / null / 2014-12-01 1926 / 2014/8/27 / 8 / http://dx.plos.org/10.1371/journal.pone.0105948.pdf / contentmine / , 0.6227139 / e2a99c800e4f4e7caad2cff11c4b5880 /  / 10.1371/journal.pntd.0003131 / 2014-12-04 1819 / PLOS Neglected Tropical Diseases is an open-access journal publishing peer-reviewed research on the world\\'s most neglected tropical diseases, such as elephantiasis, river blindness, leprosy, hookworm, schistosomiasis, and African sleeping sickness / [Samson Leta, Thi Ha Thanh Dao, Frehiwot Mesele, Gezahegn Alemayehu] / e3131 / e2a99c800e4f4e7caad2cff11c4b5880 / 8 / null / 2014-12-01 1925 / 2014/9/4 / 9 / http://dx.plos.org/10.1371/journal.pntd.0003131.pdf / contentmine / , 0.6099375 / 2e865e2652ad4adb95303092d6c8b7a2 /  / 10.1371/journal.pcbi.1003892 / 2014-12-31 0120 / PLOS Computational Biology is an open-access / [Nicholas Generous, Geoffrey Fairchild, Alina Deshpande, Sara Y. Del Valle, Reid Priedhorsky] / e1003892 / 2e865e2652ad4adb95303092d6c8b7a2 / 10 / null / 2014-12-30 2017 / 2014/11/13 / 11 / http://dx.plos.org/10.1371/journal.pcbi.1003892.pdf / contentmine / , 0.5906909 / 9bbeac16ebe040f4bf4ee49b7b763053 /  / 10.1371/journal.pone.0094346 / 2014-12-04 1819 / PLOS ONE: an inclusive, peer-reviewed, open-access resource from the PUBLIC LIBRARY OF SCIENCE. 
Reports of well-performed scientific studies from all disciplines freely available to the whole world. / [Chuong V. Nguyen, David R. Lovell, Matt Adcock, John La Salle] / e94346 / 9bbeac16ebe040f4bf4ee49b7b763053 / 9 / null / 2014-12-01 1926 / 2014/4/23 / 4 / http://dx.plos.org/10.1371/journal.pone.0094346.pdf / contentmine / , 0.5521466 / b11a6a6453b24ecb9313f9eec27501c4 /  / 10.1371/journal.pone.0001764 / 2014-12-02 0449 / PLOS ONE: an inclusive, peer-reviewed, open-access resource from the PUBLIC LIBRARY OF SCIENCE. Reports of well-performed scientific studies from all disciplines freely available to the whole world. / [Alessandro Achilli, Ugo A. Perego, Claudio M. Bravi, Michael D. Coble, Qing-Peng Kong, Scott R. Woodward, Antonio Salas, Antonio Torroni, Hans-Jürgen Bandelt] / e1764 / b11a6a6453b24ecb9313f9eec27501c4 / 3 / null / 2014-12-02 0449 / 2008/3/12 / 3 / http://dx.plos.org/10.1371/journal.pone.0001764.pdf / contentmine / , 0.45745313 / bb282dc238684b51bc1ee60ed1a4bc6b /  / 10.1371/journal.pone.0000829 / 2014-12-02 0449 / PLOS ONE: an inclusive, peer-reviewed, open-access resource from the PUBLIC LIBRARY OF SCIENCE. Reports of well-performed scientific studies from all disciplines freely available to the whole world. / [Erika Tamm, Toomas Kivisild, Maere Reidla, Mait Metspalu, David Glenn Smith, Connie J. Mulligan, Claudio M. Bravi, Olga Rickards, Cristina Martinez-Labarga, Elsa K. Khusnutdinova, Sardana A. Fedorova, Maria V. Golubenko, Vadim A. Stepanov, Marina A. Gubina, Sergey I. Zhadanov, Ludmila P. Ossipova, Larisa Damba, Mikhail I. Voevoda, Jose E. Dipierri, Richard Villems, Ripan S. Malhi] / e829 / bb282dc238684b51bc1ee60ed1a4bc6b / 2 / null / 2014-12-02 0449 / 2007/9/5 / 9 / http://dx.plos.org/10.1371/journal.pone.0000829.pdf / contentmine / ] / 54 / 0.75475913 /  / null / null /  / 2 / false / ",
 	    		catalogEntry.toString());
 	}