diff --git a/.gitignore b/.gitignore
index 5a7e6ca..4175871 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,3 +1,4 @@
 *.class
 *.jar
+*.ser
 lib/chromedriver
diff --git a/.idea/libraries/Maven__commons_cli_commons_cli_1_3_1.xml b/.idea/libraries/Maven__commons_cli_commons_cli_1_3_1.xml
new file mode 100644
index 0000000..a1510b9
--- /dev/null
+++ b/.idea/libraries/Maven__commons_cli_commons_cli_1_3_1.xml
@@ -0,0 +1,13 @@
+<component name="libraryTable">
+  <library name="Maven: commons-cli:commons-cli:1.3.1">
+    <CLASSES>
+      <root url="jar://$MAVEN_REPOSITORY$/commons-cli/commons-cli/1.3.1/commons-cli-1.3.1.jar!/" />
+    </CLASSES>
+    <JAVADOC>
+      <root url="jar://$MAVEN_REPOSITORY$/commons-cli/commons-cli/1.3.1/commons-cli-1.3.1-javadoc.jar!/" />
+    </JAVADOC>
+    <SOURCES>
+      <root url="jar://$MAVEN_REPOSITORY$/commons-cli/commons-cli/1.3.1/commons-cli-1.3.1-sources.jar!/" />
+    </SOURCES>
+  </library>
+</component>
\ No newline at end of file
diff --git a/.idea/workspace.xml b/.idea/workspace.xml
index 079e6fb..3c9101d 100644
--- a/.idea/workspace.xml
+++ b/.idea/workspace.xml
@@ -2,6 +2,13 @@
 <project version="4">
   <component name="ChangeListManager">
     <list default="true" id="bbbbc773-7714-4942-be21-383885d0c5dc" name="Default" comment="">
+      <change afterPath="$PROJECT_DIR$/.idea/libraries/Maven__commons_cli_commons_cli_1_3_1.xml" afterDir="false" />
+      <change afterPath="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/experiment/TestReadObject.java" afterDir="false" />
+      <change beforePath="$PROJECT_DIR$/.idea/workspace.xml" beforeDir="false" afterPath="$PROJECT_DIR$/.idea/workspace.xml" afterDir="false" />
+      <change beforePath="$PROJECT_DIR$/EntityAnnotation.iml" beforeDir="false" afterPath="$PROJECT_DIR$/EntityAnnotation.iml" afterDir="false" />
+      <change beforePath="$PROJECT_DIR$/pom.xml" beforeDir="false" afterPath="$PROJECT_DIR$/pom.xml" afterDir="false" />
+      <change beforePath="$PROJECT_DIR$/serialized/kevin.ser" beforeDir="false" afterPath="$PROJECT_DIR$/serialized/kevin.ser" afterDir="false" />
+      <change beforePath="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/experiment/AnnotatorFactory.java" beforeDir="false" afterPath="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ner/annotation/AnnotatorFactory.java" afterDir="false" />
       <change beforePath="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java" beforeDir="false" afterPath="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java" afterDir="false" />
     </list>
     <ignored path="$PROJECT_DIR$/out/" />
@@ -32,8 +39,8 @@
       <file leaf-file-name="HTMLDocumentIngestionManager.java" pinned="false" current-in-tab="true">
         <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java">
           <provider selected="true" editor-type-id="text-editor">
-            <state relative-caret-position="237">
-              <caret line="248" column="10" selection-start-line="248" selection-start-column="10" selection-end-line="248" selection-end-column="10" />
+            <state relative-caret-position="261">
+              <caret line="285" column="77" selection-start-line="285" selection-start-column="77" selection-end-line="285" selection-end-column="77" />
               <folding>
                 <element signature="imports" expanded="true" />
               </folding>
@@ -41,11 +48,20 @@
           </provider>
         </entry>
       </file>
+      <file leaf-file-name="TextFileFilter.java" pinned="false" current-in-tab="false">
+        <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/TextFileFilter.java">
+          <provider selected="true" editor-type-id="text-editor">
+            <state relative-caret-position="120">
+              <caret line="10" column="13" selection-start-line="10" selection-start-column="13" selection-end-line="10" selection-end-column="13" />
+            </state>
+          </provider>
+        </entry>
+      </file>
       <file leaf-file-name="pom.xml" pinned="false" current-in-tab="false">
         <entry file="file://$PROJECT_DIR$/pom.xml">
           <provider selected="true" editor-type-id="text-editor">
-            <state relative-caret-position="200">
-              <caret line="22" column="59" lean-forward="true" selection-start-line="22" selection-start-column="59" selection-end-line="22" selection-end-column="59" />
+            <state relative-caret-position="339">
+              <caret line="73" column="27" selection-start-line="73" selection-start-column="27" selection-end-line="73" selection-end-column="27" />
             </state>
           </provider>
         </entry>
@@ -53,7 +69,7 @@
       <file leaf-file-name="CustomizableCoreAnnotations.java" pinned="false" current-in-tab="false">
         <entry file="file://$PROJECT_DIR$/src/main/java/edu/stanford/nlp/ling/CustomizableCoreAnnotations.java">
           <provider selected="true" editor-type-id="text-editor">
-            <state relative-caret-position="915">
+            <state relative-caret-position="337">
               <caret line="66" column="36" selection-start-line="66" selection-start-column="36" selection-end-line="66" selection-end-column="36" />
             </state>
           </provider>
@@ -74,10 +90,22 @@
         </entry>
       </file>
       <file leaf-file-name="AnnotatorFactory.java" pinned="false" current-in-tab="false">
-        <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/experiment/AnnotatorFactory.java">
+        <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ner/annotation/AnnotatorFactory.java">
           <provider selected="true" editor-type-id="text-editor">
-            <state relative-caret-position="330">
-              <caret line="26" column="57" selection-start-line="26" selection-start-column="57" selection-end-line="26" selection-end-column="57" />
+            <state relative-caret-position="60">
+              <caret line="8" column="13" selection-start-line="8" selection-start-column="13" selection-end-line="8" selection-end-column="13" />
+            </state>
+          </provider>
+        </entry>
+      </file>
+      <file leaf-file-name="TestReadObject.java" pinned="false" current-in-tab="false">
+        <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/experiment/TestReadObject.java">
+          <provider selected="true" editor-type-id="text-editor">
+            <state relative-caret-position="435">
+              <caret line="29" column="71" selection-start-line="29" selection-start-column="71" selection-end-line="29" selection-end-column="71" />
+              <folding>
+                <element signature="imports" expanded="true" />
+              </folding>
             </state>
           </provider>
         </entry>
@@ -100,28 +128,6 @@
           </provider>
         </entry>
       </file>
-      <file leaf-file-name="WordsToSentencesAnnotator.java" pinned="false" current-in-tab="false">
-        <entry file="jar://$MAVEN_REPOSITORY$/edu/stanford/nlp/stanford-corenlp/3.8.0/stanford-corenlp-3.8.0-sources.jar!/edu/stanford/nlp/pipeline/WordsToSentencesAnnotator.java">
-          <provider selected="true" editor-type-id="text-editor">
-            <state relative-caret-position="3180">
-              <caret line="228" selection-start-line="228" selection-end-line="228" />
-            </state>
-          </provider>
-        </entry>
-      </file>
-      <file leaf-file-name="Annotation.java" pinned="false" current-in-tab="false">
-        <entry file="jar://$MAVEN_REPOSITORY$/edu/stanford/nlp/stanford-corenlp/3.8.0/stanford-corenlp-3.8.0-sources.jar!/edu/stanford/nlp/pipeline/Annotation.java">
-          <provider selected="true" editor-type-id="text-editor">
-            <state relative-caret-position="795">
-              <caret line="92" column="12" selection-start-line="92" selection-start-column="12" selection-end-line="92" selection-end-column="12" />
-              <folding>
-                <element signature="e#2261#2262#0" expanded="true" />
-                <element signature="e#2323#2324#0" expanded="true" />
-              </folding>
-            </state>
-          </provider>
-        </entry>
-      </file>
     </leaf>
   </component>
   <component name="FileTemplateManagerImpl">
@@ -133,7 +139,6 @@
   </component>
   <component name="FindInProjectRecents">
     <findStrings>
-      <find>regexne</find>
       <find>RegexNER</find>
       <find>ner</find>
       <find>Stanford</find>
@@ -163,6 +168,7 @@
       <find>serial</find>
       <find>im</find>
       <find>total</find>
+      <find>Data</find>
     </findStrings>
     <replaceStrings>
       <replace>CustomizedCoreAnnotations.NamedEntityTagAnnotation</replace>
@@ -175,7 +181,6 @@
   <component name="IdeDocumentHistory">
     <option name="CHANGED_PATHS">
       <list>
-        <option value="$PROJECT_DIR$/src/org/forward/entitysearch/ingestion/Ingester.java" />
         <option value="$PROJECT_DIR$/src/org/forward/entitysearch/ingestion/TextFileFilter.java" />
         <option value="$PROJECT_DIR$/src/org/forward/entitysearch/ingestion/WholeDocumentIngestionManager.java" />
         <option value="$PROJECT_DIR$/src/org/forward/entitysearch/ner/annotation/extraction/DBPediaExtractor.java" />
@@ -223,6 +228,8 @@
         <option value="$PROJECT_DIR$/src/main/java/edu/stanford/nlp/pipeline/PipelineHelper.java" />
         <option value="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/experiment/AnnotatorFactory.java" />
         <option value="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/ESAnnotatedHTMLDocument.java" />
+        <option value="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ner/annotation/AnnotatorFactory.java" />
+        <option value="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/experiment/TestReadObject.java" />
         <option value="$PROJECT_DIR$/pom.xml" />
         <option value="$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java" />
       </list>
@@ -263,6 +270,64 @@
               <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
               <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
             </path>
+            <path>
+              <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
+              <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
+              <item name="src" type="462c0819:PsiDirectoryNode" />
+            </path>
+            <path>
+              <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
+              <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
+              <item name="src" type="462c0819:PsiDirectoryNode" />
+              <item name="main" type="462c0819:PsiDirectoryNode" />
+            </path>
+            <path>
+              <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
+              <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
+              <item name="src" type="462c0819:PsiDirectoryNode" />
+              <item name="main" type="462c0819:PsiDirectoryNode" />
+              <item name="java" type="462c0819:PsiDirectoryNode" />
+            </path>
+            <path>
+              <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
+              <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
+              <item name="src" type="462c0819:PsiDirectoryNode" />
+              <item name="main" type="462c0819:PsiDirectoryNode" />
+              <item name="java" type="462c0819:PsiDirectoryNode" />
+              <item name="nlp" type="462c0819:PsiDirectoryNode" />
+            </path>
+            <path>
+              <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
+              <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
+              <item name="src" type="462c0819:PsiDirectoryNode" />
+              <item name="main" type="462c0819:PsiDirectoryNode" />
+              <item name="java" type="462c0819:PsiDirectoryNode" />
+              <item name="entitysearch" type="462c0819:PsiDirectoryNode" />
+            </path>
+            <path>
+              <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
+              <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
+              <item name="src" type="462c0819:PsiDirectoryNode" />
+              <item name="main" type="462c0819:PsiDirectoryNode" />
+              <item name="java" type="462c0819:PsiDirectoryNode" />
+              <item name="entitysearch" type="462c0819:PsiDirectoryNode" />
+              <item name="experiment" type="462c0819:PsiDirectoryNode" />
+            </path>
+            <path>
+              <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
+              <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
+              <item name="src" type="462c0819:PsiDirectoryNode" />
+              <item name="main" type="462c0819:PsiDirectoryNode" />
+              <item name="java" type="462c0819:PsiDirectoryNode" />
+              <item name="entitysearch" type="462c0819:PsiDirectoryNode" />
+              <item name="ingestion" type="462c0819:PsiDirectoryNode" />
+            </path>
+            <path>
+              <item name="EntityAnnotation" type="b2602c69:ProjectViewProjectNode" />
+              <item name="EntityAnnotation" type="462c0819:PsiDirectoryNode" />
+              <item name="src" type="462c0819:PsiDirectoryNode" />
+              <item name="test" type="462c0819:PsiDirectoryNode" />
+            </path>
           </expand>
           <select />
         </subPane>
@@ -309,27 +374,27 @@
       <option name="VM_PARAMETERS" value="-Xmx4096m" />
       <extension name="coverage">
         <pattern>
-          <option name="PATTERN" value="org.forward.entitysearch.experiment.*" />
+          <option name="PATTERN" value="org.forward.entitysearch.ner.annotation.*" />
           <option name="ENABLED" value="true" />
         </pattern>
       </extension>
     </configuration>
-    <configuration name="Manager" type="Application" factoryName="Application" temporary="true" nameIsGenerated="true">
-      <option name="MAIN_CLASS_NAME" value="org.forward.entitysearch.Manager" />
+    <configuration name="PipelineHelper" type="Application" factoryName="Application" temporary="true" nameIsGenerated="true">
+      <option name="MAIN_CLASS_NAME" value="edu.stanford.nlp.pipeline.PipelineHelper" />
       <module name="EntityAnnotation" />
       <extension name="coverage">
         <pattern>
-          <option name="PATTERN" value="org.forward.entitysearch.*" />
+          <option name="PATTERN" value="edu.stanford.nlp.pipeline.*" />
           <option name="ENABLED" value="true" />
         </pattern>
       </extension>
     </configuration>
-    <configuration name="PipelineHelper" type="Application" factoryName="Application" temporary="true" nameIsGenerated="true">
-      <option name="MAIN_CLASS_NAME" value="edu.stanford.nlp.pipeline.PipelineHelper" />
+    <configuration name="TestReadObject" type="Application" factoryName="Application" temporary="true" nameIsGenerated="true">
+      <option name="MAIN_CLASS_NAME" value="org.forward.entitysearch.experiment.TestReadObject" />
       <module name="EntityAnnotation" />
       <extension name="coverage">
         <pattern>
-          <option name="PATTERN" value="edu.stanford.nlp.pipeline.*" />
+          <option name="PATTERN" value="org.forward.entitysearch.experiment.*" />
           <option name="ENABLED" value="true" />
         </pattern>
       </extension>
@@ -339,7 +404,7 @@
       <module name="EntityAnnotation" />
       <extension name="coverage">
         <pattern>
-          <option name="PATTERN" value="org.forward.entitysearch.experiment.*" />
+          <option name="PATTERN" value="org.forward.entitysearch.ner.annotation.*" />
           <option name="ENABLED" value="true" />
         </pattern>
       </extension>
@@ -347,6 +412,7 @@
     <configuration name="TestSelenium" type="Application" factoryName="Application" temporary="true">
       <option name="MAIN_CLASS_NAME" value="org.forward.entitysearch.ingestion.HTMLDocumentIngestionManager" />
       <module name="EntityAnnotation" />
+      <option name="PROGRAM_PARAMETERS" value="-i test_urls.csv -o serialized/ -v false" />
       <option name="VM_PARAMETERS" value="-Xmx4096m" />
       <option name="WORKING_DIRECTORY" value="file://$PROJECT_DIR$" />
       <RunnerSettings RunnerId="Run" />
@@ -359,18 +425,18 @@
     <list>
       <item itemvalue="Application.TestStanfordNLPAnnotator" />
       <item itemvalue="Application.TestSelenium" />
-      <item itemvalue="Application.Manager" />
       <item itemvalue="Application.BasicPipelineExample" />
       <item itemvalue="Application.TestRegex" />
       <item itemvalue="Application.PipelineHelper" />
+      <item itemvalue="Application.TestReadObject" />
     </list>
     <recent_temporary>
       <list>
         <item itemvalue="Application.TestSelenium" />
+        <item itemvalue="Application.TestReadObject" />
         <item itemvalue="Application.BasicPipelineExample" />
         <item itemvalue="Application.PipelineHelper" />
         <item itemvalue="Application.TestRegex" />
-        <item itemvalue="Application.Manager" />
       </list>
     </recent_temporary>
   </component>
@@ -393,12 +459,12 @@
       <workItem from="1526678891338" duration="5160000" />
       <workItem from="1526698295267" duration="21787000" />
       <workItem from="1526919640549" duration="22246000" />
-      <workItem from="1527016798854" duration="3867000" />
+      <workItem from="1527016798854" duration="14479000" />
     </task>
     <servers />
   </component>
   <component name="TimeTrackingManager">
-    <option name="totallyTimeSpent" value="231882000" />
+    <option name="totallyTimeSpent" value="242494000" />
   </component>
   <component name="ToolWindowManager">
     <frame x="6" y="23" width="1421" height="839" extended-state="0" />
@@ -528,21 +594,6 @@
     </expressions>
   </component>
   <component name="editorHistoryManager">
-    <entry file="file://$PROJECT_DIR$/src/main/java/edu/stanford/nlp/pipeline/CustomizedStanfordCoreNLP.java" />
-    <entry file="jar://$MAVEN_REPOSITORY$/edu/stanford/nlp/stanford-corenlp/3.8.0/stanford-corenlp-3.8.0-sources.jar!/edu/stanford/nlp/pipeline/AnnotationOutputter.java">
-      <provider selected="true" editor-type-id="text-editor">
-        <state relative-caret-position="1067">
-          <caret line="76" column="24" selection-start-line="76" selection-start-column="24" selection-end-line="76" selection-end-column="24" />
-        </state>
-      </provider>
-    </entry>
-    <entry file="jar://$MAVEN_REPOSITORY$/edu/stanford/nlp/stanford-corenlp/3.8.0/stanford-corenlp-3.8.0-sources.jar!/edu/stanford/nlp/pipeline/TextOutputter.java">
-      <provider selected="true" editor-type-id="text-editor">
-        <state relative-caret-position="105">
-          <caret line="7" column="21" lean-forward="true" selection-end-line="241" />
-        </state>
-      </provider>
-    </entry>
     <entry file="jar://$MAVEN_REPOSITORY$/edu/stanford/nlp/stanford-corenlp/3.8.0/stanford-corenlp-3.8.0-sources.jar!/edu/stanford/nlp/coref/data/Dictionaries.java">
       <provider selected="true" editor-type-id="text-editor">
         <state relative-caret-position="-2418">
@@ -824,13 +875,6 @@
         </state>
       </provider>
     </entry>
-    <entry file="file://$PROJECT_DIR$/src/main/java/edu/stanford/nlp/ling/CustomizableCoreAnnotations.java">
-      <provider selected="true" editor-type-id="text-editor">
-        <state relative-caret-position="915">
-          <caret line="66" column="36" selection-start-line="66" selection-start-column="36" selection-end-line="66" selection-end-column="36" />
-        </state>
-      </provider>
-    </entry>
     <entry file="file://$PROJECT_DIR$/annotation_config.properties">
       <provider selected="true" editor-type-id="text-editor">
         <state relative-caret-position="255">
@@ -838,13 +882,6 @@
         </state>
       </provider>
     </entry>
-    <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/experiment/AnnotatorFactory.java">
-      <provider selected="true" editor-type-id="text-editor">
-        <state relative-caret-position="330">
-          <caret line="26" column="57" selection-start-line="26" selection-start-column="57" selection-end-line="26" selection-end-column="57" />
-        </state>
-      </provider>
-    </entry>
     <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/ESAnnotatedHTMLDocument.java">
       <provider selected="true" editor-type-id="text-editor">
         <state relative-caret-position="1020">
@@ -864,17 +901,55 @@
         </state>
       </provider>
     </entry>
+    <entry file="jar://$MAVEN_REPOSITORY$/edu/stanford/nlp/stanford-corenlp/3.8.0/stanford-corenlp-3.8.0-sources.jar!/edu/stanford/nlp/pipeline/WordsToSentencesAnnotator.java">
+      <provider selected="true" editor-type-id="text-editor">
+        <state relative-caret-position="3180">
+          <caret line="228" selection-start-line="228" selection-end-line="228" />
+        </state>
+      </provider>
+    </entry>
+    <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/TextFileFilter.java">
+      <provider selected="true" editor-type-id="text-editor">
+        <state relative-caret-position="120">
+          <caret line="10" column="13" selection-start-line="10" selection-start-column="13" selection-end-line="10" selection-end-column="13" />
+        </state>
+      </provider>
+    </entry>
+    <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ner/annotation/AnnotatorFactory.java">
+      <provider selected="true" editor-type-id="text-editor">
+        <state relative-caret-position="60">
+          <caret line="8" column="13" selection-start-line="8" selection-start-column="13" selection-end-line="8" selection-end-column="13" />
+        </state>
+      </provider>
+    </entry>
+    <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/experiment/TestReadObject.java">
+      <provider selected="true" editor-type-id="text-editor">
+        <state relative-caret-position="435">
+          <caret line="29" column="71" selection-start-line="29" selection-start-column="71" selection-end-line="29" selection-end-column="71" />
+          <folding>
+            <element signature="imports" expanded="true" />
+          </folding>
+        </state>
+      </provider>
+    </entry>
+    <entry file="file://$PROJECT_DIR$/src/main/java/edu/stanford/nlp/ling/CustomizableCoreAnnotations.java">
+      <provider selected="true" editor-type-id="text-editor">
+        <state relative-caret-position="337">
+          <caret line="66" column="36" selection-start-line="66" selection-start-column="36" selection-end-line="66" selection-end-column="36" />
+        </state>
+      </provider>
+    </entry>
     <entry file="file://$PROJECT_DIR$/pom.xml">
       <provider selected="true" editor-type-id="text-editor">
-        <state relative-caret-position="200">
-          <caret line="22" column="59" lean-forward="true" selection-start-line="22" selection-start-column="59" selection-end-line="22" selection-end-column="59" />
+        <state relative-caret-position="339">
+          <caret line="73" column="27" selection-start-line="73" selection-start-column="27" selection-end-line="73" selection-end-column="27" />
         </state>
       </provider>
     </entry>
     <entry file="file://$PROJECT_DIR$/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java">
       <provider selected="true" editor-type-id="text-editor">
-        <state relative-caret-position="237">
-          <caret line="248" column="10" selection-start-line="248" selection-start-column="10" selection-end-line="248" selection-end-column="10" />
+        <state relative-caret-position="261">
+          <caret line="285" column="77" selection-start-line="285" selection-start-column="77" selection-end-line="285" selection-end-column="77" />
           <folding>
             <element signature="imports" expanded="true" />
           </folding>
diff --git a/EntityAnnotation.iml b/EntityAnnotation.iml
index bd21cd2..eabd5ec 100644
--- a/EntityAnnotation.iml
+++ b/EntityAnnotation.iml
@@ -57,5 +57,6 @@
     <orderEntry type="library" name="Maven: org.codehaus.mojo:animal-sniffer-annotations:1.14" level="project" />
     <orderEntry type="library" name="Maven: com.squareup.okhttp3:okhttp:3.9.1" level="project" />
     <orderEntry type="library" name="Maven: com.squareup.okio:okio:1.13.0" level="project" />
+    <orderEntry type="library" name="Maven: commons-cli:commons-cli:1.3.1" level="project" />
   </component>
 </module>
\ No newline at end of file
diff --git a/pom.xml b/pom.xml
index 4cf1908..2d40515 100644
--- a/pom.xml
+++ b/pom.xml
@@ -67,6 +67,12 @@
             <version>3.12.0</version>
             <scope>compile</scope>
         </dependency>
+        <dependency>
+            <groupId>commons-cli</groupId>
+            <artifactId>commons-cli</artifactId>
+            <version>1.3.1</version>
+            <scope>compile</scope>
+        </dependency>
     </dependencies>
 
 
diff --git a/serialized/kevin.ser b/serialized/kevin.ser
index 5e8587a..efc1bfd 100644
Binary files a/serialized/kevin.ser and b/serialized/kevin.ser differ
diff --git a/src/main/java/org/forward/entitysearch/experiment/TestReadObject.java b/src/main/java/org/forward/entitysearch/experiment/TestReadObject.java
new file mode 100644
index 0000000..a520fbe
--- /dev/null
+++ b/src/main/java/org/forward/entitysearch/experiment/TestReadObject.java
@@ -0,0 +1,33 @@
+package org.forward.entitysearch.experiment;
+
+import edu.stanford.nlp.ling.CoreAnnotations;
+import edu.stanford.nlp.ling.CoreLabel;
+import edu.stanford.nlp.ling.CustomizableCoreAnnotations;
+import org.forward.entitysearch.ingestion.ESAnnotatedHTMLDocument;
+
+import java.io.FileInputStream;
+import java.io.ObjectInputStream;
+
+/** Reads serialized/kevin.ser and prints its token count, per-token word/NER/layout size, and document size. */
+public class TestReadObject {
+    public static void main (String[] args) {
+        ESAnnotatedHTMLDocument doc = null;
+        // try-with-resources closes both streams, even when readObject() throws.
+        try (FileInputStream fin = new FileInputStream("serialized/kevin.ser");
+             ObjectInputStream ois = new ObjectInputStream(fin)) {
+            doc = (ESAnnotatedHTMLDocument) ois.readObject();
+        } catch (Exception e) {
+            e.printStackTrace();
+        }
+        // doc is still null here if reading failed; the stack trace above is the only report.
+        if (doc != null) {
+            System.out.println(doc.get(CoreAnnotations.TokensAnnotation.class).size());
+            for (CoreLabel token : doc.get(CoreAnnotations.TokensAnnotation.class)) {
+                System.out.println(token.word() + " " + token.ner() + " " +
+                        token.get(CustomizableCoreAnnotations.LayoutHeightAnnotation.class) + " " +
+                        token.get(CustomizableCoreAnnotations.LayoutWidthAnnotation.class));
+            }
+            System.out.println(doc.getHeight() + " " + doc.getWidth());
+        }
+    }
+}
diff --git a/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java b/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java
index 8dfa786..bbfdc88 100644
--- a/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java
+++ b/src/main/java/org/forward/entitysearch/ingestion/HTMLDocumentIngestionManager.java
@@ -5,9 +5,10 @@
 import edu.stanford.nlp.ling.CustomizableCoreAnnotations;
 import edu.stanford.nlp.pipeline.Annotation;
 import edu.stanford.nlp.pipeline.PipelineHelper;
+import edu.stanford.nlp.util.Pair;
 import edu.stanford.nlp.util.TypesafeMap;
 import org.forward.entitysearch.AnnotationProperties;
-import org.forward.entitysearch.experiment.AnnotatorFactory;
+import org.forward.entitysearch.ner.annotation.AnnotatorFactory;
 import org.openqa.selenium.By;
 import org.openqa.selenium.Dimension;
 import org.openqa.selenium.Rectangle;
@@ -16,11 +17,16 @@
 import org.openqa.selenium.chrome.ChromeOptions;
 import org.openqa.selenium.remote.RemoteWebElement;
 
-import java.io.FileOutputStream;
-import java.io.IOException;
-import java.io.ObjectOutputStream;
+import java.io.*;
+import java.nio.file.Files;
+import java.nio.file.Path;
+import java.nio.file.Paths;
 import java.util.ArrayList;
 import java.util.List;
+import java.util.stream.Collectors;
+import java.util.stream.Stream;
+
+import org.apache.commons.cli.*;
 
 public class HTMLDocumentIngestionManager {
 
@@ -210,43 +216,118 @@ private static List<CoreLabel> tokenizeText(String txt) {
 
     public static void main(String[] args) {
 
+        // Reads "<output name>\t<url>" pairs from the -i file, then downloads, annotates and
+        // serializes each page to <-o folder>/<output name>.ser; -v <true|false> adds debug output.
+        Options options = new Options();
+        Option input = new Option("i", "input", true, "input file with one <name>TAB<url> pair per line");
+        input.setRequired(true);
+        options.addOption(input);
+
+        Option output = new Option("o", "output", true, "output folder for serialized files");
+        output.setRequired(true);
+        options.addOption(output);
+
+        Option verbose = new Option("v", "verbose", true, "print additional message for debugging");
+        verbose.setRequired(false);
+        options.addOption(verbose);
+
+        CommandLineParser parser = new DefaultParser();
+        HelpFormatter formatter = new HelpFormatter();
+        CommandLine cmd;
+
+        try {
+            cmd = parser.parse(options, args);
+        } catch (ParseException e) {
+            System.out.println(e.getMessage());
+            formatter.printHelp("utility-name", options);
+            System.exit(1);
+            return;
+        }
+
+        boolean VERBOSE = false;
+        if (cmd.hasOption("verbose"))
+            VERBOSE = Boolean.parseBoolean(cmd.getOptionValue("verbose"));
+        String inputFile = cmd.getOptionValue("input");
+        String outputFolder = cmd.getOptionValue("output");
+
+        List<Pair<String,String>> urls = new ArrayList<>();
+
+        // Lines without a tab-separated second field are skipped instead of failing on tmp[1].
+        try (BufferedReader br = new BufferedReader(new FileReader(inputFile))) {
+            String line;
+            while ((line = br.readLine()) != null) {
+                String[] tmp = line.split("\t");
+                if (tmp.length < 2) {
+                    System.err.println("Skipping malformed input line: " + line);
+                    continue;
+                }
+                urls.add(new Pair<>(tmp[0],tmp[1]));
+            }
+        } catch (IOException e) {
+            e.printStackTrace();
+        }
+
         long time = System.currentTimeMillis();
         long start = time;
-        String baseUrl = "http://www.forwarddatalab.org/kevinchang";
         WebDriver driver = createChromeDriver();
 //        System.out.println(getAllTextWithLayout(driver,baseUrl));
-        System.out.println("After creating driver " + (System.currentTimeMillis()-time));
         time = System.currentTimeMillis();
+        System.out.println("Finish loading web driver " + (time-start)/1000 + " seconds");
+        start = time;
+
         AnnotatorFactory.getInstance().getAnnotationPipeline();
-        System.out.println("After loading the default annotation pipeline " + (System.currentTimeMillis()-time));
-        time = System.currentTimeMillis();
-        ESAnnotatedHTMLDocument document = getHTMLDocumentForAnnotation(baseUrl, driver);
-        System.out.println("After creating document for annotation " + (System.currentTimeMillis()-time));
         time = System.currentTimeMillis();
+        System.out.println("Finish loading the default annotation pipeline " + (time-start)/1000 + " seconds");
+        start = time;
+
         List<Class<? extends TypesafeMap.Key<String>>> fields = PipelineHelper.addPopularRegexRuleAnnotators(AnnotatorFactory.getInstance().getAnnotationPipeline());
-        System.out.println("After loading extra components for annotation pipeline " + (System.currentTimeMillis()-time));
         time = System.currentTimeMillis();
-        AnnotatorFactory.getInstance().getAnnotationPipeline().annotate(document);
-        System.out.println("After annotation " + (System.currentTimeMillis()-time));
-        System.out.println("Total time: " + (System.currentTimeMillis() - start));
-        System.out.println(document.getTitle());
-        System.out.println(document.getURL());
-        System.out.println(document.getHeight() + " " + document.getWidth());
-        try {
-            FileOutputStream fileOut =
-                    new FileOutputStream("serialized/kevin.ser");
-            ObjectOutputStream out = new ObjectOutputStream(fileOut);
-            out.writeObject(document);
-            out.close();
-            fileOut.close();
-            System.out.printf("Serialized data is saved in serialized/kevin.ser");
-        } catch (IOException i) {
-            i.printStackTrace();
+        System.out.println("Finish loading extra annotators " + (time-start)/1000 + " seconds");
+        start = time;
+
+        System.out.println("Ready to download and annotate HTML documents");
+        System.out.println("----------------------------------------------");
+
+        for (int i = 0; i < urls.size(); i++) {
+            String filename = urls.get(i).first;
+            String baseUrl = urls.get(i).second;
+            System.out.println(i + "\t" +  baseUrl);
+            // Restart the clock so the previous document's serialization/printing is not counted.
+            start = System.currentTimeMillis();
+            ESAnnotatedHTMLDocument document = getHTMLDocumentForAnnotation(baseUrl, driver);
+            time = System.currentTimeMillis();
+            System.out.println("Finish creating document for annotation " + (time-start)/1000 + " seconds");
+            start = time;
+
+            AnnotatorFactory.getInstance().getAnnotationPipeline().annotate(document);
+            time = System.currentTimeMillis();
+            System.out.println("Finish annotation " + (time-start)/1000 + " seconds");
+            start = time;
+
+            // Paths.get inserts the separator, so "-o out" and "-o out/" name the same folder.
+            String path = Paths.get(outputFolder, filename + ".ser").toString();
+            try {
+                // try-with-resources closes both streams even when writeObject throws.
+                try (FileOutputStream fileOut = new FileOutputStream(path);
+                     ObjectOutputStream out = new ObjectOutputStream(fileOut)) {
+                    out.writeObject(document);
+                }
+                if (VERBOSE)
+                    System.out.println("Serialized data is saved to " + path);
+            } catch (IOException e) {
+                e.printStackTrace();
+            }
+            time = System.currentTimeMillis();
+            if (VERBOSE) {
+                System.out.println("Finish serialization " + (time-start)/1000 + " seconds");
+                System.out.println("Done with " + document.getTitle() + " with size " + document.getHeight() + " " + document.getWidth());
+                printAnnotatedDocument(document);
+                PipelineHelper.printAnnotatedDocument(document, fields);
+            }
         }
-        time = System.currentTimeMillis();
-        printAnnotatedDocument(document);
-//        PipelineHelper.printAnnotatedDocument(document, fields);
-        System.out.println("After printing results " + (System.currentTimeMillis()-time));
+
+        driver.close();
+
 //        time = System.currentTimeMillis();
 //        start = time;
 //        document = getHTMLDocumentForAnnotation("https://cs.illinois.edu/directory/profile/kcchang", driver);
@@ -260,7 +341,6 @@ public static void main(String[] args) {
 //        System.out.println("After printing results " + (System.currentTimeMillis()-time));
 
 //        printAnnotatedDocument(document);
-        driver.close();
 
         // List<WebElement> el = driver.findElements(By.cssSelector("*"));
         // It is not working because it will miss text nodes
@@ -313,7 +393,6 @@ public static void main(String[] args) {
     private static ESAnnotatedHTMLDocument getHTMLDocumentForAnnotation(String url, WebDriver driver) {
         driver.get(url);
         String pageTitle = driver.getTitle();
-        System.out.println(url + " " + pageTitle);
         List<CoreLabel> allTokens = new ArrayList<>();
         RemoteWebElement e = (RemoteWebElement) driver.findElement(By.xpath("/html/body"));
         travelDOMTreeWithSelenium(e,null,allTokens, driver);
diff --git a/src/main/java/org/forward/entitysearch/experiment/AnnotatorFactory.java b/src/main/java/org/forward/entitysearch/ner/annotation/AnnotatorFactory.java
similarity index 97%
rename from src/main/java/org/forward/entitysearch/experiment/AnnotatorFactory.java
rename to src/main/java/org/forward/entitysearch/ner/annotation/AnnotatorFactory.java
index c8663c7..e95517b 100644
--- a/src/main/java/org/forward/entitysearch/experiment/AnnotatorFactory.java
+++ b/src/main/java/org/forward/entitysearch/ner/annotation/AnnotatorFactory.java
@@ -1,4 +1,4 @@
-package org.forward.entitysearch.experiment;
+package org.forward.entitysearch.ner.annotation;
 
 import edu.stanford.nlp.ling.CustomizableCoreAnnotations;
 import edu.stanford.nlp.pipeline.*;
diff --git a/test_urls.csv b/test_urls.csv
new file mode 100644
index 0000000..a96ef23
--- /dev/null
+++ b/test_urls.csv
@@ -0,0 +1,2 @@
+0	http://www.forwarddatalab.org/kevinchang
+1	http://www.forwarddatalab.org/research