Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
11 changes: 11 additions & 0 deletions PageSegmentation_Workflow.html
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
<!--[if IE]><meta http-equiv="X-UA-Compatible" content="IE=5,IE=9" ><![endif]-->
<!DOCTYPE html>
<html>
<head>
<title>Untitled Diagram</title>
<meta charset="utf-8"/>
</head>
<body><div class="mxgraph" style="max-width:100%;border:1px solid transparent;" data-mxgraph="{&quot;highlight&quot;:&quot;#0000ff&quot;,&quot;nav&quot;:true,&quot;resize&quot;:true,&quot;toolbar&quot;:&quot;zoom layers lightbox&quot;,&quot;edit&quot;:&quot;_blank&quot;,&quot;xml&quot;:&quot;&lt;mxfile userAgent=\&quot;Mozilla/5.0 (Macintosh; Intel Mac OS X 10_12_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36\&quot; version=\&quot;7.3.9\&quot; editor=\&quot;www.draw.io\&quot; type=\&quot;google\&quot;&gt;&lt;diagram id=\&quot;74e2e168-ea6b-b213-b513-2b3c1d86103e\&quot; name=\&quot;Page-1\&quot;&gt;7V1fc5u4Fv80ntl9SAYhwPixTpO9O9Pt7iS997aPMsg2LUZewE2yn34lQLaRBCa2ZHASPyRGCEno/M7R+Sd5BG9WT7+laL38g4Q4HtlW+DSCH0e2PXE8+pcVPJcFruuUBYs0CssisCt4iP7BVaFVlW6iEGe1ijkhcR6t64UBSRIc5LUylKbksV5tTuJ6r2u0wFLBQ4BiufT/UZgvy1LftXbl/8HRYsl7BlZ1Z4V45aogW6KQPO4VwdsRvEkJyctvq6cbHLO54/NSPnfXcHc7sBQneZcHxmPsBZPxHEy8EPk+vKpa+IniTfWy95vkL/b6eLGijaI8Ikk19vyZT0j2GK1ilNCr6TJfxbQQ0K/BMorDT+iZbNhYshwFP/jVlF6leUVZOkY4TckmCTEbFrvazgu7iNEMx1P69KKodENiktJbCSk6zPKU/MC8cGRDq/hs73AKsRHNozjeqzkvPqycJPkdWkUxA+T/cBqiBFXF1Rj96lLVD4qjRULLAjo/mN6cVnOI0xw/NRIGbMlN2QSTFc7TZ1qlemBcAaTiEKe6fNzBDficHZZ7WBtzEKIK44tt09ve7ilPoGRBifeC7lxFZ7bQF4rp+ycox1NGp2wfefTL3mvuigo8dsSmLWFzhaKuYJQA14lIav6QqfZcn5D9eRurqARfRqXm5ju1rpcuFPmOj60ZhLbjwrl1BSW6jGwvziuOqRHH+3tD+I2rrKDGB1oBwPXT7ib9tmD/r7+vF/Qm5Tfbus4jyqh3vGE6xrLtsqaEgXRJVrMNff3p4zLK8cMaBezOI12O6rB4c2JHzVWNcsj2nJpkAK6MQV+BQa8F4DXsvQRoYGIKafVmysL8KW+C2zsQzw5EAMY1IPaJQ/d0GNoqGH4iKKQ3H6JK7P++Yoook/oeWjG8lH9ZB6U2VlT45dfOYKxh7AAgFcRXQMQEqR27ro2oZA6wz0Vs73RiOypi3+OC2PmSUTiOsjwr/ifscva8/W6Isoe53chq4tRXk3MSVh6qTNlvtw/S1OKQGj/VJUnzJVmQBMW3u9I90Q3qE31IcFON9AMzR4Wyu4i9RLkO7GmtLr3GScifCGKUZVHwZUlV4OJG9Rgor/Ye+o7z/Lm6Rpuc0KLdi3wiZL1VkV+wkpy0YuCnKP/Kx0q/f2Ove12+ICXr1+rti4vdvZI0jB4vxCOlJ9mkAT6gVtC5XuC8oZLXCuwr6xrSTw3cV9w+S3FMzeaf9VG3aP5/kagQLJxpBHHoC8xQvlv10L6tL7bjtLdTvr7UDsUbet6rtmYVMnVPvA6ZzzNca0WHneFL/Pr5z5PY1aqza1c+6Yb9NiRz/O+uvlVt94px2IpxNtjasqwH3sAXVntwJL6lh
ianAryhH7euifJ+d0gvWzwrbwBHXsxwdpncYYoHYAcWcNUscCLGHWgpIaMbmg5Q99PEMgfq16GsBaYqbfodo5K10QdGXc3qgbobOHFV3TQhVKxuHKG2LEj1+Jg+4QUK2EwFJHxtdh0QsKPyVJ/PYvc1mOxAbbJnRRCQGuhRgooJ2LpmklnG/lHw4iSLcnaPyh+bRf7ubNft0UUjOv38AAeBytyb+S4TAoacOsJSo7T9HQVE2gJax0NkfEHrkKm1xu2w1vgNdm/nxeZ4Esnmnh5BHJCEQZsFtb+QhyRar3GevTonKvTq/OZZCn6bGOI3aaxyiHDfgy3NcR8h3KoFVwiFK1YyRxULbw3pHs0ECh+lHiYoFjBap0rruED4tzsrAJzU9UZPAX8IZDo6RshoSpbNo8KtvFkl0xSjH5coxtrpCC3rMB1VaoMROnJQGdQsy3jQANVII1wquKTHKiY9l05oq4j7mnRC2EEntLs4IEpx1odSCDVY50oGvI6SqLz/GeNwWq6OUbIoTbyig1m6y//4WPRgfbn/7+2wk0G2Nt3hZBBuFw4iGeSA3BAWBVV6pKWQG6JPSw8m5XSQU+PIFyk6OG+2i46DcVS9QSazURcouxE+k+FSfufQ3sXaeeBRb0hSH14alpo9vEBfK2K4HSiYgYaCiYKVztXWRne4aJ3W6/cTe+TS911xOoTm0n7oQ3GyVTmLQ6WR7sAb6EC/Ls7QUmJpj7x5QoKPZN5okjWya6td2Byorz/25qh2EgwVpKaAyH1FrUh0Gpy/2gUJmLkwwDBkDqiJN3au9JKkORHQkEQBZ5QoXVYE/1RTWs26Y0F9GYtJVbpyoTzBgwM9u1WmSA/wkTU9MBmfVt9zXK1CS2YIrh28M0SdIaSZ4lt1e+CHiZCAtV1yTfOD407eGj+4JvjBunx+8CwYTizgIhsHljMZX8EeFwhPcKF5Yvjy6GxwHTt9ZS+vGOiSMNZjyBhYogKv2KerCrW/dBswZ2nRNyF3t/Ur9Lkv2LElMuqJet5RMLD3ZU70EhQj1Sa5WYyCH/z+UNKvQhf7oaNy1fv2DHre0RhtsE355g/BSabKvoK2jBkjCXqOzN96gHGPV+Qn4xS2tpSUZ7vqfnmMcrZNij7GTFhr/dRnmHyQgLBhr4C4JO/UMeqAI6sDjeKy3fA/1QV1PI1MpSLd43m56xWF3xELG6oYd+xu+baWb/vOx3U+hsDuk49fe1ptJz7uEtdyesur5Su/fj7eFEoqKOuMmF/EIvMR2/Cwr7dbrGXWuGW9501oz5toFxZgUt+6CK2xLC1cqDAdjByjIR829galRacdX1Zv0sLUqv/A4tD7omHUlGlF1QB652ZUnctXgXVAGryxHTXtzCwekwJ5m/vMrPIDcEVT7zEpqqVf47ICyzq/7xaUbN/or2hfpc+WQBns4nKpJzQd0ESFVG0XKExK1dYJM8f2mDorrMKjU9YpoVhQ8CEPP+KfKlAWb/2Oxn7ROOmIRh2qjuTqlz2hgz6dwZSyw+e7Xdk5mCLqjC2vRlxu9A4iS1QiPtBwXlybKLI7W1x0Rqw/74tHhiuPXqfpJcojx3J6lEeKnPUhJy6bkkdcaW0/+ashaXN7LBJdXOonf42HLI2gKYuuUM0TwgnFpRAbCxNCcwaV0o6Lkozy1lZbrxmBF3Yuxoucs8o92CrnrI79bTLhL2uzgjGeV5yE1sAkfeRXqnxifflbliiev3teDnteHKBYy1WeFx18LSFGDqa/RbZWmRYNmngfbC3L3kEbgLp3YCgo2Ggm7VNQLR61Z8PBicDQfKN/H9lw8jvL3oM3wOGd8NGg0feycCu2Aetl8eNOTR4kcTtZYvIUNxB35xnybVCN6NTTEEFddXdFM1zbcYiCm/LQBlCxfg+HzzbQxYDS+htOcIpypnriNC1+CGaVLa4HpIByj3izV/0cCqirOhVHGfozoYAC+XSjs0m+i1N7Otmjx0i+rSPhZMmnljCmJZ9n1zamD
FLyyecZm5J8H9JFNuyTZS4kbNi+daPp7Pk+flWIy/RLsRE7CMQu22RBFx88aPfBU/ln1wh58m9vmBUbtrzRfcgWnbGfstCGD9vMyQxA0LNMncwg9gNBy9p2GID0cvcTsmX13e/wwtt/AQ==&lt;/diagram&gt;&lt;/mxfile&gt;&quot;}"></div>
<script type="text/javascript" src="https://www.draw.io/js/viewer.min.js"></script>
</body>
</html>
1 change: 1 addition & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -111,3 +111,4 @@ All output files created by the program are created in the data directory:
## Notes ##
* If using an IDE, run the command-line script before running the file in
the IDE.
* If you want to skip the binarization step because the images are already binarized (e.g., .tiff files), set NeedBinarizing=FALSE in the user.ini file.
2 changes: 1 addition & 1 deletion RunAll.sh
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ echo "AIDA: Poem Identifier"

cd data/
find Output_Snippets/ -type f > snippetPathList.txt
find Output_Snippets/ -not -path '*/\.*' -type f -printf "%f\n" > SnippetNameList.txt
find Output_Snippets/ -not -path '*/\.*' -type f -name '*.jpg' -exec basename {} \; > SnippetNameList.txt;
cd ../
NOME=$1
c=0
Expand Down
5 changes: 3 additions & 2 deletions RunPageSegmentation.sh
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
#!/bin/bash
cd src/
javac execute/RunPageSegmentation.java
javac -cp ../tif_jar/jai_imageio.jar:./ execute/RunPageSegmentation.java
cd ../

beginYear=$1
Expand All @@ -22,7 +22,8 @@ for i in $( ls ); do
totalCount=$((totalCount + 1))
current=$(pwd)
cd $src
java execute/RunPageSegmentation $current/$k
#java execute/RunPageSegmentation $current/$k
java -cp ../tif_jar/jai_imageio.jar:./ execute/RunPageSegmentation $current/$k
cd $current
done
cd ..
Expand Down
Binary file not shown.
Empty file added data/SnippetNameList.txt
Empty file.
1 change: 1 addition & 0 deletions data/snippetPathList.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
Output_Snippets//.keep
Loading