├── dict
    ├── user.dic
    ├── en_US.dic
    ├── vi_VN.aff
    └── en_US.aff
├── tessdata
    ├── configs
    │   ├── quiet
    │   ├── digits
    │   ├── pdf
    │   ├── tsv
    │   ├── unlv
    │   ├── hocr
    │   ├── bazaar
    │   ├── txt
    │   ├── tess_configvars
    │   └── tess_configs
    ├── pdf.ttf
    ├── eng.traineddata
    ├── osd.traineddata
    └── vie.traineddata
├── .tx
    ├── update-l10n.sh
    └── config
├── Hunspellx64.dll
├── Hunspellx86.dll
├── Icons
    └── fatcow
    │   ├── find.png
    │   ├── ocr.png
    │   ├── open.png
    │   ├── save.png
    │   ├── scan.png
    │   ├── tools.png
    │   ├── cancel.png
    │   ├── gear_in.png
    │   ├── zoom_in.png
    │   ├── ocr_small.png
    │   ├── rotate_ccw.png
    │   ├── rotate_cw.png
    │   ├── zoom_fit.png
    │   ├── zoom_out.png
    │   ├── draw_eraser.png
    │   ├── image_paste.png
    │   ├── zoom_actual.png
    │   ├── pilcrow_delete.png
    │   ├── inline_spellcheck.png
    │   ├── document_page_next.png
    │   └── document_page_previous.png
├── Library
    ├── Tesseract.dll
    ├── Tesseract.pdb
    ├── VietKeyInput.dll
    ├── MultiComboBox.dll
    ├── MultiComboBox.pdb
    └── ICSharpCode.SharpZipLib.dll
├── Resources
    └── VietOCR.ico
├── samples
    ├── vietsample.tif
    ├── vietsample1.pdf
    ├── vietsample1.tif
    ├── vietsample2.png
    └── vietsample2.tif
├── x64
    ├── libleptonica1860.dll
    └── libtesseract551.dll
├── x86
    ├── libleptonica1860.dll
    └── libtesseract551.dll
├── packages.config
├── Properties
    ├── Settings.settings
    ├── Settings.Designer.cs
    └── AssemblyInfo.cs
├── .project
├── VietOCR.csproj.user
├── Data
    ├── san.DangAmbigs.txt
    ├── slk.DangAmbigs.txt
    ├── ces.DangAmbigs.txt
    ├── eng.DangAmbigs.txt
    ├── vie.DangAmbigs.txt
    └── ISO639-1.xml
├── App.config
├── .gitignore
├── App.xaml
├── Test
    ├── ConsoleAppTests.cs
    ├── Properties
    │   └── AssemblyInfo.cs
    ├── Utilities
    │   └── PdfUtilitiesTests.cs
    ├── obj
    │   └── Release
    │   │   └── DesignTimeResolveAssemblyReferencesInput.cache
    ├── app.config
    ├── packages.config
    └── .vs
    │   └── VietOCRTests.csproj.dtbcache.json
├── ProcessingOptions.cs
├── Utilities
    ├── VietUtilities.cs
    ├── FixedSizeStack.cs
    ├── ImageConverter.cs
    ├── Utilities.cs
    ├── BreakIterator.cs
    ├── Watcher.cs
    ├── FileExtractor.cs
    └── FormLocalizer.cs
├── StatusForm.xaml
├── HtmlHelpDialog.xaml
├── Postprocessing
    ├── IPostProcessor.cs
    ├── EngPP.cs
    ├── ProcessorFactory.cs
    ├── TextUtilities.cs
    ├── Processor.cs
    └── ViePP.cs
├── Controls
    ├── MoveThumb.cs
    ├── ResizeThumb.cs
    └── RedUnderlineAdorner.cs
├── StatusForm.xaml.cs
├── SplitPdfArgs.cs
├── SliderDialog.xaml
├── ChangeCaseDialog.xaml.cs
├── README.md
├── HtmlHelpDialog.xaml.cs
├── ChangeCaseDialog.xaml
├── DownloadDialog.xaml
├── WIA
    ├── WiaOperationException.cs
    └── WiaScannerAdapter.cs
├── VietOCR.sln
├── App.xaml.cs
├── SliderDialog.xaml.cs
├── DataSource.cs
├── ImageInfoDialog.xaml.cs
├── GuiWithInputMethod.cs
├── OCRHelper.cs
├── GuiWithUILanguage.cs
├── GuiWithOEM.cs
├── ConsoleApp.cs
├── BulkDialog.xaml
├── SplitPdfDialog.xaml
├── ImageInfoDialog.xaml
├── GuiWithRegistry.cs
├── GuiWithBatch.cs
├── GuiWithScan.cs
├── SplitPdfDialog.xaml.cs
├── FindReplaceDialog.xaml.cs
├── GuiWithPSM.cs
├── DownloadDialog.vi.resx
├── GuiWithThumbnail.cs
├── FindReplaceDialog.xaml
└── readme_cs_ja.html


/dict/user.dic:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/tessdata/configs/quiet:
--------------------------------------------------------------------------------
1 | debug_file /dev/null
2 | 


--------------------------------------------------------------------------------
/tessdata/configs/digits:
--------------------------------------------------------------------------------
1 | tessedit_char_whitelist 0123456789-.
2 | 


--------------------------------------------------------------------------------
/.tx/update-l10n.sh:
--------------------------------------------------------------------------------
1 | #!/bin/sh
2 | 
3 | tx pull -a -f --minimum-perc 75
4 | 


--------------------------------------------------------------------------------
/tessdata/configs/pdf:
--------------------------------------------------------------------------------
1 | tessedit_create_pdf 1
2 | tessedit_pageseg_mode 1
3 | 


--------------------------------------------------------------------------------
/tessdata/configs/tsv:
--------------------------------------------------------------------------------
1 | tessedit_create_tsv 1
2 | tessedit_pageseg_mode 1
3 | 


--------------------------------------------------------------------------------
/tessdata/configs/unlv:
--------------------------------------------------------------------------------
1 | tessedit_write_unlv 1
2 | tessedit_pageseg_mode 6
3 | 


--------------------------------------------------------------------------------
/dict/en_US.dic:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/dict/en_US.dic


--------------------------------------------------------------------------------
/Hunspellx64.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Hunspellx64.dll


--------------------------------------------------------------------------------
/Hunspellx86.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Hunspellx86.dll


--------------------------------------------------------------------------------
/tessdata/pdf.ttf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/tessdata/pdf.ttf


--------------------------------------------------------------------------------
/Icons/fatcow/find.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/find.png


--------------------------------------------------------------------------------
/Icons/fatcow/ocr.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/ocr.png


--------------------------------------------------------------------------------
/Icons/fatcow/open.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/open.png


--------------------------------------------------------------------------------
/Icons/fatcow/save.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/save.png


--------------------------------------------------------------------------------
/Icons/fatcow/scan.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/scan.png


--------------------------------------------------------------------------------
/Icons/fatcow/tools.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/tools.png


--------------------------------------------------------------------------------
/Library/Tesseract.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Library/Tesseract.dll


--------------------------------------------------------------------------------
/Library/Tesseract.pdb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Library/Tesseract.pdb


--------------------------------------------------------------------------------
/Resources/VietOCR.ico:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Resources/VietOCR.ico


--------------------------------------------------------------------------------
/samples/vietsample.tif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/samples/vietsample.tif


--------------------------------------------------------------------------------
/tessdata/configs/hocr:
--------------------------------------------------------------------------------
1 | tessedit_create_hocr 1
2 | tessedit_pageseg_mode 1
3 | hocr_font_info 0
4 | 


--------------------------------------------------------------------------------
/Icons/fatcow/cancel.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/cancel.png


--------------------------------------------------------------------------------
/Icons/fatcow/gear_in.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/gear_in.png


--------------------------------------------------------------------------------
/Icons/fatcow/zoom_in.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/zoom_in.png


--------------------------------------------------------------------------------
/Library/VietKeyInput.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Library/VietKeyInput.dll


--------------------------------------------------------------------------------
/samples/vietsample1.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/samples/vietsample1.pdf


--------------------------------------------------------------------------------
/samples/vietsample1.tif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/samples/vietsample1.tif


--------------------------------------------------------------------------------
/samples/vietsample2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/samples/vietsample2.png


--------------------------------------------------------------------------------
/samples/vietsample2.tif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/samples/vietsample2.tif


--------------------------------------------------------------------------------
/tessdata/eng.traineddata:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/tessdata/eng.traineddata


--------------------------------------------------------------------------------
/tessdata/osd.traineddata:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/tessdata/osd.traineddata


--------------------------------------------------------------------------------
/tessdata/vie.traineddata:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/tessdata/vie.traineddata


--------------------------------------------------------------------------------
/x64/libleptonica1860.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/x64/libleptonica1860.dll


--------------------------------------------------------------------------------
/x64/libtesseract551.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/x64/libtesseract551.dll


--------------------------------------------------------------------------------
/x86/libleptonica1860.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/x86/libleptonica1860.dll


--------------------------------------------------------------------------------
/x86/libtesseract551.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/x86/libtesseract551.dll


--------------------------------------------------------------------------------
/Icons/fatcow/ocr_small.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/ocr_small.png


--------------------------------------------------------------------------------
/Icons/fatcow/rotate_ccw.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/rotate_ccw.png


--------------------------------------------------------------------------------
/Icons/fatcow/rotate_cw.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/rotate_cw.png


--------------------------------------------------------------------------------
/Icons/fatcow/zoom_fit.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/zoom_fit.png


--------------------------------------------------------------------------------
/Icons/fatcow/zoom_out.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/zoom_out.png


--------------------------------------------------------------------------------
/Library/MultiComboBox.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Library/MultiComboBox.dll


--------------------------------------------------------------------------------
/Library/MultiComboBox.pdb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Library/MultiComboBox.pdb


--------------------------------------------------------------------------------
/Icons/fatcow/draw_eraser.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/draw_eraser.png


--------------------------------------------------------------------------------
/Icons/fatcow/image_paste.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/image_paste.png


--------------------------------------------------------------------------------
/Icons/fatcow/zoom_actual.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/zoom_actual.png


--------------------------------------------------------------------------------
/Icons/fatcow/pilcrow_delete.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/pilcrow_delete.png


--------------------------------------------------------------------------------
/Icons/fatcow/inline_spellcheck.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/inline_spellcheck.png


--------------------------------------------------------------------------------
/Icons/fatcow/document_page_next.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/document_page_next.png


--------------------------------------------------------------------------------
/Library/ICSharpCode.SharpZipLib.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Library/ICSharpCode.SharpZipLib.dll


--------------------------------------------------------------------------------
/Icons/fatcow/document_page_previous.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/nguyenq/VietOCRwpf/HEAD/Icons/fatcow/document_page_previous.png


--------------------------------------------------------------------------------
/tessdata/configs/bazaar:
--------------------------------------------------------------------------------
1 | load_system_dawg     F
2 | load_freq_dawg       F
3 | user_words_suffix    user-words
4 | user_patterns_suffix user-patterns
5 | 


--------------------------------------------------------------------------------
/tessdata/configs/txt:
--------------------------------------------------------------------------------
1 | # This config file should be used with other config files which create renderers.
2 | # usage example: tesseract eurotext.tif eurotext txt hocr pdf
3 | tessedit_create_txt 1
4 | 


--------------------------------------------------------------------------------
/packages.config:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <packages>
3 |   <package id="NHunspell" version="1.2.5554.16953" targetFramework="net461" />
4 |   <package id="Tesseract" version="5.2.0" targetFramework="net48" />
5 | </packages>


--------------------------------------------------------------------------------
/Properties/Settings.settings:
--------------------------------------------------------------------------------
1 | <?xml version='1.0' encoding='utf-8'?>
2 | <SettingsFile xmlns="uri:settings" CurrentProfile="(Default)">
3 |   <Profiles>
4 |     <Profile Name="(Default)" />
5 |   </Profiles>
6 |   <Settings />
7 | </SettingsFile>


--------------------------------------------------------------------------------
/.project:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <projectDescription>
 3 | 	<name>VietOCRwpf</name>
 4 | 	<comment></comment>
 5 | 	<projects>
 6 | 	</projects>
 7 | 	<buildSpec>
 8 | 	</buildSpec>
 9 | 	<natures>
10 | 	</natures>
11 | </projectDescription>
12 | 


--------------------------------------------------------------------------------
/VietOCR.csproj.user:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <Project ToolsVersion="14.0" xmlns="http://schemas.microsoft.com/developer/msbuild/2003">
3 |   <PropertyGroup>
4 |     <ProjectView>ProjectFiles</ProjectView>
5 |   </PropertyGroup>
6 | </Project>


--------------------------------------------------------------------------------
/Data/san.DangAmbigs.txt:
--------------------------------------------------------------------------------
1 | # Plain replaces. Character "0" in the first column indicates a plain replace. Delimiter is <TAB> (\t) character.
2 | 0	अा	आ
3 | 0	श्ा	श
4 | 0	ण्ा	ण
5 | 0	हाा	हा
6 | 
7 | # Regular expression replaces. Character "1" in the first column indicates a regex replace. Delimiter is <TAB> (\t) character.


--------------------------------------------------------------------------------
/Data/slk.DangAmbigs.txt:
--------------------------------------------------------------------------------
 1 | # Plain replaces. Character "0" in the first column indicates a plain replace. Delimiter is <TAB> (\t) character.
 2 | 0	iii	m
 3 | 0	l<	k
 4 | 0	lx	h
 5 | 0	xn	m
 6 | 0	 - 	—
 7 | 0	l'	ľ
 8 | 0	d'	ď
 9 | 0	t'	ť
10 | 
11 | # Regular expression replaces. Character "1" in the first column indicates a regex replace. Delimiter is <TAB> (\t) character.


--------------------------------------------------------------------------------
/App.config:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <configuration>
 3 |   <appSettings>
 4 |     <add key="TessVersion" value="5.5.1"/>
 5 |     <add key="ReleaseDate" value="2025-09-27"/>
 6 |     <add key="Version" value="v6.15.1"/>
 7 |   </appSettings>
 8 |   <startup>
 9 |     <supportedRuntime version="v4.0" sku=".NETFramework,Version=v4.8"/>
10 |   </startup>
11 | </configuration>
12 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
 1 | ################################################################################
 2 | # This .gitignore file was automatically created by Microsoft(R) Visual Studio.
 3 | ################################################################################
 4 | 
 5 | /bin
 6 | /obj
 7 | *.suo
 8 | /Setup/Debug
 9 | /Setup/Release
10 | /.vs
11 | /packages
12 | /TestResults
13 | /Test/bin
14 | /Test/obj
15 | 


--------------------------------------------------------------------------------
/App.xaml:
--------------------------------------------------------------------------------
 1 | <Application x:Class="VietOCR.App"
 2 |              xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |              xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |              xmlns:local="clr-namespace:VietOCR"
 5 |              ShutdownMode="OnMainWindowClose">
 6 |     <Application.Resources>
 7 |          
 8 |     </Application.Resources>
 9 | </Application>
10 | 


--------------------------------------------------------------------------------
/tessdata/configs/tess_configvars:
--------------------------------------------------------------------------------
1 | # This text file contains non-init control parameters, specifically non-init variables, to modify Tesseract engine's behaviour.
2 | # https://code.google.com/p/tesseract-ocr/wiki/ControlParams
3 | # http://www.sk-spell.sk.cx/tesseract-ocr-parameters-in-302-version
4 | # Each key/value pair, delimited by spaces, takes one line. Comment lines start with # sign.
5 | # Ex:
6 | #tessedit_char_whitelist 0123456789-.


--------------------------------------------------------------------------------
/Test/ConsoleAppTests.cs:
--------------------------------------------------------------------------------
 1 | using Microsoft.VisualStudio.TestTools.UnitTesting;
 2 | using System.IO;
 3 | using System.Security.AccessControl;
 4 | using VietOCR;
 5 | 
 6 | namespace UnitTest
 7 | {
 8 |     /// <summary>
 9 |     /// Tests for the <c>ConsoleApp</c> command-line entry point.
10 |     /// </summary>
11 |     [TestClass]
12 |     public sealed class ConsoleAppTests
13 |     {
14 |         /// <summary>
15 |         /// Invokes <c>ConsoleApp.Main</c> with a sample image, the output base name "out",
16 |         /// language "vie" and the "pdf_textonly" argument, then checks that "out.pdf" exists.
17 |         /// </summary>
18 |         [TestMethod]
19 |         public void MainTest()
20 |         {
21 |             const string outputFile = "out.pdf";
22 | 
23 |             // Remove any artifact left by a previous run so the assertion below can only
24 |             // pass if this invocation produced the file. File.Delete does not throw when
25 |             // the file is absent.
26 |             File.Delete(outputFile);
27 | 
28 |             string[] args = { "samples/vietsample.tif", "out", "-l", "vie", "pdf_textonly" };
29 |             ConsoleApp.Main(args);
30 |             Assert.IsTrue(File.Exists(outputFile));
31 |         }
32 |     }
33 | }
34 | 


--------------------------------------------------------------------------------
/Test/Properties/AssemblyInfo.cs:
--------------------------------------------------------------------------------
 1 | using System.Reflection;
 2 | using System.Runtime.CompilerServices;
 3 | using System.Runtime.InteropServices;
 4 | 
 5 | [assembly: AssemblyTitle("UnitTest")]
 6 | [assembly: AssemblyDescription("")]
 7 | [assembly: AssemblyConfiguration("")]
 8 | [assembly: AssemblyCompany("")]
 9 | [assembly: AssemblyProduct("UnitTest")]
10 | [assembly: AssemblyCopyright("Copyright ©  2025")]
11 | [assembly: AssemblyTrademark("")]
12 | [assembly: AssemblyCulture("")]
13 | 
14 | [assembly: ComVisible(false)]
15 | 
16 | [assembly: Guid("61e5e263-898a-4bb0-b099-b7194bc58529")]
17 | 
18 | // [assembly: AssemblyVersion("1.0.*")]
19 | [assembly: AssemblyVersion("1.0.0.0")]
20 | [assembly: AssemblyFileVersion("1.0.0.0")]
21 | 


--------------------------------------------------------------------------------
/ProcessingOptions.cs:
--------------------------------------------------------------------------------
 1 | using System;
 2 | using System.Collections.Generic;
 3 | using System.Linq;
 4 | using System.Text;
 5 | using System.Threading.Tasks;
 6 | 
 7 | namespace VietOCR
 8 | {
 9 |     public class ProcessingOptions // Settings holder: eight boolean switches and one string path; contains no logic of its own.
10 |     {
11 |         public bool Deskew { get; set; } // NOTE(review): presumably turns on skew correction of the input image - confirm in the consumer.
12 |         public bool PostProcessing { get; set; } // NOTE(review): presumably enables the text post-processing step - confirm in the consumer.
13 |         public bool RemoveLines { get; set; }
14 |         public bool RemoveLineBreaks { get; set; }
15 |         public bool CorrectLetterCases { get; set; }
16 |         public bool RemoveHyphens { get; set; }
17 |         public bool ReplaceHyphens { get; set; }
18 |         public bool DangAmbigsEnabled { get; set; } // NOTE(review): presumably gates use of the *.DangAmbigs.txt replacement rules - confirm.
19 |         public string DangAmbigsPath { get; set; } // NOTE(review): presumably the location of the DangAmbigs rule files; null until assigned - confirm expected form with callers.
20 |     }
21 | }
22 | 


--------------------------------------------------------------------------------
/Utilities/VietUtilities.cs:
--------------------------------------------------------------------------------
 1 | using System;
 2 | 
 3 | using System.Text;
 4 | using System.Text.RegularExpressions;
 5 | 
 6 | namespace Net.SourceForge.Vietpad.Utilities
 7 | {
 8 |     /// <summary>
 9 |     /// String helpers for Vietnamese text.
10 |     /// </summary>
11 |     class VietUtilities
12 |     {
13 |         //private static readonly ILog logger = LogFactory.CreateLogger(System.Reflection.MethodBase.GetCurrentMethod().DeclaringType);
14 | 
15 |         /// <summary>
16 |         /// Matches runs of characters in the Unicode "Combining Diacritical Marks" block.
17 |         /// Created once and shared so the pattern is not re-parsed on every call.
18 |         /// </summary>
19 |         private static readonly Regex CombiningMarks = new Regex("\\p{IsCombiningDiacriticalMarks}+", RegexOptions.Compiled);
20 | 
21 |         /// <summary>
22 |         /// Strips accents off words.
23 |         /// </summary>
24 |         /// <param name="accented">Text that may contain accented letters; may be null or empty.</param>
25 |         /// <returns>
26 |         /// The text decomposed to Unicode Form D with combining diacritical marks removed and
27 |         /// U+0111/U+0110 (d/D with stroke) replaced by plain d/D. A null or empty input is
28 |         /// returned unchanged.
29 |         /// </returns>
30 |         public static string StripDiacritics(string accented)
31 |         {
32 |             // Nothing to strip; also avoids a NullReferenceException on null input.
33 |             if (string.IsNullOrEmpty(accented))
34 |             {
35 |                 return accented;
36 |             }
37 | 
38 |             // Form D splits precomposed letters into a base letter followed by combining marks.
39 |             string strFormD = accented.Normalize(NormalizationForm.FormD);
40 | 
41 |             // The stroked d/D do not decompose under Form D, so they are mapped explicitly.
42 |             return CombiningMarks.Replace(strFormD, string.Empty).Replace('\u0111', 'd').Replace('\u0110', 'D');
43 |         }
44 |     }
45 | }


--------------------------------------------------------------------------------
/StatusForm.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.StatusForm"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         mc:Ignorable="d"
 8 |         Title="Status Form" Height="300" Width="400">
 9 |     <DockPanel HorizontalAlignment="Stretch" VerticalAlignment="Stretch" LastChildFill="True" >
10 |         <TextBox x:Name="textBox" HorizontalScrollBarVisibility="Auto" VerticalScrollBarVisibility="Auto" HorizontalAlignment="Stretch" TextWrapping="Wrap" VerticalAlignment="Stretch" />
11 |     </DockPanel>
12 | </Window>
13 | 


--------------------------------------------------------------------------------
/Data/ces.DangAmbigs.txt:
--------------------------------------------------------------------------------
 1 | # Plain replaces. Character "0" in the first column indicates a plain replace. Delimiter is <TAB> (\t) character.
 2 | 0	iii	m
 3 | 0	l<	k
 4 | 0	lx	h
 5 | 0	xn	m
 6 | 0	()	o
 7 | 0	a'	á
 8 | 0	e'	é
 9 | 0	y'	ý
10 | 0	d'	ď
11 | 0	t'	ť
12 | 0	7“	?“
13 | 0	7"	?"
14 | 0	f“	.“
15 | 0	f"	."
16 | 0	 & 	 a 
17 | 
18 | # Regular expression replaces. Character "1" in the first column indicates a regex replace. Delimiter is <TAB> (\t) character.
19 | # Correct common errors caused by OCR
20 | # 1 to l
21 | 1	(?<=\p{L}*)1(?=\p{L}+)		l
22 | 1	(?<=\p{L}+)1(?=\p{L}*)		l
23 | # ] to l
24 | 1	(?<=\p{L}*)\](?=\p{L}+)		l
25 | 1	(?<=\p{L}+)\](?=\p{L}*)		l
26 | # | to l
27 | 1	(?<=\p{L}*)\|(?=\p{L}+)		l
28 | 1	(?<=\p{L}+)\|(?=\p{L}*)		l
29 | # 0 to o
30 | 1	(?<=\p{L}*)0(?=\p{L}+)		o
31 | 1	(?<=\p{L}+)0(?=\p{L}*)		o
32 | 


--------------------------------------------------------------------------------
/Data/eng.DangAmbigs.txt:
--------------------------------------------------------------------------------
 1 | # Plain replaces. Character "0" in the first column indicates a plain replace. Delimiter is <TAB> (\t) character.
 2 | 0	iii	m
 3 | 0	l<	k
 4 | 0	lx	h
 5 | 0	xn	m
 6 | 
 7 | # Regular expression replaces. Character "1" in the first column indicates a regex replace. Delimiter is <TAB> (\t) character.
 8 | # Correct common errors caused by OCR
 9 | # 11 to n
10 | 1	\b11(?=\p{L}+\b)	n
11 | # 1 to l
12 | 1	\b1(?=\p{L}+\b)	l
13 | 1	(?<=\p{L}*)1(?=\p{L}+)		l
14 | 1	(?<=\p{L}+)1(?=\p{L}*)		l
15 | # ] to l
16 | 1	(?<=\p{L}*)\](?=\p{L}+)		l
17 | 1	(?<=\p{L}+)\](?=\p{L}*)		l
18 | # | to l
19 | 1	(?<=\p{L}*)\|(?=\p{L}+)		l
20 | 1	(?<=\p{L}+)\|(?=\p{L}*)		l
21 | # I to l
22 | 1	\bI(?![mn]+\b)	l
23 | # 0 to o
24 | 1	(?<=\b\p{L}*)0(?=\p{L}*\b)	o
25 | 1	(?<=\p{L}*)0(?=\p{L}+)		o
26 | 1	(?<=\p{L}+)0(?=\p{L}*)		o
27 | 


--------------------------------------------------------------------------------
/tessdata/configs/tess_configs:
--------------------------------------------------------------------------------
 1 | # This text file contains init-only control parameters to modify Tesseract engine's behaviour.
 2 | # https://code.google.com/p/tesseract-ocr/wiki/ControlParams
 3 | # http://www.sk-spell.sk.cx/tesseract-ocr-parameters-in-302-version
 4 | # Each key/value pair, delimited by spaces, takes one line. Comment lines start with # sign.
 5 | # Ex:
 6 | #debug_file /dev/null
 7 | #debug_file tesseract.log
 8 | # May be beneficial to disable system dictionaries for Vietnamese to improve accuracy
 9 | #load_system_dawg     F
10 | #load_freq_dawg       F
11 | #user_words_suffix    user-words
12 | #user_patterns_suffix user-patterns
13 | #language_model_penalty_non_dict_word 0.15
14 | #language_model_penalty_non_freq_dict_word 0.1
15 | #tessedit_char_whitelist 0123456789-.
16 | #tessedit_create_hocr 1
17 | #tessedit_pageseg_mode 1


--------------------------------------------------------------------------------
/HtmlHelpDialog.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.HtmlHelpDialog"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         mc:Ignorable="d"
 8 |         Title="VietOCR.NET Help" Height="400" Width="600">
 9 |     <DockPanel>
10 |         <StatusBar DockPanel.Dock="Bottom" >
11 |             <StatusBarItem>
12 |                 <TextBlock Name="lblURL" />
13 |             </StatusBarItem>
14 |         </StatusBar>
15 |         <WebBrowser x:Name="webBrowser" DockPanel.Dock="Top" Navigating="webBrowser_Navigating"/>
16 |     </DockPanel>
17 | </Window>
18 | 


--------------------------------------------------------------------------------
/Postprocessing/IPostProcessor.cs:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Copyright @ 2008 Quan Nguyen
 3 |  * 
 4 |  * Licensed under the Apache License, Version 2.0 (the "License");
 5 |  * you may not use this file except in compliance with the License.
 6 |  * You may obtain a copy of the License at
 7 |  *
 8 |  *  http://www.apache.org/licenses/LICENSE-2.0
 9 |  *
10 |  * Unless required by applicable law or agreed to in writing, software
11 |  * distributed under the License is distributed on an "AS IS" BASIS,
12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 |  * See the License for the specific language governing permissions and
14 |  * limitations under the License.
15 | */
16 | 
17 | namespace VietOCR.NET.Postprocessing
18 | {
    /// <summary>
    /// Contract implemented by the text post-processors in this namespace.
    /// </summary>
    public interface IPostProcessor
    {
        /// <summary>
        /// Post-processes the supplied text.
        /// </summary>
        /// <param name="text">The text to process.</param>
        /// <returns>The processed text.</returns>
        string PostProcess(string text);
    }
23 | }


--------------------------------------------------------------------------------
/Data/vie.DangAmbigs.txt:
--------------------------------------------------------------------------------
 1 | # Plain replaces. Character "0" in the first column indicates a plain replace. Delimiter is <TAB> (\t) character.
 2 | 0	tmg	úng
 3 | 0	rl	n
 4 | 0	rr	n
 5 | 0	êĩ-	ết
 6 | 0	âỳ	ấy
 7 | 0	oĩ	ơi
 8 | 0	ôỈ	ỡi
 9 | 0	u1I	ưn
10 | 0	q1I	qu
11 | 0	II	u
12 | 0	êf	ết
13 | 0	fâ	rầ
14 | 0	fê	iề
15 | 0	xiê 	về 
16 | 0	ýê	yề
17 | 0	lc	k
18 | 0	vđi	với
19 | 0	cũa	của
20 | 0	phãi	phải
21 | 0	—-	—
22 | 0	-—	—
23 | 0	––	—
24 | 0	Ð	Đ
25 | 0	âÍ	ấ
26 | 
27 | # Regular expression replaces. Character "1" in the first column indicates a regex replace. Delimiter is <TAB> (\t) character.
28 | 1	(?i)(?<=đ)ă\b	ã
29 | 1	(?i)(?<=[ch])ă\b	ả
30 | 1	(?i)ă(?![cmnpt])	à
31 | 1	(?i)ẵ(?=[cpt])	ắ
32 | 1	(?<=\b[Tt])m	rư
33 | 1	(?i)\bl(?=[rh])	t
34 | 1	(u|ll|r)(?=[gh])	n
35 | 1	(iii|ln|rn)	m
36 | 1	(?i)(?<=[qrgsv])ll	u
37 | 1	(?i)(?<=[cnpt])ll	h
38 | 1	(?i)[oe](?=h)	c
39 | 1	\Bđ	ớ


--------------------------------------------------------------------------------
/Controls/MoveThumb.cs:
--------------------------------------------------------------------------------
 1 | using System.Windows.Controls;
 2 | using System.Windows.Controls.Primitives;
 3 | 
 4 | namespace VietOCR.Controls
 5 | {
 6 |     public class MoveThumb : Thumb
 7 |     {
 8 |         public MoveThumb()
 9 |         {
10 |             DragDelta += new DragDeltaEventHandler(this.MoveThumb_DragDelta);
11 |         }
12 | 
13 |         private void MoveThumb_DragDelta(object sender, DragDeltaEventArgs e)
14 |         {
15 |             Control designerItem = this.DataContext as Control;
16 | 
17 |             if (designerItem != null)
18 |             {
19 |                 double left = Canvas.GetLeft(designerItem);
20 |                 double top = Canvas.GetTop(designerItem);
21 | 
22 |                 Canvas.SetLeft(designerItem, left + e.HorizontalChange);
23 |                 Canvas.SetTop(designerItem, top + e.VerticalChange);
24 |             }
25 |         }
26 |     }
27 | }
28 | 


--------------------------------------------------------------------------------
/Test/Utilities/PdfUtilitiesTests.cs:
--------------------------------------------------------------------------------
 1 | using Microsoft.VisualStudio.TestTools.UnitTesting;
 2 | using VietOCR.NET.Utilities;
 3 | using System;
 4 | using System.Collections.Generic;
 5 | using System.Linq;
 6 | using System.Text;
 7 | using System.Threading.Tasks;
 8 | 
 9 | namespace UnitTest
10 | {
11 |     [TestClass()]
12 |     public class PdfUtilitiesTests
13 |     {
14 |         [TestMethod()]
15 |         [Ignore]
16 |         public void ConvertPdf2TiffTest()
17 |         {
18 |            
19 |         }
20 | 
21 |         [TestMethod()]
22 |         [DeploymentItem("samples/vietsample1.pdf", "samples")]
23 |         public void GetPdfPageCountTest()
24 |         {
25 |             string inputPdfFile = "samples/vietsample1.pdf";
26 |             int expResult = 2;
27 |             int result = PdfUtilities.GetPdfPageCount(inputPdfFile);
28 |             Assert.AreEqual(expResult, result);
29 |         }
30 |     }
31 | }


--------------------------------------------------------------------------------
/Test/obj/Release/DesignTimeResolveAssemblyReferencesInput.cache:
--------------------------------------------------------------------------------
1 |    .winmd.dll.exe    4D:\Projects\github\VietOCRwpf\samples\vietsample.tif-D:\Projects\github\VietOCRwpf\packages.config       SC:\Program Files (x86)\Reference Assemblies\Microsoft\Framework\.NETFramework\v4.8\   Full                 {CandidateAssemblyFiles}PC:\Program Files\Common Files\microsoft shared\VSTT\17.0\UITestExtensionPackages{HintPathFromItem}{TargetFrameworkDirectory}B{Registry:Software\Microsoft\.NETFramework,v4.8,AssemblyFoldersEx}{RawFileName}/D:\Projects\github\VietOCRwpf\Test\bin\Release\     B{Registry:Software\Microsoft\.NETFramework,v4.8,AssemblyFoldersEx}XD:\Projects\github\VietOCRwpf\Test\obj\Release\DesignTimeResolveAssemblyReferences.cache   SC:\Program Files (x86)\Reference Assemblies\Microsoft\Framework\.NETFramework\v4.8\[C:\Program Files (x86)\Reference Assemblies\Microsoft\Framework\.NETFramework\v4.8\Facades\.NETFramework,Version=v4.8.NET Framework 4.8v4.8msil
2 | v4.0.30319         


--------------------------------------------------------------------------------
/Postprocessing/EngPP.cs:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Copyright @ 2008 Quan Nguyen
 3 |  * 
 4 |  * Licensed under the Apache License, Version 2.0 (the "License");
 5 |  * you may not use this file except in compliance with the License.
 6 |  * You may obtain a copy of the License at
 7 |  *
 8 |  *  http://www.apache.org/licenses/LICENSE-2.0
 9 |  *
10 |  * Unless required by applicable law or agreed to in writing, software
11 |  * distributed under the License is distributed on an "AS IS" BASIS,
12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 |  * See the License for the specific language governing permissions and
14 |  * limitations under the License.
15 | */
16 | using System;
17 | using System.Collections.Generic;
18 | using System.Text;
19 | 
20 | namespace VietOCR.NET.Postprocessing
21 | {
22 |     class EngPP : IPostProcessor
23 |     {
24 |         public string PostProcess(string text)
25 |         {
26 |             // no special processing for English
27 |             return text;
28 |         }
29 |     }
30 | }
31 | 


--------------------------------------------------------------------------------
/StatusForm.xaml.cs:
--------------------------------------------------------------------------------
 1 | using System;
 2 | using System.Collections.Generic;
 3 | using System.ComponentModel;
 4 | using System.Linq;
 5 | using System.Text;
 6 | using System.Threading.Tasks;
 7 | using System.Windows;
 8 | using System.Windows.Controls;
 9 | using System.Windows.Data;
10 | using System.Windows.Documents;
11 | using System.Windows.Input;
12 | using System.Windows.Media;
13 | using System.Windows.Media.Imaging;
14 | using System.Windows.Shapes;
15 | 
16 | namespace VietOCR
17 | {
18 |     /// <summary>
19 |     /// Interaction logic for StatusForm.xaml
20 |     /// </summary>
21 |     public partial class StatusForm : Window
22 |     {
23 |         public TextBox TextBox
24 |         {
25 |             get { return textBox; }
26 |         }
27 | 
28 |         public StatusForm()
29 |         {
30 |             InitializeComponent();
31 |         }
32 | 
33 |         protected override void OnClosing(CancelEventArgs e)
34 |         {
35 |             base.OnClosing(e);
36 | 
37 |             e.Cancel = true;
38 |             this.Visibility = Visibility.Hidden;
39 |         }
40 |     }
41 | }
42 | 


--------------------------------------------------------------------------------
/Properties/Settings.Designer.cs:
--------------------------------------------------------------------------------
 1 | //------------------------------------------------------------------------------
 2 | // <auto-generated>
 3 | //     This code was generated by a tool.
 4 | //     Runtime Version:4.0.30319.42000
 5 | //
 6 | //     Changes to this file may cause incorrect behavior and will be lost if
 7 | //     the code is regenerated.
 8 | // </auto-generated>
 9 | //------------------------------------------------------------------------------
10 | 
11 | namespace VietOCR.Properties {
12 |     
13 |     
    // Settings class emitted by the settings designer (see the auto-generated header above);
    // manual edits are lost when the file is regenerated.
    [global::System.Runtime.CompilerServices.CompilerGeneratedAttribute()]
    [global::System.CodeDom.Compiler.GeneratedCodeAttribute("Microsoft.VisualStudio.Editors.SettingsDesigner.SettingsSingleFileGenerator", "16.3.0.0")]
    internal sealed partial class Settings : global::System.Configuration.ApplicationSettingsBase {
        
        // Single shared instance, wrapped via ApplicationSettingsBase.Synchronized.
        private static Settings defaultInstance = ((Settings)(global::System.Configuration.ApplicationSettingsBase.Synchronized(new Settings())));
        
        // Accessor for the shared settings instance.
        public static Settings Default {
            get {
                return defaultInstance;
            }
        }
    }
26 | }
27 | 


--------------------------------------------------------------------------------
/Test/app.config:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <configuration>
 3 |   <runtime>
 4 |     <assemblyBinding xmlns="urn:schemas-microsoft-com:asm.v1">
 5 |       <dependentAssembly>
 6 |         <assemblyIdentity name="System.Runtime.CompilerServices.Unsafe" publicKeyToken="b03f5f7f11d50a3a" culture="neutral" />
 7 |         <bindingRedirect oldVersion="0.0.0.0-6.0.3.0" newVersion="6.0.3.0" />
 8 |       </dependentAssembly>
 9 |       <dependentAssembly>
10 |         <assemblyIdentity name="System.Memory" publicKeyToken="cc7b13ffcd2ddd51" culture="neutral" />
11 |         <bindingRedirect oldVersion="0.0.0.0-4.0.5.0" newVersion="4.0.5.0" />
12 |       </dependentAssembly>
13 |       <dependentAssembly>
14 |         <assemblyIdentity name="System.Collections.Immutable" publicKeyToken="b03f5f7f11d50a3a" culture="neutral" />
15 |         <bindingRedirect oldVersion="0.0.0.0-8.0.0.0" newVersion="8.0.0.0" />
16 |       </dependentAssembly>
17 |       <dependentAssembly>
18 |         <assemblyIdentity name="System.Buffers" publicKeyToken="cc7b13ffcd2ddd51" culture="neutral" />
19 |         <bindingRedirect oldVersion="0.0.0.0-4.0.5.0" newVersion="4.0.5.0" />
20 |       </dependentAssembly>
21 |     </assemblyBinding>
22 |   </runtime>
23 | </configuration>


--------------------------------------------------------------------------------
/SplitPdfArgs.cs:
--------------------------------------------------------------------------------
 1 | using System;
 2 | using System.Collections.Generic;
 3 | using System.Text;
 4 | 
 5 | namespace VietOCR
 6 | {
 7 |     class SplitPdfArgs
 8 |     {
 9 |         string inputFilename;
10 | 
11 |         public string InputFilename
12 |         {
13 |             get { return inputFilename; }
14 |             set { inputFilename = value; }
15 |         }
16 |         string outputFilename;
17 | 
18 |         public string OutputFilename
19 |         {
20 |             get { return outputFilename; }
21 |             set { outputFilename = value; }
22 |         }
23 | 
24 |         string fromPage;
25 | 
26 |         public string FromPage
27 |         {
28 |             get { return fromPage; }
29 |             set { fromPage = value; }
30 |         }
31 |         string toPage;
32 | 
33 |         public string ToPage
34 |         {
35 |             get { return toPage; }
36 |             set { toPage = value; }
37 |         }
38 |         string numOfPages;
39 | 
40 |         public string NumOfPages
41 |         {
42 |             get { return numOfPages; }
43 |             set { numOfPages = value; }
44 |         }
45 | 
46 |         bool pages;
47 |         public bool Pages
48 |         {
49 |             get { return pages; }
50 |             set { pages = value; }
51 |         }
52 |     }
53 | }
54 | 


--------------------------------------------------------------------------------
/Utilities/FixedSizeStack.cs:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Copyright @ 2013 Quan Nguyen
 3 |  * 
 4 |  * Licensed under the Apache License, Version 2.0 (the "License");
 5 |  * you may not use this file except in compliance with the License.
 6 |  * You may obtain a copy of the License at
 7 |  *
 8 |  *  http://www.apache.org/licenses/LICENSE-2.0
 9 |  *
10 |  * Unless required by applicable law or agreed to in writing, software
11 |  * distributed under the License is distributed on an "AS IS" BASIS,
12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 |  * See the License for the specific language governing permissions and
14 |  * limitations under the License.
15 | */
16 | using System;
17 | using System.Collections.Generic;
18 | using System.Text;
19 | 
20 | namespace VietOCR.NET.Utilities
21 | {
22 |     public class FixedSizeStack<T> : LinkedList<T>
23 |     {
24 |         private int limit;
25 | 
26 |         public FixedSizeStack(int limit)
27 |             : base()
28 |         {
29 |             this.limit = limit;
30 |         }
31 | 
32 |         public T Pop()
33 |         {
34 |             T obj = base.First.Value;
35 |             base.RemoveFirst();
36 |             return obj;
37 |         }
38 | 
39 |         public void Push(T obj)
40 |         {
41 |             base.AddFirst(obj);
42 |             if (this.Count > limit)
43 |             {
44 |                 base.RemoveLast();
45 |             }
46 |         }
47 |     }
48 | }
49 | 


--------------------------------------------------------------------------------
/SliderDialog.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.SliderDialog"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         xmlns:resx="clr-namespace:VietOCR"
 8 |         mc:Ignorable="d"
 9 |         Title="{x:Static resx:SliderDialog.this_Title}" Height="170" Width="260" ResizeMode="NoResize">
10 |     <Border Padding="20,0,20,20">
11 |         <StackPanel HorizontalAlignment="Stretch">
12 |             <Label x:Name="label1" Content="{x:Static resx:SliderDialog.label1_Text}" HorizontalAlignment="Left" Margin="20,5" />
13 |             <Slider x:Name="slider" HorizontalAlignment="Center" Width="170" TickPlacement="BottomRight" ValueChanged="slider_ValueChanged" TickFrequency="20" LargeChange="10" Maximum="100" Minimum="-100" SmallChange="5"/>
14 |             <StackPanel Orientation="Horizontal" HorizontalAlignment="Center" Margin="0,20,0,0">
15 |                 <Button x:Name="buttonApply" Content="{x:Static resx:SliderDialog.buttonApply_Text}" Width="75" IsDefault="True" Click="buttonApply_Click"/>
16 |                 <Button x:Name="buttonCancel" Content="{x:Static resx:SliderDialog.buttonCancel_Text}" Width="75" IsCancel="True" Margin="10,0,0,0" Click="buttonCancel_Click"/>
17 |             </StackPanel>
18 |         </StackPanel>
19 |     </Border>
20 | </Window>
21 | 


--------------------------------------------------------------------------------
/ChangeCaseDialog.xaml.cs:
--------------------------------------------------------------------------------
 1 | using System.Windows;
 2 | using System.Windows.Controls;
 3 | 
 4 | namespace VietOCR
 5 | {
 6 |     /// <summary>
 7 |     /// Interaction logic for ChangeCaseDialog.xaml
 8 |     /// </summary>
 9 |     public partial class ChangeCaseDialog : Window
10 |     {
11 |         public event RoutedEventHandler CloseDlg;
12 |         public event RoutedEventHandler ChangeCase;
13 | 
14 |         public string SelectedCase { set; get; }
15 | 
16 |         public ChangeCaseDialog()
17 |         {
18 |             InitializeComponent();
19 |         }
20 | 
21 |         private void Window_Loaded(object sender, RoutedEventArgs e)
22 |         {
23 |             foreach (RadioButton rb in this.radioButtonPanel.Children)
24 |             {
25 |                 if (rb.Tag.ToString() == SelectedCase)
26 |                 {
27 |                     // Select Case last saved
28 |                     rb.IsChecked = true;
29 |                     break;
30 |                 }
31 |             }
32 |         }
33 | 
34 |         private void buttonChange_Click(object sender, RoutedEventArgs e)
35 |         {
36 |             foreach (RadioButton rb in this.radioButtonPanel.Children)
37 |             {
38 |                 if (rb.IsChecked.Value)
39 |                 {
40 |                     SelectedCase = rb.Tag.ToString();
41 |                     break;
42 |                 }
43 |             }
44 | 
45 |             ChangeCase?.Invoke(this, e);
46 |         }
47 | 
48 |         private void buttonClose_Click(object sender, RoutedEventArgs e)
49 |         {
50 |             CloseDlg?.Invoke(this, e);
51 | 
52 |             this.Close();
53 |         }
54 |     }
55 | }
56 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | ## VietOCRwpf
 2 | 
 3 | A .NET GUI frontend for Tesseract OCR engine written using WPF. Supports optical character recognition for Vietnamese and other languages supported by Tesseract.
 4 | 
 5 | VietOCRwpf is released and distributed under the [Apache License, v2.0](http://www.apache.org/licenses/LICENSE-2.0).
 6 | 
 7 | ## Features
 8 | 
 9 | * PDF, TIFF, JPEG, GIF, PNG, BMP image formats
10 | * Multi-page TIFF images
11 | * Screenshots
12 | * Selection box
13 | * File drag-and-drop
14 | * Paste image from clipboard
15 | * Postprocessing for Vietnamese to boost accuracy rate
16 | * Vietnamese input methods
17 | * Localized user interface for many languages ([Localization project](https://www.transifex.com/projects/p/vietocr/))
18 | * Integrated scanning support
19 | * Watch folder monitor for support of batch processing
20 | * Custom text replacement in postprocessing
21 | * Spellcheck with Hunspell
22 | * Support for downloading and installing language data packs and appropriate spell dictionaries
23 | 
24 | ## Instructions
25 | 
26 | The program can run as either a Windows (GUI) application or a console application.
27 | 
28 | Command-line usage:
29 | ```
30 | vietocr imagefile outputfile [-l lang] [--psm pagesegmode] [text|hocr|pdf|pdf_textonly|unlv|box|alto|page|tsv|lstmbox|wordstrbox] [postprocessing] [correctlettercases] [deskew] [removelines] [removelinebreaks]
31 | ```
32 | 
33 | ## Dependencies
34 | * [Microsoft .NET Framework 4.8 Redistributable](https://dotnet.microsoft.com/download/dotnet-framework/net48)
35 | * [Microsoft Visual C++ 2022 Redistributable Package](https://visualstudio.microsoft.com/downloads/)
36 | * [GPL Ghostscript](http://www.ghostscript.com)


--------------------------------------------------------------------------------
/Postprocessing/ProcessorFactory.cs:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Copyright @ 2008 Quan Nguyen
 3 |  * 
 4 |  * Licensed under the Apache License, Version 2.0 (the "License");
 5 |  * you may not use this file except in compliance with the License.
 6 |  * You may obtain a copy of the License at
 7 |  *
 8 |  *  http://www.apache.org/licenses/LICENSE-2.0
 9 |  *
10 |  * Unless required by applicable law or agreed to in writing, software
11 |  * distributed under the License is distributed on an "AS IS" BASIS,
12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 |  * See the License for the specific language governing permissions and
14 |  * limitations under the License.
15 | */
16 | namespace VietOCR.NET.Postprocessing
17 | {
18 |     using System;
19 | 
    /// <summary>
    /// Three-letter language codes accepted by <c>ProcessorFactory.createProcessor</c>.
    /// </summary>
    public enum ISO639
    {
        ben, bul, cat, ces, cop, dan, deu, ell, eng, eus, fin, fra, hun, ind, ita, kan, khm, lav, lit, mal, nld, nor, pol, por, ron, rus, slk, slv, spa, srp, swe, tam, tel, tgl, tur, ukr, vie
    }    
24 |     
25 |     public class ProcessorFactory
26 |     {
27 |         // ISO369-3 codes: http://www.sil.org/iso639-3/codes.asp
28 | 
29 |         public static IPostProcessor createProcessor(ISO639 code)
30 |         {
31 |             IPostProcessor processor;
32 | 
33 |             switch (code)
34 |             {
35 |                 case ISO639.eng:
36 |                     processor = new EngPP();
37 |                     break;
38 |                 case ISO639.vie:
39 |                     processor = new ViePP();
40 |                     break;
41 |                 default:
42 |                     processor = new EngPP();
43 |                     break;
44 |                     //throw new Exception(code.ToString());
45 |             }
46 | 
47 |             return processor;
48 |         }
49 |     }
50 | }
51 | 


--------------------------------------------------------------------------------
/Test/packages.config:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <packages>
 3 |   <package id="Microsoft.ApplicationInsights" version="2.23.0" targetFramework="net48" />
 4 |   <package id="Microsoft.Testing.Extensions.Telemetry" version="1.8.4" targetFramework="net48" />
 5 |   <package id="Microsoft.Testing.Extensions.TrxReport.Abstractions" version="1.8.4" targetFramework="net48" />
 6 |   <package id="Microsoft.Testing.Extensions.VSTestBridge" version="1.8.4" targetFramework="net48" />
 7 |   <package id="Microsoft.Testing.Platform" version="1.8.4" targetFramework="net48" />
 8 |   <package id="Microsoft.Testing.Platform.MSBuild" version="1.8.4" targetFramework="net48" />
 9 |   <package id="Microsoft.TestPlatform.AdapterUtilities" version="17.14.1" targetFramework="net48" />
10 |   <package id="Microsoft.TestPlatform.ObjectModel" version="17.14.1" targetFramework="net48" />
11 |   <package id="MSTest.Analyzers" version="3.10.4" targetFramework="net48" developmentDependency="true" />
12 |   <package id="MSTest.TestAdapter" version="3.10.4" targetFramework="net48" />
13 |   <package id="MSTest.TestFramework" version="3.10.4" targetFramework="net48" />
14 |   <package id="System.Buffers" version="4.6.1" targetFramework="net48" />
15 |   <package id="System.Collections.Immutable" version="8.0.0" targetFramework="net48" />
16 |   <package id="System.Diagnostics.DiagnosticSource" version="5.0.0" targetFramework="net48" />
17 |   <package id="System.Memory" version="4.6.3" targetFramework="net48" />
18 |   <package id="System.Numerics.Vectors" version="4.6.1" targetFramework="net48" />
19 |   <package id="System.Reflection.Metadata" version="8.0.0" targetFramework="net48" />
20 |   <package id="System.Runtime.CompilerServices.Unsafe" version="6.1.2" targetFramework="net48" />
21 |   <package id="System.Threading.Tasks.Extensions" version="4.6.3" targetFramework="net48" />
22 | </packages>


--------------------------------------------------------------------------------
/HtmlHelpDialog.xaml.cs:
--------------------------------------------------------------------------------
 1 | using System;
 2 | using System.Collections.Generic;
 3 | using System.IO;
 4 | using System.Linq;
 5 | using System.Text;
 6 | using System.Threading.Tasks;
 7 | using System.Windows;
 8 | using System.Windows.Controls;
 9 | using System.Windows.Data;
10 | using System.Windows.Documents;
11 | using System.Windows.Input;
12 | using System.Windows.Media;
13 | using System.Windows.Media.Imaging;
14 | using System.Windows.Shapes;
15 | 
16 | namespace VietOCR
17 | {
18 |     /// <summary>
19 |     /// Interaction logic for HtmlHelpForm.xaml
20 |     /// </summary>
21 |     public partial class HtmlHelpDialog : Window
22 |     {
23 |         const string ABOUT = "about:";
24 | 
25 |         public HtmlHelpDialog(string helpFileName, string title)
26 |         {
27 |             InitializeComponent();
28 | 
29 |             this.Title = title;
30 | 
31 |             // Load HTML document as a stream
32 |             Uri uri = new Uri(@"pack://application:,,,/" + helpFileName, UriKind.Absolute);
33 |             Stream source = Application.GetResourceStream(uri).Stream;
34 | 
35 |             // Navigate to HTML document stream
36 |             this.webBrowser.NavigateToStream(source);
37 |         }
38 | 
39 |         private void webBrowser_Navigating(object sender, System.Windows.Navigation.NavigatingCancelEventArgs e)
40 |         {
41 |             if (e.Uri == null)
42 |             {
43 |                 return;
44 |             }
45 |             string url = e.Uri.ToString();
46 | 
47 |             if (url.StartsWith(ABOUT) && url != "about:blank")
48 |             {
49 |                 this.webBrowser.NavigateToStream(Application.GetResourceStream(e.Uri).Stream);
50 |             }
51 |             else if (url.StartsWith("http"))
52 |             {
53 |                 // Display external links using default webbrowser
54 |                 e.Cancel = true;
55 |                 System.Diagnostics.Process.Start(url);
56 |             }
57 |         }
58 |     }
59 | }
60 | 


--------------------------------------------------------------------------------
/Utilities/ImageConverter.cs:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Created by Rajan Tawate.
 3 |  * User: Owner
 4 |  * Date: 9/3/2006
 5 |  * Time: 8:00 PM
 6 |  */
 7 | 
 8 | using System;
 9 | using System.Drawing;
10 | using System.IO;
11 | using System.Collections;
12 | using System.Windows.Media.Imaging;
13 | 
/// <summary>
/// Conversion helpers between <see cref="System.Drawing.Image"/>, raw byte arrays and
/// WPF <see cref="BitmapSource"/>/<see cref="BitmapImage"/> objects.
/// </summary>
public static class ImageConverter
{
    /// <summary>
    /// Encodes an image as BMP and returns the encoded bytes.
    /// </summary>
    /// <param name="imageIn">The image to encode.</param>
    /// <returns>The BMP-encoded image data.</returns>
    public static byte[] imageToByteArray(System.Drawing.Image imageIn)
    {
        // The stream is only a scratch buffer; release it once the bytes are copied out.
        using (MemoryStream ms = new MemoryStream())
        {
            imageIn.Save(ms, System.Drawing.Imaging.ImageFormat.Bmp);
            return ms.ToArray();
        }
    }

    /// <summary>
    /// Decodes an image from encoded image bytes.
    /// </summary>
    /// <param name="byteArrayIn">Encoded image data.</param>
    /// <returns>The decoded image.</returns>
    public static Image byteArrayToImage(byte[] byteArrayIn)
    {
        // Deliberately NOT disposed: Image.FromStream requires the stream to stay
        // open for the lifetime of the returned Image.
        MemoryStream ms = new MemoryStream(byteArrayIn);
        return Image.FromStream(ms);
    }

    /// <summary>
    /// Converts a GDI+ image into a WPF <see cref="BitmapImage"/> by round-tripping
    /// it through an in-memory PNG.
    /// </summary>
    /// <param name="bitmap">The source image.</param>
    /// <returns>A bitmap image loaded from the PNG data.</returns>
    public static BitmapImage BitmapToImageSource(System.Drawing.Image bitmap)
    {
        using (MemoryStream ms = new MemoryStream())
        {
            bitmap.Save(ms, System.Drawing.Imaging.ImageFormat.Png);
            ms.Position = 0;

            BitmapImage bitmapImage = new BitmapImage();
            bitmapImage.BeginInit();
            bitmapImage.StreamSource = ms;
            // OnLoad caching is requested so the stream can be disposed on return.
            bitmapImage.CacheOption = BitmapCacheOption.OnLoad;
            bitmapImage.EndInit();

            return bitmapImage;
        }
    }

    /// <summary>
    /// Converts a WPF <see cref="BitmapSource"/> into a GDI+ <see cref="Bitmap"/> by
    /// round-tripping it through an in-memory PNG.
    /// </summary>
    /// <param name="bitmapSource">The source bitmap.</param>
    /// <returns>A new bitmap copied from the decoded PNG.</returns>
    public static Bitmap ImageSourceToBitmap(BitmapSource bitmapSource)
    {
        using (MemoryStream ms = new MemoryStream())
        {
            BitmapEncoder enc = new PngBitmapEncoder();
            enc.Frames.Add(BitmapFrame.Create(bitmapSource));
            enc.Save(ms);

            // Copy into a second Bitmap so the result does not depend on the
            // stream, which is disposed when this method returns.
            using (Bitmap tempBitmap = new Bitmap(ms))
            {
                return new Bitmap(tempBitmap);
            }
        }
    }
}
65 | 
66 | 


--------------------------------------------------------------------------------
/Data/ISO639-1.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <properties>
 3 |   <comment>ISO 639-1 Standard</comment>
 4 |   <entry key="ban">bn_BD</entry>
 5 |   <entry key="ben">bn_IN</entry>
 6 |   <entry key="bih">bh_IN</entry>
 7 |   <entry key="bul">bg_BG</entry>
 8 |   <entry key="cat">ca_ES</entry>
 9 |   <entry key="ces">cs_CZ</entry>
10 |   <entry key="chi-sim">zh_CN</entry>
11 |   <entry key="chi-tra">zh_TW</entry>
12 |   <entry key="cop">cop_EG</entry>
13 |   <entry key="dan">da_DK</entry>
14 |   <entry key="deu">de_DE</entry>
15 |   <entry key="deu-f">de_DE_f</entry>
16 |   <entry key="ell">el_GR</entry>
17 |   <entry key="eng">en_US</entry>
18 |   <entry key="eus">eu_ES</entry>
19 |   <entry key="fin">fi_FI</entry>
20 |   <entry key="fra">fr_FR</entry>
21 |   <entry key="guj">gu_IN</entry>
22 |   <entry key="heb">iw_IL</entry>    
23 |   <entry key="hin">hi_IN</entry>
24 |   <entry key="hun">hu_HU</entry>
25 |   <entry key="ind">id_ID</entry>
26 |   <entry key="ita">it_IT</entry>
27 |   <entry key="jpn">ja_JP</entry>
28 |   <entry key="kan">kn_IN</entry>
29 |   <entry key="khm">km_KH</entry>
30 |   <entry key="kor">ko_KR</entry>
31 |   <entry key="lav">lv_LV</entry>
32 |   <entry key="lit">lt_LT</entry>
33 |   <entry key="mal">ml_IN</entry>
34 |   <entry key="mar">mr_IN</entry>
35 |   <entry key="nld">nl_NL</entry>
36 |   <entry key="nor">no_NO</entry>
37 |   <entry key="ori">or_IN</entry>
38 |   <entry key="pan">pa_IN</entry>
39 |   <entry key="pol">pl_PL</entry>
40 |   <entry key="por">pt_BR</entry>
41 |   <entry key="ron">ro_RO</entry>
42 |   <entry key="rus">ru_RU</entry>
43 |   <entry key="san">sa_IN</entry>
44 |   <entry key="slk">sk_SK</entry>
45 |   <entry key="slv">sl_SI</entry>
46 |   <entry key="spa">es_ES</entry>
47 |   <entry key="srp">sr_YU</entry>
48 |   <entry key="swe">sv_SE</entry>
49 |   <entry key="tam">ta_IN</entry>
50 |   <entry key="tel">te_IN</entry>
51 |   <entry key="tgl">tl_PH</entry>
52 |   <entry key="tha">th_TH</entry>
53 |   <entry key="tur">tr_TR</entry>
54 |   <entry key="ukr">uk_UA</entry>
55 |   <entry key="vie">vi_VN</entry>
56 | </properties>


--------------------------------------------------------------------------------
/ChangeCaseDialog.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.ChangeCaseDialog"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         xmlns:resx="clr-namespace:VietOCR"
 8 |         mc:Ignorable="d"
 9 |         Title="{x:Static resx:ChangeCaseDialog.this_Title}" Height="200" Width="240" Loaded="Window_Loaded" ResizeMode="NoResize"
10 |         WindowStartupLocation="CenterOwner">
11 |     <Grid>
12 |         <StackPanel x:Name="radioButtonPanel" Margin="20,10,20,0">
13 |             <StackPanel.Resources>
14 |                 <Style TargetType="{x:Type RadioButton}">
15 |                     <Setter Property="Margin" Value="0,0,0,12"/>
16 |                 </Style>
17 |             </StackPanel.Resources>
18 |             <RadioButton x:Name="radioButton1" Content="{x:Static resx:ChangeCaseDialog.radioButton1_Text}" Tag="Sentence_case" />
19 |             <RadioButton x:Name="radioButton2" Content="{x:Static resx:ChangeCaseDialog.radioButton2_Text}" Tag="lowercase" />
20 |             <RadioButton x:Name="radioButton3" Content="{x:Static resx:ChangeCaseDialog.radioButton3_Text}" Tag="UPPERCASE" />
21 |             <RadioButton x:Name="radioButton4" Content="{x:Static resx:ChangeCaseDialog.radioButton4_Text}" Tag="Title_Case" Margin="0" />
22 |         </StackPanel>
23 |         <StackPanel Orientation="Horizontal" HorizontalAlignment="Center" VerticalAlignment="Bottom" Margin="0 20">
24 |             <Button x:Name="buttonChange" Content="{x:Static resx:ChangeCaseDialog.buttonChange_Text}" VerticalAlignment="Bottom" Width="75" Click="buttonChange_Click"/>
25 |             <Button x:Name="buttonClose" Content="{x:Static resx:ChangeCaseDialog.buttonClose_Text}" Margin="10,0,0,0" VerticalAlignment="Bottom" Width="75" Click="buttonClose_Click"/>
26 |         </StackPanel>
27 |     </Grid>
28 | </Window>
29 | 


--------------------------------------------------------------------------------
/DownloadDialog.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.DownloadDialog"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         xmlns:resx="clr-namespace:VietOCR"
 8 |         mc:Ignorable="d"
 9 |         Title="{x:Static resx:DownloadDialog.this_Title}" Height="248" Width="330" Loaded="Window_Loaded" ResizeMode="NoResize" WindowStartupLocation="CenterOwner">
10 |     <DockPanel>
11 |         <StatusBar DockPanel.Dock="Bottom" Height="24">
12 |             <StatusBarItem>
13 |                 <Label x:Name="toolStripStatusLabel1" Padding="0"/>
14 |             </StatusBarItem>
15 |             <StatusBarItem>
16 |                 <ProgressBar x:Name="toolStripProgressBar1" Height="14" Width="150" Visibility="Hidden"/>
17 |             </StatusBarItem>
18 |         </StatusBar>
19 |         <GroupBox x:Name="groupBox1" Header="{x:Static resx:DownloadDialog.groupBox1_Text}" DockPanel.Dock="Left" VerticalAlignment="Top" HorizontalAlignment="Left" Margin="10,5,0,0" Padding="2" Width="190" Height="172">
20 |             <ListBox x:Name="listBox" VerticalAlignment="Stretch" HorizontalAlignment="Stretch"  SelectionChanged="listBox_SelectionChanged" SelectionMode="Multiple"/>
21 |         </GroupBox>
22 |         <Border Padding="16,20,16,15">
23 |             <StackPanel DockPanel.Dock="Right" >
24 |                 <Button x:Name="buttonDownload" Content="{x:Static resx:DownloadDialog.buttonDownload_Text}"  Click="buttonDownload_Click"/>
25 |                 <Button x:Name="buttonCancel" Content="{x:Static resx:DownloadDialog.buttonCancel_Text}" Click="buttonCancel_Click" Margin="0, 5, 0, 20"/>
26 |                 <Button x:Name="buttonClose" Content="{x:Static resx:DownloadDialog.buttonClose_Text}"  Click="buttonClose_Click"/>
27 |             </StackPanel>
28 |         </Border>
29 |     </DockPanel>
30 | </Window>
31 | 


--------------------------------------------------------------------------------
/WIA/WiaOperationException.cs:
--------------------------------------------------------------------------------
 1 | //http://geekswithblogs.net/tonyt/archive/2006/07/29/86608.aspx
 2 | 
 3 | using System;
 4 | using System.Collections.Generic;
 5 | using System.Text;
 6 | using System.Runtime.InteropServices;
 7 | 
 8 | namespace VietOCR.NET.WIA
 9 | {
10 |     /// <summary>
11 |     /// Exception that carries a <see cref="WiaScannerError"/> code alongside
12 |     /// the usual message and inner exception.
13 |     /// </summary>
14 |     [Serializable]
15 |     public class WiaOperationException : Exception
16 |     {
17 |         // Key under which the error code is stored in the serialization data.
18 |         private const string ErrorCodeKey = "ErrorCode";
19 | 
20 |         private WiaScannerError _errorCode;
21 | 
22 |         /// <summary>Creates the exception with an error code and no message.</summary>
23 |         public WiaOperationException(WiaScannerError errorCode)
24 |             : base()
25 |         {
26 |             ErrorCode = errorCode;
27 |         }
28 | 
29 |         /// <summary>Creates the exception with a message and an error code.</summary>
30 |         public WiaOperationException(string message, WiaScannerError errorCode)
31 |             : base(message)
32 |         {
33 |             ErrorCode = errorCode;
34 |         }
35 | 
36 |         /// <summary>
37 |         /// Creates the exception from an inner exception. When the inner exception
38 |         /// is a <see cref="COMException"/>, its ErrorCode becomes the error code;
39 |         /// otherwise the error code keeps its default value.
40 |         /// </summary>
41 |         public WiaOperationException(string message, Exception innerException)
42 |             : base(message, innerException)
43 |         {
44 |             COMException comException = innerException as COMException;
45 | 
46 |             if (comException != null)
47 |             {
48 |                 // COMException.ErrorCode is a signed int while the enum is uint-backed;
49 |                 // unchecked keeps the bit pattern even when compiled with overflow checks.
50 |                 ErrorCode = unchecked((WiaScannerError)comException.ErrorCode);
51 |             }
52 |         }
53 | 
54 |         /// <summary>Creates the exception with a message, an inner exception and an explicit error code.</summary>
55 |         public WiaOperationException(string message, Exception innerException, WiaScannerError errorCode)
56 |             : base(message, innerException)
57 |         {
58 |             ErrorCode = errorCode;
59 |         }
60 | 
61 |         /// <summary>
62 |         /// Deserialization constructor: restores the error code that
63 |         /// <see cref="GetObjectData"/> stored.
64 |         /// </summary>
65 |         public WiaOperationException(System.Runtime.Serialization.SerializationInfo info,
66 |              System.Runtime.Serialization.StreamingContext context)
67 |             : base(info, context)
68 |         {
69 |             // This constructor must READ the value; it is written as a UInt32
70 |             // by GetObjectData below.
71 |             ErrorCode = (WiaScannerError)info.GetUInt32(ErrorCodeKey);
72 |         }
73 | 
74 |         /// <summary>Error code associated with this exception.</summary>
75 |         public WiaScannerError ErrorCode
76 |         {
77 |             get { return _errorCode; }
78 |             protected set { _errorCode = value; }
79 |         }
80 | 
81 |         /// <summary>
82 |         /// Serializes the exception: writes the base exception data, then adds the
83 |         /// error code as a UInt32.
84 |         /// </summary>
85 |         public override void GetObjectData(System.Runtime.Serialization.SerializationInfo info,
86 |              System.Runtime.Serialization.StreamingContext context)
87 |         {
88 |             base.GetObjectData(info, context);
89 |             info.AddValue(ErrorCodeKey, (uint)_errorCode);
90 |         }
91 |     }
92 | }
93 | 


--------------------------------------------------------------------------------
/Test/.vs/VietOCRTests.csproj.dtbcache.json:
--------------------------------------------------------------------------------
1 | {"RootPath":"D:\\Projects\\github\\VietOCRTests","ProjectFileName":"VietOCRTests.csproj","Configuration":"Release|AnyCPU","FrameworkPath":"","Sources":[{"SourceFile":"ConsoleAppTests.cs"},{"SourceFile":"Properties\\AssemblyInfo.cs"},{"SourceFile":"Utilities\\PdfUtilitiesTests.cs"},{"SourceFile":"obj\\Release\\.NETFramework,Version=v4.8.AssemblyAttributes.cs"}],"References":[{"Reference":"D:\\Projects\\github\\VietOCRwpf\\packages\\MSTest.TestFramework.2.2.10\\lib\\net45\\Microsoft.VisualStudio.TestPlatform.TestFramework.dll","ResolvedFrom":"","OriginalItemSpec":"","Name":"","EmbedInteropTypes":false,"CopyLocal":false,"IsProjectReference":false,"ProjectPath":""},{"Reference":"D:\\Projects\\github\\VietOCRwpf\\packages\\MSTest.TestFramework.2.2.10\\lib\\net45\\Microsoft.VisualStudio.TestPlatform.TestFramework.Extensions.dll","ResolvedFrom":"","OriginalItemSpec":"","Name":"","EmbedInteropTypes":false,"CopyLocal":false,"IsProjectReference":false,"ProjectPath":""},{"Reference":"C:\\Program Files (x86)\\Reference Assemblies\\Microsoft\\Framework\\.NETFramework\\v4.8\\mscorlib.dll","ResolvedFrom":"","OriginalItemSpec":"","Name":"","EmbedInteropTypes":false,"CopyLocal":false,"IsProjectReference":false,"ProjectPath":""},{"Reference":"C:\\Program Files (x86)\\Reference Assemblies\\Microsoft\\Framework\\.NETFramework\\v4.8\\System.Core.dll","ResolvedFrom":"","OriginalItemSpec":"","Name":"","EmbedInteropTypes":false,"CopyLocal":false,"IsProjectReference":false,"ProjectPath":""},{"Reference":"C:\\Program Files (x86)\\Reference 
Assemblies\\Microsoft\\Framework\\.NETFramework\\v4.8\\System.dll","ResolvedFrom":"","OriginalItemSpec":"","Name":"","EmbedInteropTypes":false,"CopyLocal":false,"IsProjectReference":false,"ProjectPath":""},{"Reference":"D:\\Projects\\github\\VietOCRwpf\\bin\\Release\\VietOCR.exe","ResolvedFrom":"","OriginalItemSpec":"","Name":"","EmbedInteropTypes":false,"CopyLocal":false,"IsProjectReference":true,"ProjectPath":""}],"Analyzers":[],"Outputs":[{"OutputItemFullPath":"D:\\Projects\\github\\VietOCRTests\\bin\\Release\\VietOCRTests.dll","OutputItemRelativePath":"VietOCRTests.dll"},{"OutputItemFullPath":"D:\\Projects\\github\\VietOCRTests\\bin\\Release\\VietOCRTests.pdb","OutputItemRelativePath":"VietOCRTests.pdb"}],"CopyToOutputEntries":[]}


--------------------------------------------------------------------------------
/VietOCR.sln:
--------------------------------------------------------------------------------
 1 | 
 2 | Microsoft Visual Studio Solution File, Format Version 12.00
 3 | # Visual Studio Version 17
 4 | VisualStudioVersion = 17.0.31912.275
 5 | MinimumVisualStudioVersion = 10.0.40219.1
 6 | Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "VietOCR", "VietOCR.csproj", "{1DDD5F42-D710-4AB7-BAA9-5A8C2A83EFCF}"
 7 | EndProject
 8 | Project("{54435603-DBB4-11D2-8724-00A0C9A8B90C}") = "Setup", "Setup\Setup.vdproj", "{76C0F1BE-1BA1-4096-8A4E-8E35A5E361C9}"
 9 | EndProject
10 | Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "Tests", "Tests", "{02EA681E-C7D8-13C7-8484-4AC65E1B71E8}"
11 | EndProject
12 | Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "UnitTest", "Test\UnitTest.csproj", "{61E5E263-898A-4BB0-B099-B7194BC58529}"
13 | EndProject
14 | Global
15 | 	GlobalSection(SolutionConfigurationPlatforms) = preSolution
16 | 		Debug|Any CPU = Debug|Any CPU
17 | 		Release|Any CPU = Release|Any CPU
18 | 	EndGlobalSection
19 | 	GlobalSection(ProjectConfigurationPlatforms) = postSolution
20 | 		{1DDD5F42-D710-4AB7-BAA9-5A8C2A83EFCF}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
21 | 		{1DDD5F42-D710-4AB7-BAA9-5A8C2A83EFCF}.Debug|Any CPU.Build.0 = Debug|Any CPU
22 | 		{1DDD5F42-D710-4AB7-BAA9-5A8C2A83EFCF}.Release|Any CPU.ActiveCfg = Release|Any CPU
23 | 		{1DDD5F42-D710-4AB7-BAA9-5A8C2A83EFCF}.Release|Any CPU.Build.0 = Release|Any CPU
24 | 		{76C0F1BE-1BA1-4096-8A4E-8E35A5E361C9}.Debug|Any CPU.ActiveCfg = Debug
25 | 		{76C0F1BE-1BA1-4096-8A4E-8E35A5E361C9}.Release|Any CPU.ActiveCfg = Release
26 | 		{61E5E263-898A-4BB0-B099-B7194BC58529}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
27 | 		{61E5E263-898A-4BB0-B099-B7194BC58529}.Debug|Any CPU.Build.0 = Debug|Any CPU
28 | 		{61E5E263-898A-4BB0-B099-B7194BC58529}.Release|Any CPU.ActiveCfg = Release|Any CPU
29 | 		{61E5E263-898A-4BB0-B099-B7194BC58529}.Release|Any CPU.Build.0 = Release|Any CPU
30 | 	EndGlobalSection
31 | 	GlobalSection(SolutionProperties) = preSolution
32 | 		HideSolutionNode = FALSE
33 | 	EndGlobalSection
34 | 	GlobalSection(NestedProjects) = preSolution
35 | 		{61E5E263-898A-4BB0-B099-B7194BC58529} = {02EA681E-C7D8-13C7-8484-4AC65E1B71E8}
36 | 	EndGlobalSection
37 | 	GlobalSection(ExtensibilityGlobals) = postSolution
38 | 		SolutionGuid = {631CDFDA-3AEA-40F5-8FD9-F9827F80034C}
39 | 		RESX_SortFileContentOnSave = True
40 | 		RESX_ResXSortingComparison = CurrentCulture
41 | 	EndGlobalSection
42 | EndGlobal
43 | 


--------------------------------------------------------------------------------
/Controls/ResizeThumb.cs:
--------------------------------------------------------------------------------
 1 | using System;
 2 | using System.Windows;
 3 | using System.Windows.Controls;
 4 | using System.Windows.Controls.Primitives;
 5 | 
 6 | namespace VietOCR.Controls
 7 | {
 8 |     /// <summary>
 9 |     /// Thumb that resizes the Control found in its DataContext while being dragged.
10 |     /// The thumb's own vertical and horizontal alignment select which edges move.
11 |     /// </summary>
12 |     public class ResizeThumb : Thumb
13 |     {
14 |         public ResizeThumb()
15 |         {
16 |             DragDelta += ResizeThumb_DragDelta;
17 |         }
18 | 
19 |         // Applies one drag step to the target control; the event is always marked handled.
20 |         private void ResizeThumb_DragDelta(object sender, DragDeltaEventArgs e)
21 |         {
22 |             Control target = DataContext as Control;
23 | 
24 |             if (target != null)
25 |             {
26 |                 DragVertically(target, e.VerticalChange);
27 |                 DragHorizontally(target, e.HorizontalChange);
28 |             }
29 | 
30 |             e.Handled = true;
31 |         }
32 | 
33 |         // Bottom thumb: changes the height only. Top thumb: also shifts Canvas.Top by the
34 |         // same amount. The reduction is capped at ActualHeight - MinHeight.
35 |         private void DragVertically(Control target, double change)
36 |         {
37 |             if (VerticalAlignment == VerticalAlignment.Bottom)
38 |             {
39 |                 double reduction = Math.Min(-change, target.ActualHeight - target.MinHeight);
40 |                 target.Height -= reduction;
41 |             }
42 |             else if (VerticalAlignment == VerticalAlignment.Top)
43 |             {
44 |                 double reduction = Math.Min(change, target.ActualHeight - target.MinHeight);
45 |                 Canvas.SetTop(target, Canvas.GetTop(target) + reduction);
46 |                 target.Height -= reduction;
47 |             }
48 |         }
49 | 
50 |         // Left thumb: shifts Canvas.Left and changes the width. Right thumb: changes the
51 |         // width only. The reduction is capped at ActualWidth - MinWidth.
52 |         private void DragHorizontally(Control target, double change)
53 |         {
54 |             if (HorizontalAlignment == HorizontalAlignment.Left)
55 |             {
56 |                 double reduction = Math.Min(change, target.ActualWidth - target.MinWidth);
57 |                 Canvas.SetLeft(target, Canvas.GetLeft(target) + reduction);
58 |                 target.Width -= reduction;
59 |             }
60 |             else if (HorizontalAlignment == HorizontalAlignment.Right)
61 |             {
62 |                 double reduction = Math.Min(-change, target.ActualWidth - target.MinWidth);
63 |                 target.Width -= reduction;
64 |             }
65 |         }
66 |     }
67 | }
68 | 


--------------------------------------------------------------------------------
/Utilities/Utilities.cs:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Copyright @ 2008 Quan Nguyen
 3 |  * 
 4 |  * Licensed under the Apache License, Version 2.0 (the "License");
 5 |  * you may not use this file except in compliance with the License.
 6 |  * You may obtain a copy of the License at
 7 |  *
 8 |  *  http://www.apache.org/licenses/LICENSE-2.0
 9 |  *
10 |  * Unless required by applicable law or agreed to in writing, software
11 |  * distributed under the License is distributed on an "AS IS" BASIS,
12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 |  * See the License for the specific language governing permissions and
14 |  * limitations under the License.
15 | */
16 | using System;
17 | using System.Collections.Generic;
18 | using System.Text;
19 | using System.Windows;
20 | using System.Windows.Controls;
21 | using System.Windows.Controls.Primitives;
22 | using System.Xml;
23 | 
24 | namespace VietOCR.NET.Utilities
25 | {
26 |     static class Utilities
27 |     {
28 |         /// <summary>
29 |         /// Populates a dictionary with entries from an XML document. Each
30 |         /// <c>entry</c> element contributes one pair: the value of its first attribute
31 |         /// is the key and its inner text is the value. Keys already in the table are
32 |         /// left untouched, so the first occurrence of a key wins.
33 |         /// </summary>
34 |         /// <param name="table">Dictionary that receives the entries.</param>
35 |         /// <param name="xmlFilePath">Path of the XML file to read.</param>
36 |         public static void LoadFromXML(Dictionary<string, string> table, string xmlFilePath)
37 |         {
38 |             XmlDocument doc = new XmlDocument();
39 |             doc.Load(xmlFilePath);
40 | 
41 |             foreach (XmlNode node in doc.GetElementsByTagName("entry"))
42 |             {
43 |                 // An entry without attributes has no key; skip it rather than
44 |                 // dereferencing a missing attribute.
45 |                 if (node.Attributes == null || node.Attributes.Count == 0)
46 |                 {
47 |                     continue;
48 |                 }
49 | 
50 |                 string key = node.Attributes[0].Value;
51 |                 if (!table.ContainsKey(key))
52 |                 {
53 |                     table.Add(key, node.InnerText);
54 |                 }
55 |             }
56 |         }
57 | 
58 |         /// <summary>
59 |         /// Simulates a button click by raising the Click routed event on the button.
60 |         /// </summary>
61 |         /// <param name="btn">Button that raises the event.</param>
62 |         public static void PerformClick(this Button btn)
63 |         {
64 |             btn.RaiseEvent(new RoutedEventArgs(Button.ClickEvent));
65 |         }
66 | 
67 |         /// <summary>
68 |         /// Simulates a toggle-button click: flips IsChecked, then raises the Click routed event.
69 |         /// </summary>
70 |         /// <param name="btn">Toggle button that raises the event.</param>
71 |         public static void PerformClick(this ToggleButton btn)
72 |         {
73 |             // true <-> false; a null (indeterminate) state stays null.
74 |             btn.IsChecked ^= true;
75 |             btn.RaiseEvent(new RoutedEventArgs(ToggleButton.ClickEvent));
76 |         }
77 |     }
78 | }
79 | 


--------------------------------------------------------------------------------
/.tx/config:
--------------------------------------------------------------------------------
 1 | [main]
 2 | host = https://www.transifex.com
 3 | 
 4 | [o:vietocr:p:vietocr:r:BulkDialog_resx]
 5 | file_filter            = BulkDialog.<lang>.resx
 6 | source_file            = BulkDialog.resx
 7 | source_lang            = en
 8 | type                   = RESX
 9 | 
10 | [o:vietocr:p:vietocr:r:ChangeCaseDialog_resx]
11 | file_filter            = ChangeCaseDialog.<lang>.resx
12 | source_file            = ChangeCaseDialog.resx
13 | source_lang            = en
14 | type                   = RESX
15 | 
16 | [o:vietocr:p:vietocr:r:DownloadDialog_resx]
17 | file_filter            = DownloadDialog.<lang>.resx
18 | source_file            = DownloadDialog.resx
19 | source_lang            = en
20 | type                   = RESX
21 | 
22 | [o:vietocr:p:vietocr:r:FindReplaceDialog_resx]
23 | file_filter            = FindReplaceDialog.<lang>.resx
24 | source_file            = FindReplaceDialog.resx
25 | source_lang            = en
26 | type                   = RESX
27 | 
28 | [o:vietocr:p:vietocr:r:Gui_resx]
29 | file_filter            = Gui.<lang>.resx
30 | source_file            = Gui.resx
31 | source_lang            = en
32 | type                   = RESX
33 | 
34 | [o:vietocr:p:vietocr:r:ImageInfoDialog_resx]
35 | file_filter            = ImageInfoDialog.<lang>.resx
36 | source_file            = ImageInfoDialog.resx
37 | source_lang            = en
38 | type                   = RESX
39 | 
40 | [o:vietocr:p:vietocr:r:OptionsDialog_resx]
41 | file_filter            = OptionsDialog.<lang>.resx
42 | source_file            = OptionsDialog.resx
43 | source_lang            = en
44 | type                   = RESX
45 | 
46 | [o:vietocr:p:vietocr:r:Resources_resx]
47 | file_filter            = Properties/Resources.<lang>.resx
48 | source_file            = Properties/Resources.resx
49 | source_lang            = en
50 | type                   = RESX
51 | 
52 | [o:vietocr:p:vietocr:r:SliderDialog_resx]
53 | file_filter            = SliderDialog.<lang>.resx
54 | source_file            = SliderDialog.resx
55 | source_lang            = en
56 | type                   = RESX
57 | 
58 | [o:vietocr:p:vietocr:r:SplitPdfDialog_resx]
59 | file_filter            = SplitPdfDialog.<lang>.resx
60 | source_file            = SplitPdfDialog.resx
61 | source_lang            = en
62 | type                   = RESX
63 | 
64 | [o:vietocr:p:vietocr:r:readme_cs_html]
65 | file_filter            = readme_cs_<lang>.html
66 | source_file            = readme_cs.html
67 | source_lang            = en
68 | type                   = HTML
69 | 


--------------------------------------------------------------------------------
/Properties/AssemblyInfo.cs:
--------------------------------------------------------------------------------
 1 | using System.Reflection;
 2 | using System.Resources;
 3 | using System.Runtime.CompilerServices;
 4 | using System.Runtime.InteropServices;
 5 | using System.Windows;
 6 | 
 7 | // General Information about an assembly is controlled through the following 
 8 | // set of attributes. Change these attribute values to modify the information
 9 | // associated with an assembly.
10 | [assembly: AssemblyTitle("VietOCR.NET")]
11 | [assembly: AssemblyDescription(".NET WPF GUI Frontend for Tesseract OCR engine")]
12 | [assembly: AssemblyConfiguration("")]
13 | [assembly: AssemblyCompany("VietUnicode")]
14 | [assembly: AssemblyProduct("VietOCR.NET")]
15 | [assembly: AssemblyCopyright("Copyright © VietUnicode 2019")]
16 | [assembly: AssemblyTrademark("")]
17 | [assembly: AssemblyCulture("")]
18 | 
19 | // Setting ComVisible to false makes the types in this assembly not visible 
20 | // to COM components.  If you need to access a type in this assembly from 
21 | // COM, set the ComVisible attribute to true on that type.
22 | [assembly: ComVisible(false)]
23 | 
24 | //In order to begin building localizable applications, set 
25 | //<UICulture>CultureYouAreCodingWith</UICulture> in your .csproj file
26 | //inside a <PropertyGroup>.  For example, if you are using US english
27 | //in your source files, set the <UICulture> to en-US.  Then uncomment
28 | //the NeutralResourceLanguage attribute below.  Update the "en-US" in
29 | //the line below to match the UICulture setting in the project file.
30 | 
31 | //[assembly: NeutralResourcesLanguage("en-US", UltimateResourceFallbackLocation.Satellite)]
32 | 
33 | 
34 | [assembly: ThemeInfo(
35 |     ResourceDictionaryLocation.None, //where theme specific resource dictionaries are located
36 |                                      //(used if a resource is not found in the page, 
37 |                                      // or application resource dictionaries)
38 |     ResourceDictionaryLocation.SourceAssembly //where the generic resource dictionary is located
39 |                                               //(used if a resource is not found in the page, 
40 |                                               // app, or any theme specific resource dictionaries)
41 | )]
42 | 
43 | 
44 | // Version information for an assembly consists of the following four values:
45 | //
46 | //      Major Version
47 | //      Minor Version 
48 | //      Build Number
49 | //      Revision
50 | //
51 | // You can specify all the values or you can default the Build and Revision Numbers 
52 | // by using the '*' as shown below:
53 | // [assembly: AssemblyVersion("1.0.*")]
54 | [assembly: AssemblyVersion("1.0.0.0")]
55 | [assembly: AssemblyFileVersion("6.15.1.0")]
56 | 


--------------------------------------------------------------------------------
/dict/vi_VN.aff:
--------------------------------------------------------------------------------
  1 | SET UTF-8
  2 | TRY aAàÀảẢãÃáÁạẠăĂằẰẳẲẵẴắẮặẶâÂầẦẩẨẫẪấẤậẬbBcCdDđĐeEèÈẻẺẽẼéÉẹẸêÊềỀểỂễỄếẾệỆfFgGhHiIìÌỉỈĩĨíÍịỊjJkKlLmMnNoOòÒỏỎõÕóÓọỌôÔồỒổỔỗỖốỐộỘơƠờỜởỞỡỠớỚợỢpPqQrRsStTuUùÙủỦũŨúÚụỤưƯừỪửỬữỮứỨựỰvVwWxXyYỳỲỷỶỹỸýÝỵỴzZ
  3 | 
  4 | REP 206
  5 | REP f ph
  6 | REP uo ườ
  7 | REP uo ướ
  8 | REP uo ưở
  9 | REP uo ưỡ
 10 | REP uo ươ
 11 | REP uo ượ
 12 | REP ươ ườ
 13 | REP ươ ướ
 14 | REP ươ ưở
 15 | REP ươ ưỡ
 16 | REP ươ ượ
 17 | REP a à
 18 | REP A À 
 19 | REP a ả
 20 | REP A Ả 
 21 | REP a ã
 22 | REP A Ã
 23 | REP a á
 24 | REP A Á
 25 | REP a ạ
 26 | REP A Ạ
 27 | REP a ă
 28 | REP A Ă
 29 | REP a ằ
 30 | REP A Ằ
 31 | REP a ẳ
 32 | REP A Ẳ
 33 | REP a ẵ
 34 | REP A Ẵ
 35 | REP a ắ
 36 | REP A Ắ
 37 | REP a ặ
 38 | REP A Ặ
 39 | REP ă ằ
 40 | REP Ă Ằ
 41 | REP ă ẳ
 42 | REP Ă Ẳ
 43 | REP ă ẵ
 44 | REP Ă Ẵ
 45 | REP ă ắ
 46 | REP Ă Ắ
 47 | REP ă ặ
 48 | REP Ă Ặ
 49 | REP a â
 50 | REP A Â
 51 | REP a ầ
 52 | REP A Ầ
 53 | REP a ẩ
 54 | REP A Ẩ
 55 | REP a ẫ
 56 | REP A Ẫ
 57 | REP a ấ
 58 | REP A Ấ
 59 | REP a ậ
 60 | REP A Ậ
 61 | REP â ầ
 62 | REP Â Ầ
 63 | REP â ẩ
 64 | REP Â Ẩ
 65 | REP â ẫ
 66 | REP Â Ẫ
 67 | REP â ấ
 68 | REP Â Ấ
 69 | REP â ậ
 70 | REP Â Ậ
 71 | REP d đ
 72 | REP D Đ
 73 | REP e è
 74 | REP E È
 75 | REP e ẻ
 76 | REP E Ẻ
 77 | REP e ẽ
 78 | REP E Ẽ
 79 | REP e é
 80 | REP E É
 81 | REP e ẹ
 82 | REP E Ẹ
 83 | REP e ê
 84 | REP E Ê
 85 | REP e ề
 86 | REP E Ề
 87 | REP e ể
 88 | REP E Ể
 89 | REP e ễ
 90 | REP E Ễ
 91 | REP e ế
 92 | REP E Ế
 93 | REP e ệ
 94 | REP E Ệ
 95 | REP ê ề
 96 | REP Ê Ề
 97 | REP ê ể
 98 | REP Ê Ể
 99 | REP ê ễ
100 | REP Ê Ễ
101 | REP ê ế
102 | REP Ê Ế
103 | REP ê ệ
104 | REP Ê Ệ
105 | REP i ì
106 | REP I Ì
107 | REP i ỉ
108 | REP I Ỉ
109 | REP i ĩ
110 | REP I Ĩ
111 | REP i í
112 | REP I Í
113 | REP i ị
114 | REP I Ị
115 | REP o ò
116 | REP O Ò
117 | REP o ỏ
118 | REP O Ỏ
119 | REP o õ
120 | REP O Õ
121 | REP o ó
122 | REP O Ó
123 | REP o ọ
124 | REP O Ọ
125 | REP o ô
126 | REP O Ô
127 | REP o ồ
128 | REP O Ồ
129 | REP o ổ
130 | REP O Ổ
131 | REP o ỗ
132 | REP O Ỗ
133 | REP o ố
134 | REP O Ố
135 | REP o ộ
136 | REP O Ộ
137 | REP ô ồ
138 | REP Ô Ồ
139 | REP ô ổ
140 | REP Ô Ổ
141 | REP ô ỗ
142 | REP Ô Ỗ
143 | REP ô ố
144 | REP Ô Ố
145 | REP ô ộ
146 | REP Ô Ộ
147 | REP o ơ
148 | REP O Ơ
149 | REP o ờ
150 | REP O Ờ
151 | REP o ở
152 | REP O Ở
153 | REP o ỡ
154 | REP O Ỡ
155 | REP o ớ
156 | REP O Ớ
157 | REP o ợ
158 | REP O Ợ
159 | REP ơ ờ
160 | REP Ơ Ờ
161 | REP ơ ở
162 | REP Ơ Ở
163 | REP ơ ỡ
164 | REP Ơ Ỡ
165 | REP ơ ớ
166 | REP Ơ Ớ
167 | REP ơ ợ
168 | REP Ơ Ợ
169 | REP u ù
170 | REP U Ù
171 | REP u ủ
172 | REP U Ủ
173 | REP u ũ
174 | REP U Ũ
175 | REP u ú
176 | REP U Ú
177 | REP u ụ
178 | REP U Ụ
179 | REP u ư
180 | REP U Ư
181 | REP u ừ
182 | REP U Ừ
183 | REP u ử
184 | REP U Ử
185 | REP u ữ
186 | REP U Ữ
187 | REP u ứ
188 | REP U Ứ
189 | REP u ự
190 | REP U Ự
191 | REP ư ừ
192 | REP Ư Ừ
193 | REP ư ử
194 | REP Ư Ử
195 | REP ư ữ
196 | REP Ư Ữ
197 | REP ư ứ
198 | REP Ư Ứ
199 | REP ư ự
200 | REP Ư Ự
201 | REP y ỳ
202 | REP Y Ỳ
203 | REP y ỷ
204 | REP Y Ỷ
205 | REP y ỹ
206 | REP Y Ỹ
207 | REP y ý
208 | REP Y Ý
209 | REP Y Ỵ
210 | REP y ỵ


--------------------------------------------------------------------------------
/App.xaml.cs:
--------------------------------------------------------------------------------
 1 | using Microsoft.Win32;
 2 | using System;
 3 | using System.Collections.Generic;
 4 | using System.Configuration;
 5 | using System.Data;
 6 | using System.Globalization;
 7 | using System.Linq;
 8 | using System.Runtime.InteropServices;
 9 | using System.Threading;
10 | using System.Threading.Tasks;
11 | using System.Windows;
12 | using System.Windows.Markup;
13 | 
14 | namespace VietOCR
15 | {
16 |     /// <summary>
17 |     /// Interaction logic for App.xaml
18 |     /// </summary>
19 |     public partial class App : Application
20 |     {
21 |         [DllImport("kernel32.dll")]
22 |         private static extern bool AllocConsole();
23 | 
24 |         [DllImport("kernel32.dll")]
25 |         private static extern bool AttachConsole(int pid);
26 | 
27 |         private string strRegKey = "Software\\VietUnicode\\";
28 |         const string strUILang = "UILanguage";
29 |         const string strDefaultUILang = "en-US"; // used when the registry holds no usable value
30 |         public const string strProgName = "VietOCR.NET";
31 | 
32 |         /// <summary>Without arguments: reads the UI language from the registry and shows the main
33 |         /// window. With arguments: passes them to ConsoleApp.Main and exits the process.</summary>
34 |         protected override void OnStartup(StartupEventArgs e)
35 |         {
36 |             if (e.Args.Length == 0)
37 |             {
38 |                 base.OnStartup(e);
39 | 
40 |                 // Access registry to determine which UI Language to be loaded.
41 |                 // The desired locale must be known before initializing visual components
42 |                 // with language text. Waiting until OnLoad would be too late.
43 |                 strRegKey += strProgName;
44 | 
45 |                 string selectedUILanguage;
46 |                 // using releases the key handle even if reading the value throws.
47 |                 using (RegistryKey regkey = Registry.CurrentUser.OpenSubKey(strRegKey)
48 |                     ?? Registry.CurrentUser.CreateSubKey(strRegKey))
49 |                 {
50 |                     // A missing key or a non-string value falls back to the default language.
51 |                     object stored = regkey == null ? null : regkey.GetValue(strUILang, strDefaultUILang);
52 |                     selectedUILanguage = (stored as string) ?? strDefaultUILang;
53 |                 }
54 | 
55 |                 //XmlLanguage lang = XmlLanguage.GetLanguage(CultureInfo.CurrentCulture.IetfLanguageTag);
56 |                 //FrameworkElement.LanguageProperty.OverrideMetadata(typeof(FrameworkElement), new FrameworkPropertyMetadata(lang));
57 |                 //FrameworkContentElement.LanguageProperty.OverrideMetadata(typeof(System.Windows.Documents.TextElement), new FrameworkPropertyMetadata(lang));
58 | 
59 |                 // Sets the UI culture to the selected language.
60 |                 ChangeCulture(GetCultureOrDefault(selectedUILanguage));
61 |             }
62 |             else
63 |             {
64 |                 // Command line given, display console
65 |                 if (!AttachConsole(-1)) // Attach to a parent process console
66 |                 {
67 |                     AllocConsole(); // Alloc a new console
68 |                 }
69 | 
70 |                 ConsoleApp.Main(e.Args);
71 |                 Environment.Exit(0);
72 |             }
73 |         }
74 | 
75 |         // Builds the culture for a stored name; an unrecognized name (e.g. a corrupted
76 |         // registry value) yields the default culture instead of aborting startup.
77 |         private static CultureInfo GetCultureOrDefault(string cultureName)
78 |         {
79 |             try { return new CultureInfo(cultureName); }
80 |             catch (CultureNotFoundException) { return new CultureInfo(strDefaultUILang); }
81 |         }
82 | 
83 |         /// <summary>Sets the current thread's UI culture, then shows a new GuiWithTools as the
84 |         /// main window and closes the previous main window, if there was one.</summary>
85 |         public static void ChangeCulture(CultureInfo newCulture)
86 |         {
87 |             Thread.CurrentThread.CurrentUICulture = newCulture;
88 |             var oldWindow = Application.Current.MainWindow;
89 |             Application.Current.MainWindow = new GuiWithTools();
90 |             Application.Current.MainWindow.Show();
91 | 
92 |             if (oldWindow != null)
93 |             {
94 |                 oldWindow.Close();
95 |             }
96 |         }
97 |     }
98 | }
99 | 


--------------------------------------------------------------------------------
/SliderDialog.xaml.cs:
--------------------------------------------------------------------------------
  1 | using System;
  2 | using System.Collections.Generic;
  3 | using System.Linq;
  4 | using System.Text;
  5 | using System.Threading.Tasks;
  6 | using System.Windows;
  7 | using System.Windows.Controls;
  8 | using System.Windows.Data;
  9 | using System.Windows.Documents;
 10 | using System.Windows.Input;
 11 | using System.Windows.Media;
 12 | using System.Windows.Media.Imaging;
 13 | using System.Windows.Shapes;
 14 | 
 15 | namespace VietOCR
 16 | {
 17 |     /// <summary>
 18 |     /// Interaction logic for SliderDialog.xaml
 19 |     /// </summary>
 20 |     public partial class SliderDialog : Window
 21 |     {
 22 |         /// <summary>Sets the content of the dialog's label.</summary>
 23 |         public string LabelText
 24 |         {
 25 |             set { this.label1.Content = value; }
 26 |         }
 27 | 
 28 |         // Slider value most recently reported through ValueUpdated.
 29 |         private double prevValue;
 30 | 
 31 |         public delegate void HandleValueChange(object sender, ValueChangedEventArgs e);
 32 |         public event HandleValueChange ValueUpdated;
 33 | 
 34 |         public SliderDialog()
 35 |         {
 36 |             InitializeComponent();
 37 |         }
 38 | 
 39 |         // Forwards slider movement to ValueUpdated subscribers, if there are any.
 40 |         private void slider_ValueChanged(object sender, RoutedPropertyChangedEventArgs<double> e)
 41 |         {
 42 |             if (this.ValueUpdated == null)
 43 |             {
 44 |                 return;
 45 |             }
 46 | 
 47 |             Slider source = (Slider)sender;
 48 |             double current = source.Value;
 49 | 
 50 |             //reduce # of unnecessary value changed events
 51 |             if (Math.Abs(current - prevValue) >= source.SmallChange)
 52 |             {
 53 |                 prevValue = current;
 54 |                 this.ValueUpdated(this, new ValueChangedEventArgs(current));
 55 |             }
 56 |         }
 57 | 
 58 |         /// <summary>Event data carrying the slider's new value.</summary>
 59 |         public class ValueChangedEventArgs : EventArgs
 60 |         {
 61 |             public double NewValue { get; set; }
 62 | 
 63 |             public ValueChangedEventArgs(double value)
 64 |                 : base()
 65 |             {
 66 |                 this.NewValue = value;
 67 |             }
 68 |         }
 69 | 
 70 |         public void SetForContrast()
 71 |         {
 72 |             ConfigureSlider(5, 25, 10);
 73 |         }
 74 | 
 75 |         public void SetForGamma()
 76 |         {
 77 |             ConfigureSlider(0, 50, 10);
 78 |         }
 79 | 
 80 |         public void SetForThreshold()
 81 |         {
 82 |             ConfigureSlider(0, 50, 10);
 83 |         }
 84 | 
 85 |         // Assigns the slider's Minimum, Value and TickFrequency, in that order.
 86 |         private void ConfigureSlider(double minimum, double value, double tickFrequency)
 87 |         {
 88 |             this.slider.Minimum = minimum;
 89 |             this.slider.Value = value;
 90 |             this.slider.TickFrequency = tickFrequency;
 91 |         }
 92 | 
 93 |         // Apply: sets a true dialog result, then hides and closes the window.
 94 |         private void buttonApply_Click(object sender, RoutedEventArgs e)
 95 |         {
 96 |             this.DialogResult = true;
 97 |             this.Visibility = Visibility.Hidden;
 98 |             this.Close();
 99 |         }
100 | 
101 |         // Cancel: hides and closes the window without setting a dialog result.
102 |         private void buttonCancel_Click(object sender, RoutedEventArgs e)
103 |         {
104 |             this.Visibility = Visibility.Hidden;
105 |             this.Close();
106 |         }
107 |     }
108 | }
109 | 


--------------------------------------------------------------------------------
/WIA/WiaScannerAdapter.cs:
--------------------------------------------------------------------------------
  1 | //http://geekswithblogs.net/tonyt/archive/2006/07/29/86608.aspx
  2 | 
  3 | using System;
  4 | using System.Collections.Generic;
  5 | using System.Text;
  6 | using System.Drawing;
  7 | using System.Drawing.Imaging;
  8 | using System.IO;
  9 | using System.Runtime.InteropServices;
 10 | using System.Security.Permissions;
 11 | using WIA;
 12 | 
 13 | namespace VietOCR.NET.WIA
 14 | {
 15 |     public enum WiaScannerError : uint // error codes for WIA scanning (presumably COM HRESULT values - TODO confirm)
 16 |     {
 17 |         LibraryNotInstalled = 0x80040154, // presumably REGDB_E_CLASSNOTREG (COM class not registered) - verify
 18 |         OutputFileExists = 0x80070050, // presumably the HRESULT form of Win32 ERROR_FILE_EXISTS - verify
 19 |         ScannerNotAvailable = 0x80210015, // WIA-range code; matching WIA constant not shown in this file
 20 |         OperationCancelled = 0x80210064 // WIA-range code; matching WIA constant not shown in this file
 21 |     }
 22 | 
 23 |     /// <summary>Acquires an image from a scanner through the WIA common dialog.</summary>
 24 |     public sealed class WiaScannerAdapter : IDisposable
 25 |     {
 26 |         private ICommonDialog _wiaManager; // created on the first ScanImage call
 27 |         private bool _disposed; // indicates if Dispose has been called
 28 | 
 29 |         public WiaScannerAdapter() { }
 30 | 
 31 |         ~WiaScannerAdapter()
 32 |         {
 33 |             Dispose(false);
 34 |         }
 35 | 
 36 |         private ICommonDialog WiaManager
 37 |         {
 38 |             get { return _wiaManager; }
 39 |             set { _wiaManager = value; }
 40 |         }
 41 | 
 42 |         /// <summary>
 43 |         /// Shows the WIA acquire-image dialog, saves the acquired image to
 44 |         /// <paramref name="fileName"/> and returns the image loaded from that file.
 45 |         /// </summary>
 46 |         /// <param name="outputFormat">Requested image format; its GUID is passed to WIA.</param>
 47 |         /// <param name="fileName">Path the acquired image is saved to.</param>
 48 |         /// <returns>The image loaded from <paramref name="fileName"/>.</returns>
 49 |         /// <exception cref="ArgumentNullException"><paramref name="outputFormat"/> is null.</exception>
 50 |         /// <exception cref="WiaOperationException">A COM error was raised while scanning.</exception>
 51 |         [System.Diagnostics.DebuggerNonUserCodeAttribute()]
 52 |         [SecurityPermission(SecurityAction.Demand, UnmanagedCode = true)]
 53 |         public Image ScanImage(ImageFormat outputFormat, string fileName)
 54 |         {
 55 |             if (outputFormat == null)
 56 |                 throw new ArgumentNullException("outputFormat");
 57 | 
 58 |             FileIOPermission filePerm = new FileIOPermission(FileIOPermissionAccess.AllAccess, fileName);
 59 |             filePerm.Demand();
 60 | 
 61 |             ImageFile imageObject = null;
 62 |             try
 63 |             {
 64 |                 if (WiaManager == null)
 65 |                     WiaManager = new CommonDialog();
 66 | 
 67 |                 imageObject =
 68 |                     WiaManager.ShowAcquireImage(WiaDeviceType.ScannerDeviceType,
 69 |                         WiaImageIntent.GrayscaleIntent, WiaImageBias.MaximizeQuality,
 70 |                         outputFormat.Guid.ToString("B"), false, true, true);
 71 | 
 72 |                 imageObject.SaveFile(fileName);
 73 |                 return Image.FromFile(fileName);
 74 |             }
 75 |             catch (COMException ex)
 76 |             {
 77 |                 throw new WiaOperationException("Error scanning image", ex);
 78 |             }
 79 |             finally
 80 |             {
 81 |                 if (imageObject != null)
 82 |                     Marshal.ReleaseComObject(imageObject);
 83 |             }
 84 |         }
 85 | 
 86 |         public void Dispose()
 87 |         {
 88 |             Dispose(true);
 89 |             GC.SuppressFinalize(this);
 90 |         }
 91 | 
 92 |         private void Dispose(bool disposing)
 93 |         {
 94 |             // The dialog is a managed COM wrapper: release it only on explicit Dispose, not from the finalizer.
 95 |             if (disposing && _wiaManager != null)
 96 |             {
 97 |                 Marshal.ReleaseComObject(_wiaManager);
 98 |                 _wiaManager = null; // a later ScanImage creates a fresh dialog instead of using a released one
 99 |             }
100 |             _disposed = true;
101 |         }
102 |     }
103 | }
104 | 


--------------------------------------------------------------------------------
/DataSource.cs:
--------------------------------------------------------------------------------
  1 | /// https://www.codeproject.com/Articles/45782/A-WPF-Combo-Box-with-Multiple-Selection
  2 | 
  3 | using System;
  4 | using System.Collections.Generic;
  5 | using System.Linq;
  6 | using System.Text;
  7 | using System.Collections.ObjectModel;
  8 | using System.ComponentModel;
  9 | using System.Windows.Data;
 10 | using System.Windows;
 11 | 
 12 | namespace VietOCR
 13 | {
 14 |     /// <summary>
 15 |     /// Bindable model exposing the installed languages and the current language selection.
 16 |     /// </summary>
 17 |     public class DataSource : INotifyPropertyChanged
 18 |     {
 19 |         #region INotifyPropertyChanged Members
 20 | 
 21 |         public event PropertyChangedEventHandler PropertyChanged;
 22 |         private void OnPropertyChanged(string propertyName)
 23 |         {
 24 |             PropertyChangedEventHandler handler = PropertyChanged; // snapshot: a subscriber may detach meanwhile
 25 |             if (handler != null)
 26 |                 handler(this, new PropertyChangedEventArgs(propertyName));
 27 |         }
 28 | 
 29 |         #endregion
 30 | 
 31 |         /// <summary>Languages that may be selected; used to filter assignments to SelectedLanguages.</summary>
 32 |         public ObservableCollection<string> InstalledLanguages { get; set; }
 33 | 
 34 |         private string _selectedLanguage = "English";
 35 | 
 36 |         /// <summary>Single selected language; raises PropertyChanged on every assignment.</summary>
 37 |         public string SelectedLanguage
 38 |         {
 39 |             get { return _selectedLanguage; }
 40 |             set
 41 |             {
 42 |                 _selectedLanguage = value;
 43 |                 OnPropertyChanged("SelectedLanguage");
 44 |             }
 45 |         }
 46 | 
 47 |         private ObservableCollection<string> _selectedLanguages;
 48 | 
 49 |         /// <summary>
 50 |         /// Multiple selection. Created on first read containing "English". Assigning keeps the same
 51 |         /// collection instance and refills it with the installed entries of the assigned value.
 52 |         /// </summary>
 53 |         public ObservableCollection<string> SelectedLanguages
 54 |         {
 55 |             get
 56 |             {
 57 |                 if (_selectedLanguages == null)
 58 |                 {
 59 |                     _selectedLanguages = new ObservableCollection<string> { "English" };
 60 |                     SelectedLanguagesText = WriteSelectedLanguagesString(_selectedLanguages);
 61 |                     _selectedLanguages.CollectionChanged += (s, e) =>
 62 |                     {
 63 |                         SelectedLanguagesText = WriteSelectedLanguagesString(_selectedLanguages);
 64 |                         OnPropertyChanged("SelectedLanguages");
 65 |                     };
 66 |                 }
 67 |                 return _selectedLanguages;
 68 |             }
 69 |             set
 70 |             {
 71 |                 // Go through the getter so the backing collection exists even if it was never read,
 72 |                 // and copy the input first so assigning the collection to itself keeps its items.
 73 |                 ObservableCollection<string> target = SelectedLanguages;
 74 |                 List<string> requested = value == null ? new List<string>() : new List<string>(value);
 75 |                 ObservableCollection<string> installed = InstalledLanguages;
 76 |                 target.Clear();
 77 |                 foreach (string lang in requested)
 78 |                 {
 79 |                     if (installed != null && installed.Contains(lang))
 80 |                         target.Add(lang);
 81 |                 }
 82 |             }
 83 |         }
 84 | 
 85 |         private string _selectedLanguagesText;
 86 | 
 87 |         /// <summary>Comma-separated text of the selected languages; raises PropertyChanged when set.</summary>
 88 |         public string SelectedLanguagesText
 89 |         {
 90 |             get { return _selectedLanguagesText; }
 91 |             set
 92 |             {
 93 |                 _selectedLanguagesText = value;
 94 |                 OnPropertyChanged("SelectedLanguagesText");
 95 |             }
 96 |         }
 97 | 
 98 |         private static string WriteSelectedLanguagesString(IList<string> list)
 99 |         {
100 |             return string.Join(", ", list);
101 |         }
102 |     }
103 | }
104 | 


--------------------------------------------------------------------------------
/ImageInfoDialog.xaml.cs:
--------------------------------------------------------------------------------
 1 | using System;
 2 | using System.Collections.Generic;
 3 | using System.Drawing;
 4 | using System.Linq;
 5 | using System.Text;
 6 | using System.Threading.Tasks;
 7 | using System.Windows;
 8 | using System.Windows.Controls;
 9 | using System.Windows.Data;
10 | using System.Windows.Documents;
11 | using System.Windows.Input;
12 | using System.Windows.Media;
13 | using System.Windows.Media.Imaging;
14 | using System.Windows.Shapes;
15 | 
16 | namespace VietOCR
17 | {
18 |     /// <summary>
19 |     /// Interaction logic for ImageInfoDialog.xaml: shows an image's resolution, size and bit depth.
20 |     /// </summary>
21 |     public partial class ImageInfoDialog : Window
22 |     {
23 |         System.Drawing.Image image;
24 |         bool isProgrammatic; // set while one unit combo box is being mirrored onto the other
25 | 
26 |         /// <summary>Image whose properties the dialog displays.</summary>
27 |         public System.Drawing.Image Image
28 |         {
29 |             get { return image; }
30 |             set { image = value; }
31 |         }
32 | 
33 |         public ImageInfoDialog()
34 |         {
35 |             InitializeComponent();
36 |         }
37 | 
38 |         private void buttonOK_Click(object sender, RoutedEventArgs e)
39 |         {
40 |             Close();
41 |         }
42 | 
43 |         /// <summary>
44 |         /// Rewrites the width/height boxes for a unit index: 1 = inches, 2 = cm, otherwise pixels.
45 |         /// </summary>
46 |         private void ConvertUnits(int unit)
47 |         {
48 |             if (unit == 1) // "inches"
49 |             {
50 |                 textBoxWidth.Text = Math.Round(image.Width / image.HorizontalResolution, 1).ToString();
51 |                 textBoxHeight.Text = Math.Round(image.Height / image.VerticalResolution, 1).ToString();
52 |             }
53 |             else if (unit == 2) // "cm"
54 |             {
55 |                 textBoxWidth.Text = Math.Round(image.Width / image.HorizontalResolution * 2.54, 2).ToString();
56 |                 textBoxHeight.Text = Math.Round(image.Height / image.VerticalResolution * 2.54, 2).ToString();
57 |             }
58 |             else // "pixel"
59 |             {
60 |                 textBoxWidth.Text = image.Width.ToString();
61 |                 textBoxHeight.Text = image.Height.ToString();
62 |             }
63 |         }
64 | 
65 |         private void Window_Loaded(object sender, RoutedEventArgs e)
66 |         {
67 |             textBoxXRes.Text = Math.Round(image.HorizontalResolution).ToString();
68 |             textBoxYRes.Text = Math.Round(image.VerticalResolution).ToString();
69 |             textBoxWidth.Text = image.Width.ToString();
70 |             textBoxHeight.Text = image.Height.ToString();
71 |             textBoxBitDepth.Text = Bitmap.GetPixelFormatSize(image.PixelFormat).ToString();
72 |             comboBoxUnitW.SelectedIndex = 0;
73 |             comboBoxUnitH.SelectedIndex = 0;
74 |         }
75 | 
76 |         private void comboBoxUnitW_SelectionChanged(object sender, SelectionChangedEventArgs e)
77 |         {
78 |             SyncUnitSelection(comboBoxUnitW, comboBoxUnitH);
79 |         }
80 | 
81 |         private void comboBoxUnitH_SelectionChanged(object sender, SelectionChangedEventArgs e)
82 |         {
83 |             SyncUnitSelection(comboBoxUnitH, comboBoxUnitW);
84 |         }
85 | 
86 |         /// <summary>Mirrors the changed combo box onto the other and refreshes the size boxes.</summary>
87 |         private void SyncUnitSelection(ComboBox changed, ComboBox other)
88 |         {
89 |             if (isProgrammatic) return; // this change was caused by the mirroring itself
90 |             isProgrammatic = true;
91 |             other.SelectedIndex = changed.SelectedIndex;
92 |             ConvertUnits(changed.SelectedIndex);
93 |             isProgrammatic = false;
94 |         }
95 |     }
96 | }
97 | 


--------------------------------------------------------------------------------
/Utilities/BreakIterator.cs:
--------------------------------------------------------------------------------
  1 | /*
  2 | * BreakIterator
  3 | *
  4 | * Attempt to mimic Java's BreakIterator class
  5 | * to analyze word boundaries.
  6 | *
  7 | * @author: Quan Nguyen
  8 | * @version: 1.4, 10 January 2011
  9 | */
 10 | 
 11 | using System.Text.RegularExpressions;
 12 | 
 13 | namespace Net.SourceForge.Vietpad.Utilities
 14 | {
 15 |     /// <summary>
 16 |     /// Word-boundary iterator modelled on Java's BreakIterator. One shared instance
 17 |     /// is handed out by GetWordInstance.
 18 |     /// </summary>
 19 |     public class BreakIterator
 20 |     {
 21 |         /// <summary>Value returned when there is no further boundary.</summary>
 22 |         public static readonly int DONE = -1;
 23 | 
 24 |         // A match is any character that directly follows a word boundary.
 25 |         static readonly Regex regex = new Regex(@"\b.", RegexOptions.Compiled | RegexOptions.Singleline);
 26 | 
 27 |         private static BreakIterator instance;
 28 |         static MatchCollection mc;   // boundary matches of the current text
 29 |         static int index;            // cursor into mc; mc.Count stands for the end of the text
 30 | 
 31 |         private string text;
 32 | 
 33 |         private BreakIterator() { }
 34 | 
 35 |         /// <summary>Returns the shared iterator, creating it on first use.</summary>
 36 |         public static BreakIterator GetWordInstance()
 37 |         {
 38 |             return instance ?? (instance = new BreakIterator());
 39 |         }
 40 | 
 41 |         /// <summary>Sets the text to scan and recomputes its boundary matches.</summary>
 42 |         public string Text
 43 |         {
 44 |             set
 45 |             {
 46 |                 text = value;
 47 |                 mc = regex.Matches(text); // collection of all word boundaries
 48 |             }
 49 |         }
 50 | 
 51 |         /// <summary>
 52 |         /// Resets the cursor and returns the offset of the first boundary (0 when there is none).
 53 |         /// </summary>
 54 |         public int First()
 55 |         {
 56 |             index = 0;
 57 |             return mc.Count > 0 ? mc[0].Index : 0;
 58 |         }
 59 | 
 60 |         /// <summary>Moves the cursor past the last match and returns the text length.</summary>
 61 |         public int Last()
 62 |         {
 63 |             index = mc.Count;
 64 |             return text.Length;
 65 |         }
 66 | 
 67 |         /// <summary>
 68 |         /// Advances the cursor. Returns the next boundary offset, the text length when the step
 69 |         /// runs past the last match, and DONE once the cursor is already at the end.
 70 |         /// </summary>
 71 |         public int Next()
 72 |         {
 73 |             if (index >= mc.Count)
 74 |             {
 75 |                 index = mc.Count;
 76 |                 return DONE;
 77 |             }
 78 | 
 79 |             index++;
 80 |             return index < mc.Count ? mc[index].Index : text.Length;
 81 |         }
 82 | 
 83 |         /// <summary>
 84 |         /// Steps the cursor back and returns that boundary's offset, or DONE when the
 85 |         /// cursor is already at the first position.
 86 |         /// </summary>
 87 |         public int Previous()
 88 |         {
 89 |             if (index <= 0)
 90 |             {
 91 |                 index = 0;
 92 |                 return DONE;
 93 |             }
 94 | 
 95 |             index--;
 96 |             return mc[index].Index;
 97 |         }
 98 | 
 99 |         /// <summary>
100 |         /// Scans from the start and returns the first boundary greater than
101 |         /// <paramref name="offset"/>, or DONE when there is none.
102 |         /// </summary>
103 |         public int Following(int offset)
104 |         {
105 |             First();
106 |             for (int boundary = Next(); boundary != DONE; boundary = Next())
107 |             {
108 |                 if (boundary > offset)
109 |                     return boundary;
110 |             }
111 | 
112 |             return DONE;
113 |         }
114 | 
115 |         /// <summary>
116 |         /// Scans from the start to the first boundary greater than <paramref name="offset"/> and
117 |         /// returns the boundary just before it; DONE when no boundary is greater than the offset.
118 |         /// </summary>
119 |         public int Preceding(int offset)
120 |         {
121 |             First();
122 |             for (int boundary = Next(); boundary != DONE; boundary = Next())
123 |             {
124 |                 if (boundary > offset)
125 |                     return Previous();
126 |             }
127 | 
128 |             return DONE;
129 |         }
130 |     }
131 | }


--------------------------------------------------------------------------------
/GuiWithInputMethod.cs:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * Copyright @ 2008 Quan Nguyen
  3 |  * 
  4 |  * Licensed under the Apache License, Version 2.0 (the "License");
  5 |  * you may not use this file except in compliance with the License.
  6 |  * You may obtain a copy of the License at
  7 |  *
  8 |  *  http://www.apache.org/licenses/LICENSE-2.0
  9 |  *
 10 |  * Unless required by applicable law or agreed to in writing, software
 11 |  * distributed under the License is distributed on an "AS IS" BASIS,
 12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 13 |  * See the License for the specific language governing permissions and
 14 |  * limitations under the License.
 15 | */
 16 | using System;
 17 | using System.Collections.Generic;
 18 | using Microsoft.Win32;
 19 | using System.Windows.Controls;
 20 | using System.Windows;
 21 | 
 22 | using Net.SourceForge.Vietpad.InputMethod;
 23 | 
 24 | namespace VietOCR
 25 | {
 26 |     /// <summary>Adds the Vietnamese input-method menu and persists the selected method.</summary>
 27 |     public partial class GuiWithInputMethod : GuiWithFormat
 28 |     {
 29 |         MenuItem miimChecked; // currently checked input-method item; null when none matched
 30 |         private string selectedInputMethod;
 31 |         const string strInputMethod = "InputMethod";
 32 | 
 33 |         public GuiWithInputMethod()
 34 |         {
 35 |             // Settings InputMethod submenu: one checkable item per InputMethods member
 36 |             RoutedEventHandler eh = new RoutedEventHandler(MenuKeyboardInputMethodOnClick);
 37 |             List<MenuItem> ar = new List<MenuItem>();
 38 |             foreach (string inputMethod in Enum.GetNames(typeof(InputMethods)))
 39 |             {
 40 |                 MenuItem miim = new MenuItem();
 41 |                 miim.Header = inputMethod;
 42 |                 miim.IsCheckable = true;
 43 |                 miim.Click += eh;
 44 |                 ar.Add(miim);
 45 |             }
 46 |             this.vietInputMethodToolStripMenuItem.ItemsSource = ar;
 47 |             new VietKeyHandler(textBox1);
 48 |         }
 49 | 
 50 |         /// <summary>
 51 |         /// Checks the menu item of the saved input method and applies that method. A missing or
 52 |         /// unknown saved name falls back to Telex instead of throwing.
 53 |         /// </summary>
 54 |         protected override void Window_Loaded(object sender, RoutedEventArgs e)
 55 |         {
 56 |             base.Window_Loaded(sender, e);
 57 |             InputMethods method;
 58 |             if (!Enum.TryParse<InputMethods>(selectedInputMethod, out method) || !Enum.IsDefined(typeof(InputMethods), method))
 59 |                 method = InputMethods.Telex;
 60 |             selectedInputMethod = method.ToString(); // keep the stored name valid for the menu and the registry
 61 | 
 62 |             foreach (MenuItem item in this.vietInputMethodToolStripMenuItem.Items)
 63 |             {
 64 |                 if (item.Header.ToString() == selectedInputMethod)
 65 |                 {
 66 |                     miimChecked = item; // Select InputMethod last saved
 67 |                     miimChecked.IsChecked = true;
 68 |                     break;
 69 |                 }
 70 |             }
 71 |             VietKeyHandler.InputMethod = method;
 72 |             VietKeyHandler.SmartMark = true;
 73 |             VietKeyHandler.ConsumeRepeatKey = true;
 74 |         }
 75 | 
 76 |         void MenuKeyboardInputMethodOnClick(object obj, EventArgs ea)
 77 |         {
 78 |             if (miimChecked != null) // no item is checked if the saved method matched none
 79 |                 miimChecked.IsChecked = false;
 80 |             miimChecked = (MenuItem)obj;
 81 |             miimChecked.IsChecked = true;
 82 |             selectedInputMethod = miimChecked.Header.ToString();
 83 |             VietKeyHandler.InputMethod = (InputMethods)Enum.Parse(typeof(InputMethods), selectedInputMethod);
 84 |         }
 85 | 
 86 |         protected override void LoadRegistryInfo(RegistryKey regkey)
 87 |         {
 88 |             base.LoadRegistryInfo(regkey);
 89 |             selectedInputMethod = (string)regkey.GetValue(strInputMethod, Enum.GetName(typeof(InputMethods), InputMethods.Telex));
 90 |         }
 91 | 
 92 |         protected override void SaveRegistryInfo(RegistryKey regkey)
 93 |         {
 94 |             base.SaveRegistryInfo(regkey);
 95 |             regkey.SetValue(strInputMethod, selectedInputMethod);
 96 |         }
 97 |     }
 98 | }
 99 | 
100 | 


--------------------------------------------------------------------------------
/Postprocessing/TextUtilities.cs:
--------------------------------------------------------------------------------
  1 | using System;
  2 | using System.Collections.Generic;
  3 | using System.Text;
  4 | using System.Text.RegularExpressions;
  5 | using System.IO;
  6 | 
  7 | namespace VietOCR.NET.Postprocessing
  8 | {
  9 |     class TextUtilities
 10 |     {
 11 |         private static List<Dictionary<string, string>> maps;
 12 |         private static DateTime mapLastModified = DateTime.MinValue;
 13 |         private static string mapFile; // full path of the file the cached maps were built from
 14 | 
 15 |         // lower uppercase letters ended by lowercase letters except the first letter
 16 |         private static readonly Regex innerUpper = new Regex("(?<=\\p{L}+)(\\p{Lu}+)(?=\\p{Ll}+)");
 17 |         // lower uppercase letters begun by lowercase letters
 18 |         private static readonly Regex upperAfterLower = new Regex("(?<=\\p{Ll}+)(\\p{Lu}+)");
 19 | 
 20 |         /// <summary>
 21 |         /// Corrects letter cases.
 22 |         /// </summary>
 23 |         /// <param name="input">Text to correct.</param>
 24 |         /// <returns>The text with the matched uppercase runs inside words lowercased.</returns>
 25 |         public static string CorrectLetterCases(string input)
 26 |         {
 27 |             input = innerUpper.Replace(input, new MatchEvaluator(LowerCaseText));
 28 |             return upperAfterLower.Replace(input, new MatchEvaluator(LowerCaseText));
 29 |         }
 30 | 
 31 |         static string LowerCaseText(Match m)
 32 |         {
 33 |             // Lowercase the matched string.
 34 |             return m.Value.ToLower();
 35 |         }
 36 | 
 37 |         /// <summary>
 38 |         /// Loads the replacement maps, one dictionary per type from Processor.PLAIN to
 39 |         /// Processor.REGEX, from a UTF-8 file of tab-delimited "type, key, value" lines.
 40 |         /// The maps are cached and reused while the same file has not been modified.
 41 |         /// </summary>
 42 |         /// <param name="dangAmbigsFile">Path of the file to read.</param>
 43 |         /// <returns>The shared list of maps; after a failure, whatever was loaded so far (may be null).</returns>
 44 |         public static List<Dictionary<string, string>> LoadMap(string dangAmbigsFile)
 45 |         {
 46 |             try
 47 |             {
 48 |                 FileInfo dataFile = new FileInfo(dangAmbigsFile);
 49 |                 DateTime fileLastModified = dataFile.LastWriteTime;
 50 |                 bool sameFile = string.Equals(dataFile.FullName, mapFile, StringComparison.OrdinalIgnoreCase);
 51 |                 if (maps == null)
 52 |                 {
 53 |                     maps = new List<Dictionary<string, string>>();
 54 |                 }
 55 |                 else
 56 |                 {
 57 |                     // the cache is only valid for the file it was built from
 58 |                     if (sameFile && fileLastModified <= mapLastModified)
 59 |                     {
 60 |                         return maps; // no need to reload map
 61 |                     }
 62 |                     maps.Clear();
 63 |                 }
 64 |                 mapFile = dataFile.FullName;
 65 |                 mapLastModified = fileLastModified;
 66 | 
 67 |                 for (int i = Processor.PLAIN; i <= Processor.REGEX; i++)
 68 |                 {
 69 |                     maps.Add(new Dictionary<string, string>());
 70 |                 }
 71 | 
 72 |                 // using: the reader is closed even when reading fails part-way
 73 |                 using (StreamReader sr = new StreamReader(dangAmbigsFile, Encoding.UTF8))
 74 |                 {
 75 |                     string str;
 76 |                     while ((str = sr.ReadLine()) != null)
 77 |                     {
 78 |                         // skip empty line or line starts with # or without tab delimiters
 79 |                         string trimmed = str.Trim();
 80 |                         if (trimmed.Length == 0 || trimmed.StartsWith("#") || !str.Contains("\t"))
 81 |                         {
 82 |                             continue;
 83 |                         }
 84 |                         string[] parts = Regex.Replace(str, "\t+", "\t").Split('\t');
 85 |                         int type;
 86 |                         // skip short lines and lines whose type is not a number in the known range
 87 |                         if (parts.Length < 3 || !int.TryParse(parts[0], out type)
 88 |                             || type < Processor.PLAIN || type > Processor.REGEX)
 89 |                         {
 90 |                             continue;
 91 |                         }
 92 |                         maps[type][parts[1]] = parts[2];
 93 |                     }
 94 |                 }
 95 |             }
 96 |             catch (Exception e)
 97 |             {
 98 |                 Console.WriteLine(e.StackTrace);
 99 |             }
100 | 
101 |             return maps;
102 |         }
103 |     }
104 | }
105 | 


--------------------------------------------------------------------------------
/OCRHelper.cs:
--------------------------------------------------------------------------------
 1 | using System.IO;
 2 | using System.Drawing;
 3 | using VietOCR.NET.Utilities;
 4 | using VietOCR.NET.Postprocessing;
 5 | using System.Linq;
 6 | using System;
 7 | 
 8 | namespace VietOCR
 9 | {
10 |     class OCRHelper
11 |     {
12 |         /// <summary>
13 |         /// Performs OCR for bulk/batch and console operations.
14 |         /// </summary>
15 |         /// <param name="imageFile">Image file; an input ending in .pdf is converted to TIFF first</param>
16 |         /// <param name="outputFile">Output file without extension</param>
17 |         /// <param name="langCode">language code</param>
18 |         /// <param name="pageSegMode">page segmentation mode</param>
19 |         /// <param name="outputFormat">comma-separated output formats; text corrections run when the TEXT format is listed</param>
20 |         /// <param name="options">processing options, including which text post-corrections to apply</param>
21 |         public static void PerformOCR(string imageFile, string outputFile, string langCode, string pageSegMode, string outputFormat, ProcessingOptions options)
22 |         {
23 |             DirectoryInfo outputDir = Directory.GetParent(outputFile);
24 |             if (outputDir != null && !outputDir.Exists)
25 |             {
26 |                 outputDir.Create();
27 |             }
28 | 
29 |             OCR<Image> ocrEngine = new OCRImages();
30 |             ocrEngine.PageSegMode = pageSegMode;
31 |             ocrEngine.Language = langCode;
32 |             ocrEngine.OutputFormat = outputFormat;
33 |             ocrEngine.OutputFile = outputFile;
34 |             ocrEngine.ProcessingOptions = options;
35 | 
36 |             string workingTiffFile = null;
37 |             try
38 |             {
39 |                 // convert PDF to TIFF
40 |                 if (imageFile.ToLower().EndsWith(".pdf"))
41 |                 {
42 |                     workingTiffFile = PdfUtilities.ConvertPdf2TiffGS(imageFile);
43 |                     imageFile = workingTiffFile;
44 |                 }
45 | 
46 |                 ocrEngine.ProcessFile(imageFile);
47 | 
48 |                 // post-corrections for text output
49 |                 bool textRequested = outputFormat.Split(',').Contains(Tesseract.RenderedFormat.TEXT.ToString());
50 |                 if (textRequested && (options.PostProcessing || options.CorrectLetterCases || options.RemoveLineBreaks))
51 |                 {
52 |                     PostCorrectTextFile(outputFile + ".txt", langCode, options);
53 |                 }
54 |             }
55 |             finally
56 |             {
57 |                 // remove the working TIFF created for a PDF input
58 |                 if (workingTiffFile != null && File.Exists(workingTiffFile))
59 |                 {
60 |                     File.Delete(workingTiffFile);
61 |                 }
62 |             }
63 |         }
64 | 
65 |         /// <summary>Applies the enabled text corrections to the produced text file, in place.</summary>
66 |         private static void PostCorrectTextFile(string textFile, string langCode, ProcessingOptions options)
67 |         {
68 |             string result = File.ReadAllText(textFile);
69 | 
70 |             // postprocess to correct common OCR errors
71 |             if (options.PostProcessing)
72 |             {
73 |                 result = Processor.PostProcess(result, langCode, options.DangAmbigsPath, options.DangAmbigsEnabled, options.ReplaceHyphens);
74 |             }
75 | 
76 |             // correct letter cases
77 |             if (options.CorrectLetterCases)
78 |             {
79 |                 result = TextUtilities.CorrectLetterCases(result);
80 |             }
81 | 
82 |             // remove line breaks
83 |             if (options.RemoveLineBreaks)
84 |             {
85 |                 result = Net.SourceForge.Vietpad.Utilities.TextUtilities.RemoveLineBreaks(result, options.RemoveHyphens);
86 |             }
87 | 
88 |             File.WriteAllText(textFile, result, new System.Text.UTF8Encoding());
89 |         }
90 |     }
91 | }
92 | 


--------------------------------------------------------------------------------
/GuiWithUILanguage.cs:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Copyright @ 2008 Quan Nguyen
 3 |  * 
 4 |  * Licensed under the Apache License, Version 2.0 (the "License");
 5 |  * you may not use this file except in compliance with the License.
 6 |  * You may obtain a copy of the License at
 7 |  *
 8 |  *  http://www.apache.org/licenses/LICENSE-2.0
 9 |  *
10 |  * Unless required by applicable law or agreed to in writing, software
11 |  * distributed under the License is distributed on an "AS IS" BASIS,
12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 |  * See the License for the specific language governing permissions and
14 |  * limitations under the License.
15 | */
16 | using System;
17 | using System.Collections.Generic;
18 | using System.ComponentModel;
19 | using System.Data;
20 | using System.Drawing;
21 | using System.Text;
22 | using System.Globalization;
23 | //using Vietpad.NET.Controls;
24 | using System.Windows;
25 | using System.Windows.Controls;
26 | 
27 | namespace VietOCR
28 | {
29 |     /// <summary>Adds the UI-language menu and switches the application culture when an item is chosen.</summary>
30 |     public class GuiWithUILanguage : GuiWithInputMethod
31 |     {
32 |         MenuItem miuilChecked; // currently checked UI-language item, if any
33 | 
34 |         public GuiWithUILanguage()
35 |         {
36 |             // Settings UI Language submenu
37 |             RoutedEventHandler eh = new RoutedEventHandler(MenuKeyboardUILangOnClick);
38 | 
39 |             string[] uiLangs = { "ar-SA", "bn-IN", "ca-ES", "cs-CZ", "de-DE", "en-US", "es-ES", "et-EE", "fa-IR", "fi-FI", "fr-FR", "hi-IN", "hu-HU", "it-IT", "ja-JP", "kn-In", "ku-Arab-IQ", "lt-LT", "ne-NP", "nl-NL", "pl-PL", "pt-PT", "ru-RU", "sd-Deva", "sk-SK", "sl-SI", "tr-TR", "vi-VN", "zh-Hans" };
40 |             foreach (string uiLang in uiLangs)
41 |             {
42 |                 CultureInfo ci;
43 |                 try { ci = new CultureInfo(uiLang); }
44 |                 catch (ArgumentException) { continue; } // culture not supported on this system: leave it out of the menu
45 | 
46 |                 MenuItem miuil = new MenuItem();
47 |                 miuil.Tag = ci.Name;
48 |                 // no parent language: use the culture's own names without their "(...)" suffix
49 |                 bool noParent = CultureInfo.InvariantCulture.Equals(ci.Parent);
50 |                 miuil.Header = noParent
51 |                     ? StripParenthesized(ci.EnglishName) + " (" + StripParenthesized(ci.NativeName) + ")"
52 |                     : ci.Parent.DisplayName + " (" + ci.Parent.NativeName + ")";
53 |                 miuil.Click += eh;
54 |                 this.uiLanguageToolStripMenuItem.Items.Add(miuil);
55 |             }
56 |         }
57 | 
58 |         // Returns the text before " (", or the whole name when it contains no parenthesis.
59 |         private static string StripParenthesized(string name)
60 |         {
61 |             int paren = name.IndexOf('(');
62 |             return paren > 0 ? name.Substring(0, paren - 1) : name;
63 |         }
64 | 
65 |         protected override void Window_Loaded(object sender, RoutedEventArgs e)
66 |         {
67 |             base.Window_Loaded(sender, e);
68 | 
69 |             foreach (MenuItem item in this.uiLanguageToolStripMenuItem.Items)
70 |             {
71 |                 if (item.Tag.ToString() == selectedUILanguage)
72 |                 {
73 |                     miuilChecked = item; // Select UI Language last saved
74 |                     miuilChecked.IsChecked = true;
75 |                     break;
76 |                 }
77 |             }
78 |         }
79 | 
80 |         void MenuKeyboardUILangOnClick(object obj, EventArgs ea)
81 |         {
82 |             if (miuilChecked != null)
83 |                 miuilChecked.IsChecked = false;
84 |             miuilChecked = (MenuItem)obj;
85 |             miuilChecked.IsChecked = true;
86 |             if (selectedUILanguage != miuilChecked.Tag.ToString())
87 |             {
88 |                 selectedUILanguage = miuilChecked.Tag.ToString();
89 |                 App.ChangeCulture(new CultureInfo(selectedUILanguage));
90 |             }
91 |         }
92 |     }
93 | }
94 | 


--------------------------------------------------------------------------------
/dict/en_US.aff:
--------------------------------------------------------------------------------
  1 | SET ISO8859-1
  2 | TRY esianrtolcdugmphbyfvkwzESIANRTOLCDUGMPHBYFVKWZ'
  3 | NOSUGGEST !
  4 | 
  5 | # ordinal numbers
  6 | COMPOUNDMIN 1
  7 | # only in compounds: 1th, 2th, 3th
  8 | ONLYINCOMPOUND c
  9 | # compound rules:
 10 | # 1. [0-9]*1[0-9]th (10th, 11th, 12th, 56714th, etc.)
 11 | # 2. [0-9]*[02-9](1st|2nd|3rd|[4-9]th) (21st, 22nd, 123rd, 1234th, etc.)
 12 | COMPOUNDRULE 2
 13 | COMPOUNDRULE n*1t
 14 | COMPOUNDRULE n*mp
 15 | WORDCHARS 0123456789
 16 | 
 17 | PFX A Y 1
 18 | PFX A   0     re         .
 19 | 
 20 | PFX I Y 1
 21 | PFX I   0     in         .
 22 | 
 23 | PFX U Y 1
 24 | PFX U   0     un         .
 25 | 
 26 | PFX C Y 1
 27 | PFX C   0     de          .
 28 | 
 29 | PFX E Y 1
 30 | PFX E   0     dis         .
 31 | 
 32 | PFX F Y 1
 33 | PFX F   0     con         .
 34 | 
 35 | PFX K Y 1
 36 | PFX K   0     pro         .
 37 | 
 38 | SFX V N 2
 39 | SFX V   e     ive        e
 40 | SFX V   0     ive        [^e]
 41 | 
 42 | SFX N Y 3
 43 | SFX N   e     ion        e
 44 | SFX N   y     ication    y 
 45 | SFX N   0     en         [^ey] 
 46 | 
 47 | SFX X Y 3
 48 | SFX X   e     ions       e
 49 | SFX X   y     ications   y
 50 | SFX X   0     ens        [^ey]
 51 | 
 52 | SFX H N 2
 53 | SFX H   y     ieth       y
 54 | SFX H   0     th         [^y] 
 55 | 
 56 | SFX Y Y 1
 57 | SFX Y   0     ly         .
 58 | 
 59 | SFX G Y 2
 60 | SFX G   e     ing        e
 61 | SFX G   0     ing        [^e] 
 62 | 
 63 | SFX J Y 2
 64 | SFX J   e     ings       e
 65 | SFX J   0     ings       [^e]
 66 | 
 67 | SFX D Y 4
 68 | SFX D   0     d          e
 69 | SFX D   y     ied        [^aeiou]y
 70 | SFX D   0     ed         [^ey]
 71 | SFX D   0     ed         [aeiou]y
 72 | 
 73 | SFX T N 4
 74 | SFX T   0     st         e
 75 | SFX T   y     iest       [^aeiou]y
 76 | SFX T   0     est        [aeiou]y
 77 | SFX T   0     est        [^ey]
 78 | 
 79 | SFX R Y 4
 80 | SFX R   0     r          e
 81 | SFX R   y     ier        [^aeiou]y
 82 | SFX R   0     er         [aeiou]y
 83 | SFX R   0     er         [^ey]
 84 | 
 85 | SFX Z Y 4
 86 | SFX Z   0     rs         e
 87 | SFX Z   y     iers       [^aeiou]y
 88 | SFX Z   0     ers        [aeiou]y
 89 | SFX Z   0     ers        [^ey]
 90 | 
 91 | SFX S Y 4
 92 | SFX S   y     ies        [^aeiou]y
 93 | SFX S   0     s          [aeiou]y
 94 | SFX S   0     es         [sxzh]
 95 | SFX S   0     s          [^sxzhy]
 96 | 
 97 | SFX P Y 3
 98 | SFX P   y     iness      [^aeiou]y
 99 | SFX P   0     ness       [aeiou]y
100 | SFX P   0     ness       [^y]
101 | 
102 | SFX M Y 1
103 | SFX M   0     's         .
104 | 
105 | SFX B Y 3
106 | SFX B   0     able       [^aeiou]
107 | SFX B   0     able       ee
108 | SFX B   e     able       [^aeiou]e
109 | 
110 | SFX L Y 1
111 | SFX L   0     ment       .
112 | 
113 | REP 88
114 | REP a ei
115 | REP ei a
116 | REP a ey
117 | REP ey a
118 | REP ai ie
119 | REP ie ai
120 | REP are air
121 | REP are ear
122 | REP are eir
123 | REP air are
124 | REP air ere
125 | REP ere air
126 | REP ere ear
127 | REP ere eir
128 | REP ear are
129 | REP ear air
130 | REP ear ere
131 | REP eir are
132 | REP eir ere
133 | REP ch te
134 | REP te ch
135 | REP ch ti
136 | REP ti ch
137 | REP ch tu
138 | REP tu ch
139 | REP ch s
140 | REP s ch
141 | REP ch k
142 | REP k ch
143 | REP f ph
144 | REP ph f
145 | REP gh f
146 | REP f gh
147 | REP i igh
148 | REP igh i
149 | REP i uy
150 | REP uy i
151 | REP i ee
152 | REP ee i
153 | REP j di
154 | REP di j
155 | REP j gg
156 | REP gg j
157 | REP j ge
158 | REP ge j
159 | REP s ti
160 | REP ti s
161 | REP s ci
162 | REP ci s
163 | REP k cc
164 | REP cc k
165 | REP k qu
166 | REP qu k
167 | REP kw qu
168 | REP o eau
169 | REP eau o
170 | REP o ew
171 | REP ew o
172 | REP oo ew
173 | REP ew oo
174 | REP ew ui
175 | REP ui ew
176 | REP oo ui
177 | REP ui oo
178 | REP ew u
179 | REP u ew
180 | REP oo u
181 | REP u oo
182 | REP u oe
183 | REP oe u
184 | REP u ieu
185 | REP ieu u
186 | REP ue ew
187 | REP ew ue
188 | REP uff ough
189 | REP oo ieu
190 | REP ieu oo
191 | REP ier ear
192 | REP ear ier
193 | REP ear air
194 | REP air ear
195 | REP w qu
196 | REP qu w
197 | REP z ss
198 | REP ss z
199 | REP shun tion
200 | REP shun sion
201 | REP shun cion
202 | 


--------------------------------------------------------------------------------
/Postprocessing/Processor.cs:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * Copyright @ 2008 Quan Nguyen
  3 |  * 
  4 |  * Licensed under the Apache License, Version 2.0 (the "License");
  5 |  * you may not use this file except in compliance with the License.
  6 |  * You may obtain a copy of the License at
  7 |  *
  8 |  *  http://www.apache.org/licenses/LICENSE-2.0
  9 |  *
 10 |  * Unless required by applicable law or agreed to in writing, software
 11 |  * distributed under the License is distributed on an "AS IS" BASIS,
 12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 13 |  * See the License for the specific language governing permissions and
 14 |  * limitations under the License.
 15 | */
 16 | namespace VietOCR.NET.Postprocessing
 17 | {
 18 |     using System;
 19 |     using System.Text;
 20 |     using System.IO;
 21 |     using System.Collections.Generic;
 22 |     using System.Text.RegularExpressions;
 23 | 
 24 |     /// <summary>Static entry points that clean up OCR output text.</summary>
 25 |     public class Processor
 26 |     {
 27 |         public const int PLAIN = 0;  // index of the plain-text rules in the loaded rule list
 28 |         public const int REGEX = 1;  // index of the regex rules in the loaded rule list
 29 | 
 30 |         /// <summary>
 31 |         /// Runs the post-processor that ProcessorFactory creates for the first three characters of
 32 |         /// <paramref name="langCode"/>. Best effort: if anything fails (unknown or too-short code,
 33 |         /// an error inside the processor), the text is returned unchanged.
 34 |         /// </summary>
 35 |         public static string PostProcess(string text, string langCode)
 36 |         {
 37 |             try
 38 |             {
 39 |                 ISO639 language = (ISO639)Enum.Parse(typeof(ISO639), langCode.Substring(0, 3));
 40 |                 return ProcessorFactory.createProcessor(language).PostProcess(text);
 41 |             }
 42 |             catch
 43 |             {
 44 |                 return text;
 45 |             }
 46 |         }
 47 | 
 48 |         /// <summary>
 49 |         /// Full pipeline: optional soft-hyphen replacement, optional DangAmbigs replacements
 50 |         /// (plain rules first, then regex rules), the language post-processor, and finally
 51 |         /// letter-case correction.
 52 |         /// </summary>
 53 |         /// <returns>The corrected text; null or whitespace-only input is returned as is.</returns>
 54 |         /// <exception cref="NotSupportedException">DangAmbigs is enabled but no rules were loaded.</exception>
 55 |         public static string PostProcess(string text, string langCode, string dangAmbigsPath, bool dangAmbigsEnabled, bool replaceHyphens)
 56 |         {
 57 |             // Also covers null, which previously failed with NullReferenceException on Trim().
 58 |             if (string.IsNullOrWhiteSpace(text))
 59 |             {
 60 |                 return text;
 61 |             }
 62 | 
 63 |             if (replaceHyphens)
 64 |             {
 65 |                 text = Net.SourceForge.Vietpad.Utilities.TextUtilities.ReplaceHyphensWithSoftHyphens(text);
 66 |             }
 67 | 
 68 |             // correct using external x.DangAmbigs.txt file first, if enabled
 69 |             if (dangAmbigsEnabled)
 70 |             {
 71 |                 List<Dictionary<string, string>> replaceRules = TextUtilities.LoadMap(Path.Combine(dangAmbigsPath, langCode + ".DangAmbigs.txt"));
 72 |                 if (replaceRules.Count == 0 && langCode.Length > 3)
 73 |                 {
 74 |                     replaceRules = TextUtilities.LoadMap(Path.Combine(dangAmbigsPath, langCode.Substring(0, 3) + ".DangAmbigs.txt")); // fall back on base
 75 |                 }
 76 | 
 77 |                 if (replaceRules.Count == 0)
 78 |                 {
 79 |                     throw new NotSupportedException(langCode);
 80 |                 }
 81 | 
 82 |                 // plain rules are applied in the dictionary's enumeration order
 83 |                 StringBuilder strB = new StringBuilder(text);
 84 |                 foreach (KeyValuePair<string, string> rule in replaceRules[PLAIN])
 85 |                 {
 86 |                     strB.Replace(rule.Key, rule.Value);
 87 |                 }
 88 |                 text = strB.ToString();
 89 | 
 90 |                 foreach (KeyValuePair<string, string> rule in replaceRules[REGEX])
 91 |                 {
 92 |                     text = Regex.Replace(text, rule.Key, rule.Value);
 93 |                 }
 94 |             }
 95 | 
 96 |             // postprocessor, then letter-case correction
 97 |             return TextUtilities.CorrectLetterCases(PostProcess(text, langCode));
 98 |         }
 99 |     }
100 | }


--------------------------------------------------------------------------------
/GuiWithOEM.cs:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * Copyright @ 2017 Quan Nguyen
  3 |  * 
  4 |  * Licensed under the Apache License, Version 2.0 (the "License");
  5 |  * you may not use this file except in compliance with the License.
  6 |  * You may obtain a copy of the License at
  7 |  *
  8 |  *  http://www.apache.org/licenses/LICENSE-2.0
  9 |  *
 10 |  * Unless required by applicable law or agreed to in writing, software
 11 |  * distributed under the License is distributed on an "AS IS" BASIS,
 12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 13 |  * See the License for the specific language governing permissions and
 14 |  * limitations under the License.
 15 | */
 16 | 
 17 | using System;
 18 | using System.Collections.Generic;
 19 | using System.ComponentModel;
 20 | //using Vietpad.NET.Controls;
 21 | using Microsoft.Win32;
 22 | using Tesseract;
 23 | using System.Windows.Controls;
 24 | using System.Windows;
 25 | 
 26 | namespace VietOCR
 27 | {
 28 |     /// <summary>Adds the OCR engine mode (OEM) submenu and keeps the selection in the registry.</summary>
 29 |     public class GuiWithOEM : GuiWithPSM
 30 |     {
 31 |         const string strOEM = "OcrEngineMode"; // registry value name
 32 |         MenuItem oemItemChecked; // item currently checked; null until one is selected
 33 | 
 34 |         /// <summary>Fills the OEM submenu with one item per EngineMode name (kept in its Tag).</summary>
 35 |         public GuiWithOEM()
 36 |         {
 37 |             Dictionary<string, string> oemDict = new Dictionary<string, string>();
 38 |             oemDict.Add("TesseractOnly", "0 - Legacy Engine Only");
 39 |             oemDict.Add("LstmOnly", "1 - LSTM Engine Only");
 40 |             oemDict.Add("TesseractAndLstm", "2 - Legacy & LSTM Engines");
 41 |             oemDict.Add("Default", "3 - Default");
 42 | 
 43 |             RoutedEventHandler eh = new RoutedEventHandler(MenuOEMOnClick);
 44 |             foreach (string mode in Enum.GetNames(typeof(EngineMode)))
 45 |             {
 46 |                 string caption; // a mode with no caption above falls back to its enum name instead of throwing
 47 |                 if (!oemDict.TryGetValue(mode, out caption)) caption = mode;
 48 |                 MenuItem oemItem = new MenuItem();
 49 |                 oemItem.Header = caption;
 50 |                 oemItem.Tag = mode;
 51 |                 oemItem.Click += eh;
 52 |                 this.oemToolStripMenuItem.Items.Add(oemItem);
 53 |             }
 54 |         }
 55 | 
 56 |         /// <summary>Checks the menu item matching the loaded OEM and shows the OEM in the status label.</summary>
 57 |         protected override void Window_Loaded(object sender, RoutedEventArgs e)
 58 |         {
 59 |             base.Window_Loaded(sender, e);
 60 | 
 61 |             foreach (object entry in this.oemToolStripMenuItem.Items)
 62 |             {
 63 |                 MenuItem item = (MenuItem)entry;
 64 |                 if (item.Tag.ToString() != selectedOEM) continue;
 65 |                 oemItemChecked = item; // select OEM last saved
 66 |                 oemItemChecked.IsChecked = true;
 67 |                 break;
 68 |             }
 69 | 
 70 |             this.statusLabelOEMvalue.Content = selectedOEM;
 71 |         }
 72 | 
 73 |         /// <summary>Moves the check mark to the clicked item and makes its Tag the selected OEM.</summary>
 74 |         void MenuOEMOnClick(object obj, EventArgs ea)
 75 |         {
 76 |             if (oemItemChecked != null)
 77 |             {
 78 |                 oemItemChecked.IsChecked = false;
 79 |             }
 80 |             oemItemChecked = (MenuItem)obj;
 81 |             oemItemChecked.IsChecked = true;
 82 |             selectedOEM = oemItemChecked.Tag.ToString();
 83 |             this.statusLabelOEMvalue.Content = selectedOEM;
 84 |         }
 85 | 
 86 |         /// <summary>Reads the saved OEM; anything that is not a defined EngineMode becomes Default.</summary>
 87 |         protected override void LoadRegistryInfo(RegistryKey regkey)
 88 |         {
 89 |             base.LoadRegistryInfo(regkey);
 90 |             string saved = regkey.GetValue(strOEM) as string; // null when missing or not a string value
 91 |             selectedOEM = Enum.GetName(typeof(EngineMode), EngineMode.Default);
 92 |             // Parsing alone accepts numeric text such as "7"; IsDefined rejects values without a name.
 93 |             EngineMode oem;
 94 |             if (saved != null && Enum.TryParse(saved, out oem) && Enum.IsDefined(typeof(EngineMode), oem))
 95 |             {
 96 |                 selectedOEM = oem.ToString(); // the enum name, which is what the menu Tags hold
 97 |             }
 98 |         }
 99 | 
100 |         /// <summary>Writes the selected OEM name to the registry after the base class has saved its values.</summary>
101 |         protected override void SaveRegistryInfo(RegistryKey regkey)
102 |         {
103 |             base.SaveRegistryInfo(regkey);
104 |             regkey.SetValue(strOEM, selectedOEM);
105 |         }
106 |     }
107 | }
108 | 


--------------------------------------------------------------------------------
/ConsoleApp.cs:
--------------------------------------------------------------------------------
  1 | using System;
  2 | using System.Collections.Generic;
  3 | using System.IO;
  4 | using System.Linq;
  5 | 
  6 | namespace VietOCR
  7 | {
  8 |     /// <summary>Command-line front end: parses the arguments and runs OCR on a single image file.</summary>
  9 |     public class ConsoleApp
 10 |     {
 11 |         public static void Main(string[] args)
 12 |         {
 13 |             new ConsoleApp().PerformOCR(args);
 14 |         }
 15 | 
 16 |         /// <summary>
 17 |         /// Parses <c>imagefile outputfile [options]</c> and passes the result to OCRHelper.PerformOCR.
 18 |         /// Usage problems and exceptions raised by the OCR call are written to the console.
 19 |         /// </summary>
 20 |         /// <param name="args">Command-line arguments; the two file names must come first.</param>
 21 |         void PerformOCR(string[] args)
 22 |         {
 23 |             // Test the length before touching args[0]; with no arguments the old order threw
 24 |             // IndexOutOfRangeException instead of printing the usage text.
 25 |             if (args == null || args.Length < 2 || args[0] == "-?" || args[0] == "-help")
 26 |             {
 27 |                 Console.WriteLine("Usage: vietocr imagefile outputfile [-l lang] [--psm pagesegmode] [text|hocr|pdf|pdf_textonly|unlv|box|alto|page|tsv|lstmbox|wordstrbox] [postprocessing] [correctlettercases] [deskew] [removelines] [removelinebreaks]");
 28 |                 return;
 29 |             }
 30 | 
 31 |             FileInfo imageFile = new FileInfo(args[0]);
 32 |             FileInfo outputFile = new FileInfo(args[1]);
 33 | 
 34 |             if (!imageFile.Exists)
 35 |             {
 36 |                 Console.WriteLine("Input file does not exist.");
 37 |                 return;
 38 |             }
 39 | 
 40 |             ProcessingOptions options = new ProcessingOptions();
 41 | 
 42 |             HashSet<string> outputFormatSet = new HashSet<string>();
 43 |             string[] renderers = Enum.GetNames(typeof(Tesseract.RenderedFormat));
 44 |             string curLangCode = "eng"; //default language
 45 |             string psm = "3"; // or alternatively, "Auto"; // 3 - Fully automatic page segmentation, but no OSD (default)
 46 | 
 47 |             // args[0] and args[1] are the file names; scanning them as options would let a file
 48 |             // named e.g. "deskew" or "pdf" switch a setting on, so parsing starts at index 2.
 49 |             for (int i = 2; i < args.Length; i++)
 50 |             {
 51 |                 string arg = args[i];
 52 |                 bool hasValue = (i + 1) < args.Length;
 53 | 
 54 |                 // options that take a value: the value is consumed (++i) so that it is not
 55 |                 // interpreted as an option itself on the next iteration
 56 |                 if ("-l" == arg)
 57 |                 {
 58 |                     if (hasValue)
 59 |                     {
 60 |                         curLangCode = args[++i];
 61 |                     }
 62 |                     continue;
 63 |                 }
 64 | 
 65 |                 if ("--psm" == arg)
 66 |                 {
 67 |                     if (hasValue)
 68 |                     {
 69 |                         psm = args[++i];
 70 |                         short psmval;
 71 |                         // negative numbers used to slip through the "> 13" check
 72 |                         if (!Int16.TryParse(psm, out psmval) || psmval < 0 || psmval > 13)
 73 |                         {
 74 |                             Console.WriteLine("Invalid input value for PSM.");
 75 |                             return;
 76 |                         }
 77 |                     }
 78 |                     continue;
 79 |                 }
 80 | 
 81 |                 // parse output formats; invariant casing keeps the match independent of the
 82 |                 // current culture (Turkish casing rules do not map "i" to "I")
 83 |                 string upper = arg.ToUpperInvariant();
 84 |                 if (renderers.Contains(upper))
 85 |                 {
 86 |                     outputFormatSet.Add(upper);
 87 |                 }
 88 | 
 89 |                 switch (arg)
 90 |                 {
 91 |                     // enable pre-processing
 92 |                     case "deskew": options.Deskew = true; break;
 93 |                     case "removelines": options.RemoveLines = true; break;
 94 |                     // enable post-processing
 95 |                     case "postprocessing": options.PostProcessing = true; break;
 96 |                     case "correctlettercases": options.CorrectLetterCases = true; break;
 97 |                     case "removelinebreaks": options.RemoveLineBreaks = true; break;
 98 |                 }
 99 |             }
100 | 
101 |             if (outputFormatSet.Count == 0)
102 |             {
103 |                 outputFormatSet.Add(Tesseract.RenderedFormat.TEXT.ToString());
104 |             }
105 | 
106 |             string outputFormat = string.Join(",", outputFormatSet);
107 | 
108 |             try
109 |             {
110 |                 OCRHelper.PerformOCR(imageFile.FullName, outputFile.FullName, curLangCode, psm, outputFormat, options);
111 |             }
112 |             catch (Exception e)
113 |             {
114 |                 Console.WriteLine("Error: " + e.Message);
115 |             }
116 |         }
117 |     }
118 | }
119 | 


--------------------------------------------------------------------------------
/Utilities/Watcher.cs:
--------------------------------------------------------------------------------
  1 | using System;
  2 | using System.Collections.Generic;
  3 | using System.Text;
  4 | using System.IO;
  5 | using System.Text.RegularExpressions;
  6 | using System.Threading;
  7 | 
  8 | namespace VietOCR.NET.Utilities
  9 | {
 10 |     /// <summary>
 11 |     /// Monitors a folder for new image files and queues their full paths.
 12 |     /// </summary>
 13 |     public class Watcher
 14 |     {
 15 |         // NOTE(review): FileSystemWatcher raises its events on thread-pool threads by default;
 16 |         // confirm that whoever dequeues synchronizes access to this queue.
 17 |         private Queue<string> queue;
 18 |         private Regex filters = new Regex(@".*\.(tif|tiff|jpg|jpeg|gif|png|bmp|pdf)$", RegexOptions.IgnoreCase);
 19 | 
 20 |         private FileSystemWatcher watcher;
 21 | 
 22 |         /// <summary>Gets or sets the folder being watched.</summary>
 23 |         public string Path
 24 |         {
 25 |             get { return watcher.Path; }
 26 |             set { watcher.Path = value; }
 27 |         }
 28 | 
 29 |         /// <summary>Gets or sets whether the underlying FileSystemWatcher raises events.</summary>
 30 |         public bool Enabled
 31 |         {
 32 |             get { return watcher.EnableRaisingEvents; }
 33 |             set { watcher.EnableRaisingEvents = value; }
 34 |         }
 35 | 
 36 |         /// <summary>Creates the watcher and starts watching right away.</summary>
 37 |         /// <param name="q">Queue that receives the full path of each new matching file.</param>
 38 |         /// <param name="watchFolder">Folder to monitor.</param>
 39 |         public Watcher(Queue<string> q, string watchFolder)
 40 |         {
 41 |             queue = q;
 42 | 
 43 |             // Create a new FileSystemWatcher and set its properties.
 44 |             watcher = new FileSystemWatcher();
 45 |             watcher.Path = watchFolder;
 46 |             /* Watch for changes in LastWrite times, and
 47 |                the renaming of files or directories. */
 48 |             watcher.NotifyFilter = NotifyFilters.LastWrite | NotifyFilters.FileName | NotifyFilters.DirectoryName;
 49 | 
 50 |             // watcher.Filter is left unset since multiple filters are not possible with the
 51 |             // Filter property; the extension check happens in OnChanged via the regex.
 52 | 
 53 |             // Only the Created event is handled.
 54 |             watcher.Created += new FileSystemEventHandler(OnChanged);
 55 | 
 56 |             // Begin watching.
 57 |             watcher.EnableRaisingEvents = true;
 58 |         }
 59 | 
 60 |         // Created handler: waits until a matching new file can be opened, then queues its path.
 61 |         private void OnChanged(object source, FileSystemEventArgs e)
 62 |         {
 63 |             if (e.ChangeType != WatcherChangeTypes.Created || !filters.IsMatch(e.Name))
 64 |             {
 65 |                 return;
 66 |             }
 67 | 
 68 |             // Wait if file is still being written. IsFileLocked also reports true for a file
 69 |             // that no longer exists, so the existence check is what ends the wait when the file
 70 |             // is deleted or moved away meanwhile (previously this loop never finished). It also
 71 |             // skips directories, for which the open attempt would throw instead.
 72 |             FileInfo fileInfo = new FileInfo(e.FullPath);
 73 |             while (true)
 74 |             {
 75 |                 if (!File.Exists(e.FullPath)) return;
 76 |                 if (!IsFileLocked(fileInfo)) break;
 77 |                 Thread.Sleep(1000);
 78 |             }
 79 | 
 80 |             Console.WriteLine("New file: " + e.FullPath);
 81 |             queue.Enqueue(e.FullPath);
 82 |         }
 83 | 
 84 |         private void OnRenamed(object source, RenamedEventArgs e)
 85 |         {
 86 |             // Specify what is done when a file is renamed.
 87 |             Console.WriteLine("File: {0} renamed to {1}", e.OldFullPath, e.FullPath);
 88 |         }
 89 | 
 90 |         /// <summary>
 91 |         /// Check if file is locked as in being used or written by another process.
 92 |         /// https://stackoverflow.com/questions/876473/is-there-a-way-to-check-if-a-file-is-in-use/
 93 |         /// </summary>
 94 |         /// <param name="file">File to probe.</param>
 95 |         /// <returns>true if opening the file exclusively raised an IOException; otherwise false.</returns>
 96 |         protected virtual bool IsFileLocked(FileInfo file)
 97 |         {
 98 |             try
 99 |             {
100 |                 using (file.Open(FileMode.Open, FileAccess.Read, FileShare.None)) { }
101 |                 return false; // file is not locked
102 |             }
103 |             catch (IOException)
104 |             {
105 |                 // unavailable: still being written to, being processed by another thread,
106 |                 // or does not exist (has already been processed)
107 |                 return true;
108 |             }
109 |         }
110 |     }
111 | }


--------------------------------------------------------------------------------
/BulkDialog.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.BulkDialog"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         xmlns:resx="clr-namespace:VietOCR"
 8 |         mc:Ignorable="d"
 9 |         Title="{x:Static resx:BulkDialog.this_Title}" Height="200" Width="380" Loaded="Window_Loaded" ResizeMode="NoResize" WindowStartupLocation="CenterOwner"> <!-- Fixed-size dialog centered on its owner; the resx: x:Static references read static members of VietOCR.BulkDialog. -->
10 |     <Grid Margin="10,10,10,10"> <!-- 4 rows x 3 columns; rows 0 and 1 hold label | read-only text box | browse button -->
11 |         <Grid.RowDefinitions>
12 |             <RowDefinition Height="5*"/>
13 |             <RowDefinition Height="5*"/>
14 |             <RowDefinition Height="5*"/>
15 |             <RowDefinition Height="7*"/>
16 |         </Grid.RowDefinitions>
17 |         <Grid.ColumnDefinitions>
18 |             <ColumnDefinition Width="120*"/>
19 |             <ColumnDefinition Width="210*"/>
20 |             <ColumnDefinition Width="40*"/>
21 |         </Grid.ColumnDefinitions>
22 |         <Label x:Name="labelInput" Content="{x:Static resx:BulkDialog.labelInput_Text}" Target="{Binding ElementName=textBoxInput}" HorizontalAlignment="Left"  VerticalAlignment="Center" Grid.ColumnSpan="2"/> <!-- unlike labelOutput, this label spans columns 0 and 1 -->
23 |         <Label x:Name="labelOutput" Content="{x:Static resx:BulkDialog.labelOutput_Text}" Target="{Binding ElementName=textBoxOutput}" HorizontalAlignment="Left"  VerticalAlignment="Center" Grid.Row="1"/>
24 |         <TextBox x:Name="textBoxInput" HorizontalAlignment="Stretch"   VerticalAlignment="Center" VerticalContentAlignment="Center" Height="23" IsReadOnly="True" Grid.Column="1"/>
25 |         <TextBox x:Name="textBoxOutput" HorizontalAlignment="Stretch"  VerticalAlignment="Center" VerticalContentAlignment="Center" Height="23" IsReadOnly="True" Grid.Column="1" Grid.Row="1"/>
26 |         <Button x:Name="btnInput" Content="..." HorizontalAlignment="Center" VerticalAlignment="Center" Width="25" Click="btnInput_Click" ToolTip="{x:Static resx:BulkDialog.btnInput_ToolTip}" Grid.Column="2"/>
27 |         <Button x:Name="btnOutput" Content="..." HorizontalAlignment="Center" VerticalAlignment="Center" Width="25" Click="btnOutput_Click" ToolTip="{x:Static resx:BulkDialog.btnOutput_ToolTip}" Grid.Column="2" Grid.Row="1"/>
28 |         <Button Style="{StaticResource {x:Static ToolBar.ButtonStyleKey}}" HorizontalAlignment="Left" VerticalAlignment="Top" Name="buttonOutputFormat" ContextMenuService.IsEnabled="False" Grid.Column="1" Grid.Row="2" Click="buttonOutputFormat_Click"  > <!-- ContextMenuService is disabled on this button; presumably buttonOutputFormat_Click opens menuOutputFormat itself (confirm in code-behind) -->
29 |             <Button.Content>
30 |                 <DockPanel FlowDirection="LeftToRight" >
31 |                     <Label x:Name="labelOutputFormat" Content="{x:Static resx:BulkDialog.labelOutputFormat_Text}" />
32 |                     <Path x:Name="BtnArrowDown" Margin="4" VerticalAlignment="Center" Width="10" Fill="Black" Stretch="Uniform" HorizontalAlignment="Right" Data="F1 M 301.14,-189.041L 311.57,-189.041L 306.355,-182.942L 301.14,-189.041 Z "/> <!-- down arrow, visible initially -->
33 |                     <Path x:Name="BtnArrowUp" Visibility="Collapsed" Margin="4" VerticalAlignment="Center" Width="10" Fill="Black" Stretch="Uniform" HorizontalAlignment="Right" Data="F1 M 301.14,189.041L 311.57,189.041L 306.355,182.942L 301.14,189.041 Z "/> <!-- up arrow, collapsed initially; presumably swapped with the down arrow by ContextMenu_Opened / ContextMenu_Closed (confirm) -->
34 |                 </DockPanel>
35 |             </Button.Content>
36 |             <Button.ContextMenu>
37 |                 <ContextMenu x:Name="menuOutputFormat" Opened="ContextMenu_Opened" Closed="ContextMenu_Closed" /> <!-- no items declared here; presumably filled from code-behind (confirm) -->
38 |             </Button.ContextMenu>
39 |         </Button>
40 | 
41 |         <StackPanel Orientation="Horizontal" HorizontalAlignment="Right" Grid.Column="1" Grid.ColumnSpan="2" Grid.Row="3" >
42 |             <StackPanel.Resources>
43 |                 <Style TargetType="{x:Type Button}"> <!-- implicit style: applies to every Button inside this StackPanel -->
44 |                     <Setter Property="Margin" Value="5,0,10,0"/>
45 |                 </Style>
46 |             </StackPanel.Resources>
47 |             <Button x:Name="buttonRun" Content="{x:Static resx:BulkDialog.buttonRun_Text}" VerticalAlignment="Center" Width="70"  Click="buttonRun_Click" IsDefault="True" /> <!-- IsDefault: activated by Enter -->
48 |             <Button x:Name="buttonCancel" Content="{x:Static resx:BulkDialog.buttonCancel_Text}" VerticalAlignment="Center" Width="70" IsCancel="True" /> <!-- IsCancel: activated by Esc -->
49 |         </StackPanel>
50 |         <Button x:Name="buttonOptions" BorderThickness="0" BorderBrush="Transparent" Background="Transparent" HorizontalAlignment="Left" Margin="6,10,0,0" Grid.Row="3" VerticalAlignment="Top" Height="auto" Width="auto" Click="buttonOptions_Click"> <!-- borderless icon button in row 3, column 0 -->
51 |             <Image Source="Icons/fatcow/tools.png" Height="16" Width="16"></Image>
52 |         </Button>
53 |     </Grid>
54 | </Window>
55 | 


--------------------------------------------------------------------------------
/SplitPdfDialog.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.SplitPdfDialog"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         xmlns:resx="clr-namespace:VietOCR"
 8 |         mc:Ignorable="d"
 9 |         Title="{x:Static resx:SplitPdfDialog.this_Title}" Height="220" Width="360" ResizeMode="NoResize" WindowStartupLocation="CenterOwner"> <!-- Fixed-size dialog centered on its owner; the resx: x:Static references read static members of VietOCR.SplitPdfDialog. -->
10 |     <Grid Margin="10,10,0,20"> <!-- 3 columns x 5 equal-height rows; rows 0 and 1 hold label | read-only text box | browse button -->
11 |         <Grid.ColumnDefinitions>
12 |             <ColumnDefinition Width="25*"/>
13 |             <ColumnDefinition Width="56*"/>
14 |             <ColumnDefinition Width="12*"/>
15 |         </Grid.ColumnDefinitions>
16 |         <Grid.RowDefinitions>
17 |             <RowDefinition Height="*"/>
18 |             <RowDefinition Height="*"/>
19 |             <RowDefinition Height="*"/>
20 |             <RowDefinition Height="*"/>
21 |             <RowDefinition Height="*"/>
22 |         </Grid.RowDefinitions>
23 |         <Label x:Name="labelInput" Content="{x:Static resx:SplitPdfDialog.labelInput_Text}" Target="{Binding ElementName=textBoxInput}" VerticalAlignment="Center"/>
24 |         <Label x:Name="labelOutput" Content="{x:Static resx:SplitPdfDialog.labelOutput_Text}" Target="{Binding ElementName=textBoxOutput}" VerticalAlignment="Center" Grid.Row="1"/>
25 |         <TextBox x:Name="textBoxInput" Height="24" HorizontalAlignment="Stretch"  IsReadOnly="True" VerticalAlignment="Center"  VerticalContentAlignment="Center" Grid.Column="1"/>
26 |         <TextBox x:Name="textBoxOutput" Height="24" HorizontalAlignment="Stretch"  IsReadOnly="True" VerticalAlignment="Center" VerticalContentAlignment="Center" Grid.Row="1" Grid.Column="1"/>
27 |         <Button x:Name="buttonBrowseInput" Content="..." HorizontalAlignment="Center" VerticalAlignment="Center" Width="25" Click="buttonBrowseInput_Click" ToolTip="{x:Static resx:SplitPdfDialog.buttonBrowseInput_ToolTip}" Grid.Column="2"/>
28 |         <Button x:Name="buttonBrowseOutput" Content="..." HorizontalAlignment="Center" VerticalAlignment="Center" Width="25" Click="buttonBrowseOutput_Click" ToolTip="{x:Static resx:SplitPdfDialog.buttonBrowseOutput_ToolTip}" Grid.Row="1" Grid.Column="2"/>
29 |         <StackPanel Orientation="Horizontal" Grid.Row="2" Grid.Column="0" Grid.ColumnSpan="3" > <!-- row 2: the radioButtonPages option with its From / To boxes -->
30 |             <RadioButton GroupName="Group1" x:Name="radioButtonPages" Content="{x:Static resx:SplitPdfDialog.radioButtonPages_Text}" Margin="8,0,16,0" VerticalAlignment="Center" Checked="radioButtonPages_Checked" /> <!-- shares GroupName "Group1" with radioButtonFiles, so the two are mutually exclusive -->
31 |             <Label x:Name="labelFrom" Content="{x:Static resx:SplitPdfDialog.labelFrom_Text}" Target="{Binding ElementName=textBoxFrom}" HorizontalAlignment="Left" VerticalAlignment="Center"/>
32 |             <TextBox x:Name="textBoxFrom" Height="24" HorizontalAlignment="Left" VerticalAlignment="Center" Width="30" VerticalContentAlignment="Center" />
33 |             <Separator Opacity="0" Width="20" /> <!-- fully transparent, used only as a spacer of width 20 -->
34 |             <Label x:Name="labelTo" Content="{x:Static resx:SplitPdfDialog.labelTo_Text}" Target="{Binding ElementName=textBoxTo}" HorizontalAlignment="Left" VerticalAlignment="Center" />
35 |             <TextBox x:Name="textBoxTo" Height="24" HorizontalAlignment="Left" VerticalAlignment="Center" Width="30" VerticalContentAlignment="Center" />
36 |         </StackPanel>
37 |         <StackPanel Orientation="Horizontal" Grid.Row="3" Grid.Column="0"  Grid.ColumnSpan="3" > <!-- row 3: the radioButtonFiles option with the textBoxNumOfPages box -->
38 |             <RadioButton GroupName="Group1" x:Name="radioButtonFiles" Content="{x:Static resx:SplitPdfDialog.radioButtonFiles_Text}" Margin="8,0,16,0" VerticalAlignment="Center" Checked="radioButtonFiles_Checked" />
39 |             <Label x:Name="labelNumOfPages" Content="{x:Static resx:SplitPdfDialog.labelNumOfPages_Text}" Target="{Binding ElementName=textBoxNumOfPages}" HorizontalAlignment="Left" VerticalAlignment="Center" />
40 |             <TextBox x:Name="textBoxNumOfPages" Height="24" HorizontalAlignment="Left"  VerticalAlignment="Center" Width="30" VerticalContentAlignment="Center" />
41 |         </StackPanel>
42 |         <StackPanel Orientation="Horizontal" Grid.Row="4" Grid.Column="1" Grid.ColumnSpan="2" HorizontalAlignment="Right">
43 |             <Button x:Name="buttonSplit" Content="{x:Static resx:SplitPdfDialog.buttonSplit_Text}" HorizontalAlignment="Left" VerticalAlignment="Bottom" Width="75" IsDefault="True" Click="buttonSplit_Click" /> <!-- IsDefault: activated by Enter -->
44 |             <Button x:Name="buttonCancel" Content="{x:Static resx:SplitPdfDialog.buttonCancel_Text}" HorizontalAlignment="Left" VerticalAlignment="Bottom" Width="75" Margin="10, 0, 20, 0" IsCancel="True" /> <!-- IsCancel: activated by Esc -->
45 |         </StackPanel>
46 |     </Grid>
47 | </Window>
48 | 


--------------------------------------------------------------------------------
/ImageInfoDialog.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.ImageInfoDialog"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         xmlns:resx="clr-namespace:VietOCR"
 8 |         mc:Ignorable="d"
 9 |         Title="{x:Static resx:ImageInfoDialog.this_Title}" Height="246" Width="286" Loaded="Window_Loaded" ResizeMode="NoResize">
10 |     <!-- Non-resizable dialog: a 5-row by 3-column table of read-only image properties, with an OK button aligned to the bottom. All captions come from x:Static resource members. -->
11 |     <Grid>
12 |         <!-- Property table. Column 0 holds the caption, column 1 the read-only value, column 2 a unit selector or a static label. -->
13 |         <Grid HorizontalAlignment="Center" VerticalAlignment="Top" Width="Auto" Margin="0 20">
14 |             <Grid.RowDefinitions>
15 |                 <RowDefinition Height="*"/>
16 |                 <RowDefinition Height="*"/>
17 |                 <RowDefinition Height="*"/>
18 |                 <RowDefinition Height="*"/>
19 |                 <RowDefinition Height="*"/>
20 |             </Grid.RowDefinitions>
21 |             <Grid.ColumnDefinitions>
22 |                 <ColumnDefinition Width="5*"/>
23 |                 <ColumnDefinition Width="3*"/>
24 |                 <ColumnDefinition Width="3*"/>
25 |             </Grid.ColumnDefinitions>
26 | 
27 |             <!-- Rows: 0 = width, 1 = height, 2 = X resolution, 3 = Y resolution, 4 = bit depth. Elements are not declared in row order; Grid.Row and Grid.Column decide placement. -->
28 |             <Label x:Name="labelWidth" Content="{x:Static resx:ImageInfoDialog.labelWidth_Text}" HorizontalAlignment="Left" VerticalAlignment="Center" />
29 |             <TextBox x:Name="textBoxWidth" Grid.Column="1" VerticalContentAlignment="Center" HorizontalAlignment="Left" VerticalAlignment="Center" Width="56" IsReadOnly="True" Height="23"/>
30 |             <Label x:Name="labelHeight" Content="{x:Static resx:ImageInfoDialog.labelHeight_Text}" HorizontalAlignment="Left" VerticalAlignment="Center" Grid.Row="1" />
31 |             <Label x:Name="labelXRes" Content="{x:Static resx:ImageInfoDialog.labelXRes_Text}" HorizontalAlignment="Left" VerticalAlignment="Center" Grid.Row="2" />
32 |             <Label x:Name="labelYRes" Content="{x:Static resx:ImageInfoDialog.labelYRes_Text}" HorizontalAlignment="Left" VerticalAlignment="Center" Grid.Row="3" />
33 |             <TextBox x:Name="textBoxHeight" Grid.Column="1" VerticalContentAlignment="Center" HorizontalAlignment="Left" VerticalAlignment="Center" Width="56" Grid.Row="1" IsReadOnly="True" Height="23"/>
34 |             <TextBox x:Name="textBoxXRes" Grid.Column="1" VerticalContentAlignment="Center" HorizontalAlignment="Left" VerticalAlignment="Center" Width="56" Grid.Row="2" IsReadOnly="True" Height="23" />
35 |             <TextBox x:Name="textBoxYRes" Grid.Column="1" VerticalContentAlignment="Center" HorizontalAlignment="Left" VerticalAlignment="Center" Width="56" Grid.Row="3" IsReadOnly="True" Height="23" />
36 |             <Label x:Name="labelBitDepth" Content="{x:Static resx:ImageInfoDialog.labelBitDepth_Text}" HorizontalAlignment="Left" VerticalAlignment="Center" Grid.Row="4" />
37 |             <TextBox x:Name="textBoxBitDepth" Grid.Column="1" VerticalContentAlignment="Center" HorizontalAlignment="Left" VerticalAlignment="Center" Width="56" Grid.Row="4" IsReadOnly="True" Height="23" />
38 |             <!-- Selectors in the third column of the width and height rows, three resource-supplied items each (presumably measurement units; confirm in the resources). Each raises its own SelectionChanged handler, implemented in the code-behind (not shown here). -->
39 |             <ComboBox x:Name="comboBoxUnitW" Grid.Column="2" Margin="5,0,0,0" Width="60" VerticalAlignment="Center" ToolTip="{x:Static resx:ImageInfoDialog.comboBoxUnitW_ToolTip}" SelectionChanged="comboBoxUnitW_SelectionChanged" >
40 |                 <ComboBoxItem Content="{x:Static resx:ImageInfoDialog.comboBox3_Items}"/>
41 |                 <ComboBoxItem Content="{x:Static resx:ImageInfoDialog.comboBox3_Items1}"/>
42 |                 <ComboBoxItem Content="{x:Static resx:ImageInfoDialog.comboBox3_Items2}"/>
43 |             </ComboBox>
44 |             <ComboBox x:Name="comboBoxUnitH" Grid.Column="2" Margin="5,0,0,0" Width="60" HorizontalAlignment="Stretch" VerticalAlignment="Center" Grid.Row="1" ToolTip="{x:Static resx:ImageInfoDialog.comboBoxUnitH_ToolTip}" SelectionChanged="comboBoxUnitH_SelectionChanged" >
45 |                 <ComboBoxItem Content="{x:Static resx:ImageInfoDialog.comboBox4_Items}"/>
46 |                 <ComboBoxItem Content="{x:Static resx:ImageInfoDialog.comboBox4_Items1}"/>
47 |                 <ComboBoxItem Content="{x:Static resx:ImageInfoDialog.comboBox4_Items2}"/>
48 |             </ComboBox>
49 |             <!-- Static labels in the third column of the X and Y resolution rows; their text comes from resources (presumably the resolution unit; confirm in the resources). -->
50 |             <Label x:Name="label5" Content="{x:Static resx:ImageInfoDialog.label5_Text}" HorizontalAlignment="Left" VerticalAlignment="Center" Grid.Row="2" Grid.Column="2" />
51 |             <Label x:Name="label6" Content="{x:Static resx:ImageInfoDialog.label6_Text}" HorizontalAlignment="Left" VerticalAlignment="Center" Grid.Row="3" Grid.Column="2" />
52 |         </Grid>
53 |         <!-- OK button; buttonOK_Click is implemented in the code-behind (not shown here). -->
54 |         <Button x:Name="buttonOK" Content="{x:Static resx:ImageInfoDialog.buttonOK_Text}" HorizontalAlignment="Center" VerticalAlignment="Bottom" Width="60" Click="buttonOK_Click" Margin="0 20"/>
55 |     </Grid>
56 | </Window>
57 | 


--------------------------------------------------------------------------------
/GuiWithRegistry.cs:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * Copyright @ 2008 Quan Nguyen
  3 |  * 
  4 |  * Licensed under the Apache License, Version 2.0 (the "License");
  5 |  * you may not use this file except in compliance with the License.
  6 |  * You may obtain a copy of the License at
  7 |  *
  8 |  *  http://www.apache.org/licenses/LICENSE-2.0
  9 |  *
 10 |  * Unless required by applicable law or agreed to in writing, software
 11 |  * distributed under the License is distributed on an "AS IS" BASIS,
 12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 13 |  * See the License for the specific language governing permissions and
 14 |  * limitations under the License.
 15 | */
 16 | using System;
 17 | using System.Drawing;
 18 | using Microsoft.Win32;
 19 | using System.Windows;
 20 | 
 21 | namespace VietOCR
 22 | {
 23 |     /// <summary>
 24 |     /// Window layer that saves the window state and restore bounds to the registry
 25 |     /// when the window closes and re-applies them when the window loads. Values are
 26 |     /// kept under HKEY_CURRENT_USER in "Software\VietUnicode\" + strProgName.
 27 |     /// </summary>
 28 |     public class GuiWithRegistry : Gui
 29 |     {
 30 |         const string strWinState = "WindowState";
 31 |         const string strLocationX = "LocationX";
 32 |         const string strLocationY = "LocationY";
 33 |         const string strWidth = "Width";
 34 |         const string strHeight = "Height";
 35 | 
 36 |         protected string strRegKey = "Software\\VietUnicode\\";
 37 | 
 38 |         // Bounds of the window the last time it was seen in the Normal state.
 39 |         Rect restoreBounds;
 40 | 
 41 |         public GuiWithRegistry()
 42 |         {
 43 |             strRegKey += strProgName;
 44 |             InitializeComponent();
 45 |             restoreBounds = this.RestoreBounds;
 46 |         }
 47 | 
 48 |         /// <summary>
 49 |         /// Runs the base handler, then loads the persisted settings (creating the key on first run).
 50 |         /// </summary>
 51 |         protected override void Window_Loaded(object sender, RoutedEventArgs e)
 52 |         {
 53 |             base.Window_Loaded(sender, e);
 54 | 
 55 |             // Load registry information. 'using' closes the key even if loading throws.
 56 |             using (RegistryKey regkey = Registry.CurrentUser.OpenSubKey(strRegKey)
 57 |                 ?? Registry.CurrentUser.CreateSubKey(strRegKey))
 58 |             {
 59 |                 LoadRegistryInfo(regkey);
 60 |             }
 61 |         }
 62 | 
 63 |         /// <summary>
 64 |         /// Saves the settings, then runs the base handler.
 65 |         /// </summary>
 66 |         protected override void Window_Closed(object sender, EventArgs e)
 67 |         {
 68 |             // Save registry information. 'using' closes the key even if saving throws.
 69 |             using (RegistryKey regkey = Registry.CurrentUser.OpenSubKey(strRegKey, true)
 70 |                 ?? Registry.CurrentUser.CreateSubKey(strRegKey))
 71 |             {
 72 |                 SaveRegistryInfo(regkey);
 73 |             }
 74 | 
 75 |             base.Window_Closed(sender, e);
 76 |         }
 77 | 
 78 |         /// <summary>Remembers the bounds whenever the size changes in the Normal state.</summary>
 79 |         protected override void Window_SizeChanged(object sender, SizeChangedEventArgs e)
 80 |         {
 81 |             if (WindowState == WindowState.Normal)
 82 |                 restoreBounds = this.RestoreBounds;
 83 |         }
 84 | 
 85 |         /// <summary>Remembers the bounds whenever the location changes in the Normal state.</summary>
 86 |         protected override void Window_LocationChanged(object sender, EventArgs e)
 87 |         {
 88 |             if (WindowState == WindowState.Normal)
 89 |                 restoreBounds = this.RestoreBounds;
 90 |         }
 91 | 
 92 |         /// <summary>
 93 |         /// Lets the base class save its values, then writes the window state and restore bounds.
 94 |         /// </summary>
 95 |         protected override void SaveRegistryInfo(RegistryKey regkey)
 96 |         {
 97 |             base.SaveRegistryInfo(regkey);
 98 | 
 99 |             // Never persist Minimized, or the next launch would start minimized.
100 |             WindowState stateToSave = (WindowState == WindowState.Minimized) ? WindowState.Normal : WindowState;
101 |             regkey.SetValue(strWinState, (int)stateToSave);
102 | 
103 |             // RestoreBounds is Rect.Empty before the window is first shown; keep the stored values then.
104 |             if (!restoreBounds.IsEmpty)
105 |             {
106 |                 regkey.SetValue(strLocationX, FormatDouble(restoreBounds.X));
107 |                 regkey.SetValue(strLocationY, FormatDouble(restoreBounds.Y));
108 |                 regkey.SetValue(strWidth, FormatDouble(restoreBounds.Width));
109 |                 regkey.SetValue(strHeight, FormatDouble(restoreBounds.Height));
110 |             }
111 |         }
112 | 
113 |         /// <summary>
114 |         /// Lets the base class load its values, then restores position, size and window
115 |         /// state, shrinking and shifting the bounds to fit the current work area.
116 |         /// </summary>
117 |         protected override void LoadRegistryInfo(RegistryKey regkey)
118 |         {
119 |             base.LoadRegistryInfo(regkey);
120 | 
121 |             double x = ReadDouble(regkey, strLocationX, 100);
122 |             double y = ReadDouble(regkey, strLocationY, 100);
123 |             // Rect rejects negative sizes, so clamp damaged values to zero.
124 |             double cx = Math.Max(ReadDouble(regkey, strWidth, 324), 0);
125 |             double cy = Math.Max(ReadDouble(regkey, strHeight, 300), 0);
126 | 
127 |             restoreBounds = new Rect(x, y, cx, cy);
128 | 
129 |             // Adjust rectangle for any change in desktop size.
130 |             Rect rectDesk = SystemParameters.WorkArea;
131 | 
132 |             restoreBounds.Width = Math.Min(restoreBounds.Width, rectDesk.Width);
133 |             restoreBounds.Height = Math.Min(restoreBounds.Height, rectDesk.Height);
134 |             restoreBounds.X -= Math.Max(restoreBounds.Right - rectDesk.Right, 0);
135 |             restoreBounds.Y -= Math.Max(restoreBounds.Bottom - rectDesk.Bottom, 0);
136 | 
137 |             // Set form properties.
138 |             this.Left = restoreBounds.Left;
139 |             this.Top = restoreBounds.Top;
140 |             this.Width = restoreBounds.Width;
141 |             this.Height = restoreBounds.Height;
142 | 
143 |             WindowState = ReadWindowState(regkey);
144 |         }
145 | 
146 |         // Formats a double culture-invariantly so a later regional-settings change cannot break parsing.
147 |         static string FormatDouble(double value)
148 |         {
149 |             return value.ToString("R", System.Globalization.CultureInfo.InvariantCulture);
150 |         }
151 | 
152 |         // Reads a numeric value, trying the invariant format first and then the current culture
153 |         // (the format written by earlier versions). Missing, unparsable or non-finite values
154 |         // yield the fallback instead of an exception during startup.
155 |         static double ReadDouble(RegistryKey regkey, string name, double fallback)
156 |         {
157 |             object raw = regkey.GetValue(name);
158 |             if (raw == null)
159 |             {
160 |                 return fallback;
161 |             }
162 | 
163 |             string text = Convert.ToString(raw, System.Globalization.CultureInfo.InvariantCulture);
164 |             double value;
165 |             bool parsed =
166 |                 double.TryParse(text, System.Globalization.NumberStyles.Float, System.Globalization.CultureInfo.InvariantCulture, out value) ||
167 |                 double.TryParse(text, System.Globalization.NumberStyles.Float, System.Globalization.CultureInfo.CurrentCulture, out value);
168 | 
169 |             if (!parsed || double.IsNaN(value) || double.IsInfinity(value))
170 |             {
171 |                 return fallback;
172 |             }
173 |             return value;
174 |         }
175 | 
176 |         // Reads the saved window state. Anything that is not a defined WindowState value,
177 |         // and a stored Minimized from earlier versions, is treated as Normal.
178 |         static WindowState ReadWindowState(RegistryKey regkey)
179 |         {
180 |             object raw = regkey.GetValue(strWinState, 0);
181 |             if (raw is int && Enum.IsDefined(typeof(WindowState), (int)raw))
182 |             {
183 |                 WindowState saved = (WindowState)(int)raw;
184 |                 return saved == WindowState.Minimized ? WindowState.Normal : saved;
185 |             }
186 |             return WindowState.Normal;
187 |         }
188 |     }
189 | }
190 | 
191 | 


--------------------------------------------------------------------------------
/GuiWithBatch.cs:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * Copyright @ 2012 Quan Nguyen
  3 |  * 
  4 |  * Licensed under the Apache License, Version 2.0 (the "License");
  5 |  * you may not use this file except in compliance with the License.
  6 |  * You may obtain a copy of the License at
  7 |  *
  8 |  *  http://www.apache.org/licenses/LICENSE-2.0
  9 |  *
 10 |  * Unless required by applicable law or agreed to in writing, software
 11 |  * distributed under the License is distributed on an "AS IS" BASIS,
 12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 13 |  * See the License for the specific language governing permissions and
 14 |  * limitations under the License.
 15 | */
 16 | using System;
 17 | using System.Collections.Generic;
 18 | using System.ComponentModel;
 19 | using System.Data;
 20 | using System.Drawing;
 21 | using System.Text;
 22 | using VietOCR.NET.Utilities;
 23 | using System.Threading;
 24 | using System.IO;
 25 | using VietOCR.NET.Postprocessing;
 26 | using System.Globalization;
 27 | using System.Windows;
 28 | using System.Windows.Threading;
 29 | using VietOCR.NET;
 30 | 
 31 | namespace VietOCR
 32 | {
 33 |     /// <summary>
 34 |     /// Window layer that adds watch-folder batch OCR. A dispatcher timer polls a queue of
 35 |     /// file paths (the queue is shared with a Watcher built on the watch folder), and each
 36 |     /// queued file is processed on its own worker thread; messages go to a status window.
 37 |     /// </summary>
 38 |     public class GuiWithBatch : GuiWithSettings
 39 |     {
 40 |         // Period between queue polls. TimeSpan(long) counts 100-nanosecond ticks, so the
 41 |         // previous "new TimeSpan(10000)" produced a 1 ms timer.
 42 |         // NOTE(review): 10000 ms is assumed to be the intended period - confirm.
 43 |         private static readonly TimeSpan PollInterval = TimeSpan.FromMilliseconds(10000);
 44 | 
 45 |         private Queue<string> queue;
 46 |         private Watcher watcher;
 47 |         private DispatcherTimer aTimer;
 48 |         private StatusForm statusForm;
 49 | 
 50 |         delegate void UpdateStatusEvent(string message);
 51 | 
 52 |         public GuiWithBatch()
 53 |         {
 54 |             statusForm = new StatusForm();
 55 |             statusForm.Title = Properties.Resources.BatchProcessStatus;
 56 |         }
 57 | 
 58 |         /// <summary>
 59 |         /// Runs the base handler, then creates the queue, the watcher and the polling timer.
 60 |         /// </summary>
 61 |         protected override void Window_Loaded(object sender, RoutedEventArgs e)
 62 |         {
 63 |             base.Window_Loaded(sender, e);
 64 | 
 65 |             queue = new Queue<string>();
 66 |             watcher = new Watcher(queue, watchFolder);
 67 |             watcher.Enabled = watchEnabled;
 68 | 
 69 |             aTimer = new DispatcherTimer();
 70 |             aTimer.Interval = PollInterval;
 71 |             aTimer.Tick += new EventHandler(OnTimedEvent);
 72 |             if (watchEnabled)
 73 |             {
 74 |                 aTimer.Start();
 75 |             }
 76 |         }
 77 | 
 78 |         // Timer tick: when files are waiting, shows (or un-minimizes) the status window and
 79 |         // starts one worker thread, which takes a single file off the queue.
 80 |         private void OnTimedEvent(Object sender, EventArgs e)
 81 |         {
 82 |             if (queue.Count > 0)
 83 |             {
 84 |                 if (!this.statusForm.IsVisible)
 85 |                 {
 86 |                     this.statusForm.Show();
 87 |                 }
 88 |                 else if (this.statusForm.WindowState == WindowState.Minimized)
 89 |                 {
 90 |                     this.statusForm.WindowState = WindowState.Normal;
 91 |                 }
 92 | 
 93 |                 Thread t = new Thread(new ThreadStart(AutoOCR));
 94 |                 t.Start();
 95 |             }
 96 |         }
 97 | 
 98 |         // Worker-thread body: dequeues one file, reports its name, and runs OCR on it.
 99 |         private void AutoOCR()
100 |         {
101 |             FileInfo imageFile;
102 |             try
103 |             {
104 |                 imageFile = new FileInfo(queue.Dequeue());
105 |                 if (!imageFile.Exists)
106 |                 {
107 |                     return;
108 |                 }
109 |             }
110 |             catch
111 |             {
112 |                 // Best effort: an empty queue or an unusable path just ends this run.
113 |                 return;
114 |             }
115 | 
116 |             ReportStatus(imageFile.FullName);
117 | 
118 |             if (curLangCode == null)
119 |             {
120 |                 UseSelectedUICulture();
121 |                 ReportStatus("\t** " + Properties.Resources.selectLanguage + " **");
122 |                 //queue.Clear();
123 |                 return;
124 |             }
125 | 
126 |             try
127 |             {
128 |                 OCRHelper.PerformOCR(imageFile.FullName, Path.Combine(outputFolder, imageFile.Name), curLangCode, selectedPSM, outputFormat, options);
129 |             }
130 |             catch
131 |             {
132 |                 UseSelectedUICulture();
133 |                 ReportStatus("\t** " + Properties.Resources.Cannotprocess + imageFile.Name + " **");
134 |             }
135 |         }
136 | 
137 |         // Sets the current thread's UI culture to the selected language before a resource
138 |         // string is read. An unusable language name leaves the thread's culture unchanged.
139 |         private void UseSelectedUICulture()
140 |         {
141 |             try
142 |             {
143 |                 Thread.CurrentThread.CurrentUICulture = new CultureInfo(selectedUILanguage);
144 |             }
145 |             catch (ArgumentException)
146 |             {
147 |                 // Covers a null name and an unknown culture; the message is still reported.
148 |             }
149 |         }
150 | 
151 |         // Queues WorkerUpdate on this window's dispatcher with the given message.
152 |         private void ReportStatus(string message)
153 |         {
154 |             Dispatcher.BeginInvoke(new Action<string>(WorkerUpdate), DispatcherPriority.Normal, message);
155 |         }
156 | 
157 |         // Appends one line to the status window's text box.
158 |         void WorkerUpdate(string message)
159 |         {
160 |             this.statusForm.TextBox.AppendText(message + Environment.NewLine);
161 |         }
162 | 
163 |         /// <summary>
164 |         /// Applies the current watch folder and enabled flag to the watcher and the timer.
165 |         /// </summary>
166 |         protected override void updateWatch()
167 |         {
168 |             // Nothing to update until Window_Loaded has created the watcher and timer;
169 |             // Window_Loaded reads the same settings when it does.
170 |             if (watcher == null || aTimer == null)
171 |             {
172 |                 return;
173 |             }
174 | 
175 |             watcher.Path = watchFolder;
176 |             watcher.Enabled = watchEnabled;
177 |             if (watchEnabled)
178 |             {
179 |                 aTimer.Start();
180 |             }
181 |             else
182 |             {
183 |                 aTimer.Stop();
184 |             }
185 |         }
186 |     }
187 | }
188 | 


--------------------------------------------------------------------------------
/Postprocessing/ViePP.cs:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Copyright @ 2008 Quan Nguyen
 3 |  * 
 4 |  * Licensed under the Apache License, Version 2.0 (the "License");
 5 |  * you may not use this file except in compliance with the License.
 6 |  * You may obtain a copy of the License at
 7 |  *
 8 |  *  http://www.apache.org/licenses/LICENSE-2.0
 9 |  *
10 |  * Unless required by applicable law or agreed to in writing, software
11 |  * distributed under the License is distributed on an "AS IS" BASIS,
12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 |  * See the License for the specific language governing permissions and
14 |  * limitations under the License.
15 | */
16 | namespace VietOCR.NET.Postprocessing
17 | {
18 |     using System;
19 |     using System.Text;
20 |     using System.Text.RegularExpressions;
21 | 
22 |     /// <summary>
23 |     /// Post-processor for Vietnamese text: applies a fixed list of regex rewrites to canonically decomposed text.
24 |     /// </summary>
25 |     public class ViePP : IPostProcessor
26 |     {
27 |         const string TONE = "[\u0300\u0309\u0303\u0301\u0323]?"; // `?~'.
28 |         const string DOT_BELOW = "\u0323?"; // .
29 |         const string MARK = "[\u0306\u0302\u031B]?"; // (^+
30 |         const string VOWEL = "[aeiouy]";
31 | 
32 |         // Ordered rewrite rules as { pattern, replacement } pairs, applied top to bottom to
33 |         // NFD-decomposed text; each rule sees the output of the rule before it.
34 |         // Plain word-level substitutions are kept in the external vie.DangAmbigs.txt,
35 |         // which also gives users more control over the choice of word corrections.
36 |         static readonly string[,] Rules =
37 |         {
38 |             { "(?i)(?<![q])(u)(?=o\u031B" + TONE + "\\p{L})", "$1\u031B" }, // uo+n to u+o+n
39 |             { "(?i)(?<=u\u031B)(o)(?=" + TONE + "\\p{L})", "$1\u031B" }, // u+on to u+o+n
40 |             { "(?i)(i)" + TONE + "(?=[eioy])", "$1" }, // remove mark on i followed by certain vowels
41 |             { "(?i)(?<=gi)" + TONE + "(?=[aeiouy])", "" }, // remove mark on i preceded by g and followed by any vowel
42 |             // It seems to be a bug with .NET: it should be \\b, not \\B,
43 |             // unless combining diacritical characters are not considered as words by .NET.
44 |             { "(?i)(?<=[^q]" + VOWEL + "\\p{IsCombiningDiacriticalMarks}{0,2})(i)" + TONE + "\\B", "$1" }, // remove mark on i preceded by vowels w/ or w/o diacritics
45 |             { "(?i)(?<=[aeo]\u0302)['\u2018\u2019]", "\u0301" }, // ^right-single-quote to ^acute
46 |             { "(?i)\u2018([aeo]\u0302)(?!\\p{IsCombiningDiacriticalMarks})", "$1\u0300" }, // left-single-quote+a^ to a^grave
47 |             { "(?i)(?<=[aeo]\u0302)h", "\u0301n" }, // a^+h to a^acute+n
48 |             { "(?i)(?<=[uo]" + TONE + ")['\u2018]", "\u031B" }, // u'+left-single-quote) to u+'
49 |             { "(?i)(?<=" + VOWEL + "\\p{IsCombiningDiacriticalMarks}{0,2})l\\b", "t" }, // vowel+diacritics+l to vowel+diacritics+t
50 |             { "(?i)(?<=" + VOWEL + "\\p{IsCombiningDiacriticalMarks}{0,2})ll\\b", "u" }, // vowel+diacritics+ll to vowel+diacritics+u
51 |             { "\\B\\$(?="+ VOWEL + ")", "S" } // replace leading $ followed by vowel with S
52 |         };
53 | 
54 |         /// <summary>
55 |         /// Decomposes the text to form D, runs every rule in order, and returns the result in the default (form C) normalization.
56 |         /// </summary>
57 |         /// <param name="text">Text to correct.</param>
58 |         /// <returns>The rewritten text, normalized to form C.</returns>
59 |         public string PostProcess(string text)
60 |         {
61 |             string working = text.Normalize(NormalizationForm.FormD);
62 | 
63 |             for (int i = 0; i < Rules.GetLength(0); i++)
64 |             {
65 |                 working = Regex.Replace(working, Rules[i, 0], Rules[i, 1]);
66 |             }
67 | 
68 |             return working.Normalize();
69 |         }
70 |     }
71 | }


--------------------------------------------------------------------------------
/Controls/RedUnderlineAdorner.cs:
--------------------------------------------------------------------------------
  1 | /// Adapted from https://github.com/lsd1991/SpellTextBox/blob/master/SpellTextBox/RedUnderlineAdorner.cs
  2 | 
  3 | using System;
  4 | using System.Windows;
  5 | using System.Windows.Controls;
  6 | using System.Windows.Documents;
  7 | using System.Windows.Media;
  8 | using System.Windows.Threading;
  9 | using System.Collections.ObjectModel;
 10 | 
 11 | namespace VietOCR.Controls
 12 | {
 13 |     /// <summary>
 14 |     /// Adorner that underlines the character ranges reported by a SpellCheckHelper
 15 |     /// with a red zigzag, redrawing when the text box scrolls or its text changes.
 16 |     /// </summary>
 17 |     public class RedUnderlineAdorner : Adorner, IDisposable
 18 |     {
 19 |         // Largest vertical gap between a word's two ends that still counts as a single line.
 20 |         const double SameLineTolerance = 8;
 21 | 
 22 |         ScrollChangedEventHandler scrollChangedEventHandler;
 23 |         TextChangedEventHandler textChangedEventHandler;
 24 | 
 25 |         TextBox textbox;
 26 |         SpellCheckHelper mySpeller;
 27 |         Pen pen = CreateErrorPen();
 28 | 
 29 |         public RedUnderlineAdorner(TextBox textbox, SpellCheckHelper mySpeller) : base(textbox)
 30 |         {
 31 |             this.textbox = textbox;
 32 |             this.mySpeller = mySpeller;
 33 | 
 34 |             scrollChangedEventHandler = new ScrollChangedEventHandler(
 35 |                 delegate
 36 |                 {
 37 |                     SignalInvalidate();
 38 |                 });
 39 | 
 40 |             textChangedEventHandler = new TextChangedEventHandler(
 41 |                 delegate
 42 |                 {
 43 |                     mySpeller.SpellCheck();
 44 |                     SignalInvalidate();
 45 |                 });
 46 | 
 47 |             textbox.AddHandler(ScrollViewer.ScrollChangedEvent, scrollChangedEventHandler);
 48 |             textbox.TextChanged += textChangedEventHandler;
 49 |         }
 50 | 
 51 |         /// <summary>
 52 |         /// Detaches the scroll and text-changed handlers from the adorned text box.
 53 |         /// </summary>
 54 |         public void Dispose()
 55 |         {
 56 |             if (textbox != null)
 57 |             {
 58 |                 textbox.RemoveHandler(ScrollViewer.ScrollChangedEvent, scrollChangedEventHandler);
 59 |                 textbox.TextChanged -= textChangedEventHandler;
 60 |             }
 61 |         }
 62 | 
 63 |         // Queues InvalidateVisual on the text box's dispatcher at Background priority.
 64 |         void SignalInvalidate()
 65 |         {
 66 |             textbox.Dispatcher.BeginInvoke(DispatcherPriority.Background, (Action)InvalidateVisual);
 67 |         }
 68 | 
 69 |         /// <summary>
 70 |         /// Draws one underline per spelling-error range whose two ends lie inside the
 71 |         /// adorned element and on the same line.
 72 |         /// </summary>
 73 |         protected override void OnRender(DrawingContext drawingContext)
 74 |         {
 75 |             if (textbox == null)
 76 |             {
 77 |                 return;
 78 |             }
 79 | 
 80 |             ObservableCollection<System.Drawing.CharacterRange> errorRanges = mySpeller.GetSpellingErrorRanges;
 81 |             if (errorRanges == null)
 82 |             {
 83 |                 return;
 84 |             }
 85 | 
 86 |             // Loop invariants. The bounds rectangle is anchored at (0,0), so character
 87 |             // rectangles can be tested against it without applying any offset.
 88 |             Rect rectangleBounds = new Rect(this.AdornedElement.DesiredSize);
 89 |             int textLength = textbox.Text.Length;
 90 | 
 91 |             foreach (System.Drawing.CharacterRange mWord in errorRanges)
 92 |             {
 93 |                 // A range may not match the current text; GetRectFromCharacterIndex
 94 |                 // throws for an index past the end, so skip or clamp such ranges.
 95 |                 if (mWord.First < 0 || mWord.Length <= 0 || mWord.First >= textLength)
 96 |                 {
 97 |                     continue;
 98 |                 }
 99 | 
100 |                 int endIndex = Math.Min(mWord.First + mWord.Length, textLength);
101 | 
102 |                 Rect startRect = textbox.GetRectFromCharacterIndex(mWord.First);
103 |                 Rect endRect = textbox.GetRectFromCharacterIndex(endIndex);
104 | 
105 |                 // Rect.Empty means no bounding rectangle could be determined; nothing to draw.
106 |                 if (startRect.IsEmpty || endRect.IsEmpty)
107 |                 {
108 |                     continue;
109 |                 }
110 | 
111 |                 if (rectangleBounds.Contains(startRect) && rectangleBounds.Contains(endRect))
112 |                 {
113 |                     // don't draw for word that spans multiple lines
114 |                     if (Math.Abs(startRect.BottomLeft.Y - endRect.BottomRight.Y) < SameLineTolerance)
115 |                     {
116 |                         drawingContext.DrawLine(pen, startRect.BottomLeft, endRect.BottomRight);
117 |                     }
118 |                 }
119 |             }
120 |         }
121 | 
122 |         // Builds the frozen pen used for underlines: a tiled red zigzag drawing brush.
123 |         private static Pen CreateErrorPen()
124 |         {
125 |             double size = 4.0;
126 | 
127 |             var geometry = new StreamGeometry();
128 |             using (var context = geometry.Open())
129 |             {
130 |                 context.BeginFigure(new Point(0.0, 0.0), false, false);
131 |                 context.PolyLineTo(new[] {
132 |                     new Point(size * 0.25, size * 0.25),
133 |                     new Point(size * 0.5, 0.0),
134 |                     new Point(size * 0.75, size * 0.25),
135 |                     new Point(size, 0.0)
136 |                 }, true, true);
137 |             }
138 | 
139 |             var brushPattern = new GeometryDrawing
140 |             {
141 |                 Pen = new Pen(Brushes.Red, 0.2),
142 |                 Geometry = geometry
143 |             };
144 | 
145 |             var brush = new DrawingBrush(brushPattern)
146 |             {
147 |                 TileMode = TileMode.Tile,
148 |                 Viewport = new Rect(0.0, size * 0.33, size * 3.0, size),
149 |                 ViewportUnits = BrushMappingMode.Absolute
150 |             };
151 | 
152 |             var pen = new Pen(brush, size);
153 |             pen.Freeze();
154 | 
155 |             return pen;
156 |         }
157 |     }
158 | }
159 | 


--------------------------------------------------------------------------------
/GuiWithScan.cs:
--------------------------------------------------------------------------------
  1 | using System;
  2 | using System.Collections.Generic;
  3 | using System.ComponentModel;
  4 | using System.Data;
  5 | using System.Drawing;
  6 | using System.Text;
  7 | using System.IO;
  8 | using System.Drawing.Imaging;
  9 | using VietOCR.NET.WIA;
 10 | using System.Windows;
 11 | using System.Windows.Input;
 12 | 
 13 | namespace VietOCR
 14 | {
 15 |     /// <summary>
 16 |     /// Window layer that adds scanning: the scan runs on a BackgroundWorker and the
 17 |     /// scanned image file is opened when the worker finishes.
 18 |     /// </summary>
 19 |     public class GuiWithScan : GuiWithThumbnail
 20 |     {
 21 |         private System.ComponentModel.BackgroundWorker backgroundWorkerScan;
 22 | 
 23 |         public GuiWithScan()
 24 |         {
 25 |             this.backgroundWorkerScan = new System.ComponentModel.BackgroundWorker();
 26 |             // 
 27 |             // backgroundWorkerScan
 28 |             // 
 29 |             this.backgroundWorkerScan.WorkerReportsProgress = true;
 30 |             this.backgroundWorkerScan.WorkerSupportsCancellation = true;
 31 |             this.backgroundWorkerScan.DoWork += new System.ComponentModel.DoWorkEventHandler(this.backgroundWorkerScan_DoWork);
 32 |             this.backgroundWorkerScan.RunWorkerCompleted += new System.ComponentModel.RunWorkerCompletedEventHandler(this.backgroundWorkerScan_RunWorkerCompleted);
 33 | 
 34 |         }
 35 | 
 36 |         // Menu/button handler: resets both scale factors to 1 and starts a scan.
 37 |         protected override void scanToolStripMenuItem_Click(object sender, RoutedEventArgs e)
 38 |         {
 39 |             scaleX = scaleY = 1f;
 40 |             performScan();
 41 |         }
 42 | 
 43 |         /// <summary>
 44 |         /// Access scanner and scan documents via WIA.
 45 |         /// </summary>
 46 |         void performScan()
 47 |         {
 48 |             // RunWorkerAsync throws while a previous scan is still running; ignore the request.
 49 |             if (backgroundWorkerScan.IsBusy)
 50 |             {
 51 |                 return;
 52 |             }
 53 | 
 54 |             try
 55 |             {
 56 |                 this.statusLabel.Content = Properties.Resources.Scanning;
 57 |                 this.Cursor = Cursors.Wait;
 58 | 
 59 |                 this.textBox1.Cursor = Cursors.Wait;
 60 |                 this.buttonScan.IsEnabled = false;
 61 |                 this.scanToolStripMenuItem.IsEnabled = false;
 62 |                 this.toolStripProgressBar1.IsEnabled = true;
 63 |                 this.toolStripProgressBar1.Visibility = Visibility.Visible;
 64 |                 //this.toolStripProgressBar1.Style = ProgressBarStyle.Marquee;
 65 | 
 66 |                 // Start the asynchronous operation.
 67 |                 backgroundWorkerScan.RunWorkerAsync();
 68 |             }
 69 |             catch (Exception ex)
 70 |             {
 71 |                 Console.WriteLine(ex.Message);
 72 | 
 73 |                 // The worker did not start, so RunWorkerCompleted will never undo the busy UI.
 74 |                 this.statusLabel.Content = string.Empty;
 75 |                 hideScanProgress();
 76 |                 releaseScanControls();
 77 |             }
 78 |         }
 79 | 
 80 |         // Disables and hides the progress bar shown while scanning.
 81 |         void hideScanProgress()
 82 |         {
 83 |             this.toolStripProgressBar1.IsEnabled = false;
 84 |             this.toolStripProgressBar1.Visibility = Visibility.Hidden;
 85 |         }
 86 | 
 87 |         // Clears the wait cursors and re-enables the scan button and menu item.
 88 |         void releaseScanControls()
 89 |         {
 90 |             this.Cursor = null;
 91 |             this.textBox1.Cursor = null;
 92 |             this.buttonScan.IsEnabled = true;
 93 |             this.scanToolStripMenuItem.IsEnabled = true;
 94 |         }
 95 | 
 96 |         // DoWork handler: scans to a temporary .png file and returns its path through e.Result.
 97 |         [System.Diagnostics.DebuggerNonUserCodeAttribute()]
 98 |         private void backgroundWorkerScan_DoWork(object sender, DoWorkEventArgs e)
 99 |         {
100 |             using (WiaScannerAdapter adapter = new WiaScannerAdapter())
101 |             {
102 |                 try
103 |                 {
104 |                     // GetTempFileName creates an empty file; remove it and reuse the name with a .png extension.
105 |                     string tempFileName = Path.GetTempFileName();
106 |                     File.Delete(tempFileName);
107 |                     tempFileName = Path.ChangeExtension(tempFileName, ".png");
108 |                     tempFileCollection.AddFile(tempFileName, false);
109 |                     FileInfo imageFile = new FileInfo(tempFileName);
110 |                     if (imageFile.Exists)
111 |                     {
112 |                         imageFile.Delete();
113 |                     }
114 |                     adapter.ScanImage(ImageFormat.Png, imageFile.FullName);
115 |                     e.Result = tempFileName;
116 |                 }
117 |                 catch (WiaOperationException ex)
118 |                 {
119 |                     // The message is the error code with a space inserted before each upper-case
120 |                     // letter; the original exception is kept as InnerException.
121 |                     throw new Exception(System.Text.RegularExpressions.Regex.Replace(ex.ErrorCode.ToString(), "(?=\\p{Lu}+)", " ").Trim() + ".", ex);
122 |                 }
123 |             }
124 |         }
125 | 
126 |         // RunWorkerCompleted handler: reports an error or cancellation, or opens the scanned file, then restores the UI.
127 |         private void backgroundWorkerScan_RunWorkerCompleted(object sender, RunWorkerCompletedEventArgs e)
128 |         {
129 |             hideScanProgress();
130 | 
131 |             // First, handle the case where an exception was thrown.
132 |             if (e.Error != null)
133 |             {
134 |                 this.statusLabel.Content = string.Empty;
135 |                 MessageBox.Show(e.Error.Message, Properties.Resources.ScanningOperation, MessageBoxButton.OK, MessageBoxImage.Error);
136 |             }
137 |             else if (e.Cancelled)
138 |             {
139 |                 // Next, handle the case where the user canceled the operation.
140 |                 // Note that due to a race condition in the DoWork event handler, the Cancelled
141 |                 // flag may not have been set, even though CancelAsync was called.
142 |                 this.statusLabel.Content = "Scanning " + Properties.Resources.canceled;
143 |             }
144 |             else
145 |             {
146 |                 // Finally, handle the case where the operation succeeded.
147 |                 openFile(e.Result.ToString());
148 |                 this.statusLabel.Content = Properties.Resources.Scancompleted;
149 |             }
150 | 
151 |             releaseScanControls();
152 |         }
153 |     }
154 | }
155 | 


--------------------------------------------------------------------------------
/SplitPdfDialog.xaml.cs:
--------------------------------------------------------------------------------
  1 | using Microsoft.Win32;
  2 | using System;
  3 | using System.Collections.Generic;
  4 | using System.Linq;
  5 | using System.Text;
  6 | using System.Text.RegularExpressions;
  7 | using System.Threading.Tasks;
  8 | using System.Windows;
  9 | using System.Windows.Controls;
 10 | using System.Windows.Data;
 11 | using System.Windows.Documents;
 12 | using System.Windows.Input;
 13 | using System.Windows.Media;
 14 | using System.Windows.Media.Imaging;
 15 | using System.Windows.Shapes;
 16 | 
 17 | namespace VietOCR
 18 | {
 19 |     /// <summary>
 20 |     /// Interaction logic for SplitPdfDialog.xaml
 21 |     /// </summary>
 22 |     public partial class SplitPdfDialog : Window
 23 |     {
 24 |         SplitPdfArgs args;
 25 |         string pdfFolder = null;
 26 | 
 27 |         internal SplitPdfArgs Args
 28 |         {
 29 |             get { return args; }
 30 |         }
 31 | 
 32 |         public SplitPdfDialog()
 33 |         {
 34 |             InitializeComponent();
 35 | 
 36 |             disableBoxes(!this.radioButtonPages.IsChecked.Value);
 37 |             this.textBoxNumOfPages.IsEnabled = false;
 38 |             this.textBoxNumOfPages.Text = "20";
 39 |             //this.toolTip1.SetToolTip(this.buttonBrowseInput, Properties.Resources.Browse);
 40 |             //this.toolTip1.SetToolTip(this.buttonBrowseOutput, Properties.Resources.Browse);
 41 |         }
 42 | 
 43 |         private void buttonBrowseInput_Click(object sender, RoutedEventArgs e)
 44 |         {
 45 |             OpenFileDialog dialog = new OpenFileDialog();
 46 |             dialog.Title = Properties.Resources.Open;
 47 |             dialog.InitialDirectory = pdfFolder;
 48 |             dialog.Filter = "PDF (*.pdf)|*.pdf";
 49 |             dialog.RestoreDirectory = true;
 50 | 
 51 |             Nullable<bool> result = dialog.ShowDialog();
 52 | 
 53 |             if (result.HasValue && result.Value)
 54 |             {
 55 |                 this.textBoxInput.Text = dialog.FileName;
 56 |                 pdfFolder = System.IO.Path.GetDirectoryName(dialog.FileName);
 57 |             }
 58 |         }
 59 | 
 60 |         private void buttonBrowseOutput_Click(object sender, RoutedEventArgs e)
 61 |         {
 62 |             SaveFileDialog dialog = new SaveFileDialog();
 63 |             dialog.Title = Properties.Resources.Save;
 64 |             dialog.InitialDirectory = pdfFolder;
 65 |             dialog.Filter = "PDF (*.pdf)|*.pdf";
 66 |             dialog.RestoreDirectory = true;
 67 | 
 68 |             Nullable<bool> result = dialog.ShowDialog();
 69 | 
 70 |             if (result.HasValue && result.Value)
 71 |             {
 72 |                 this.textBoxOutput.Text = dialog.FileName;
 73 | 
 74 |                 if (!this.textBoxOutput.Text.EndsWith(".pdf"))
 75 |                 {
 76 |                     this.textBoxOutput.Text += ".pdf"; // seems not needed
 77 |                 }
 78 |             }
 79 |         }
 80 | 
 81 |         private void buttonSplit_Click(object sender, RoutedEventArgs e)
 82 |         {
 83 |             SplitPdfArgs args = new SplitPdfArgs();
 84 |             args.InputFilename = this.textBoxInput.Text;
 85 |             args.OutputFilename = this.textBoxOutput.Text;
 86 |             args.FromPage = this.textBoxFrom.Text;
 87 |             args.ToPage = this.textBoxTo.Text;
 88 |             args.NumOfPages = this.textBoxNumOfPages.Text;
 89 |             args.Pages = this.radioButtonPages.IsChecked.Value;
 90 | 
 91 |             if (args.InputFilename.Length > 0 && args.OutputFilename.Length > 0 &&
 92 |                 ((this.radioButtonPages.IsChecked.Value && args.FromPage.Length > 0) ||
 93 |                 (this.radioButtonFiles.IsChecked.Value && args.NumOfPages.Length > 0)))
 94 |             {
 95 |                 Regex regexNums = new Regex(@"^\d+$");
 96 | 
 97 |                 if ((this.radioButtonPages.IsChecked.Value && regexNums.IsMatch(args.FromPage) &&
 98 |                     (args.ToPage.Length > 0 ? regexNums.IsMatch(args.ToPage) : true)) ||
 99 |                     (this.radioButtonFiles.IsChecked.Value && regexNums.IsMatch(args.NumOfPages)))
100 |                 {
101 |                     this.args = args;
102 |                     this.DialogResult = true;
103 |                 }
104 |                 else
105 |                 {
106 |                     MessageBox.Show(this, "Input invalid.", "Error", MessageBoxButton.OK, MessageBoxImage.Error);
107 |                 }
108 |             }
109 |             else
110 |             {
111 |                 MessageBox.Show(this, "Input incomplete.", "Error", MessageBoxButton.OK, MessageBoxImage.Error);
112 |             }
113 |         }
114 | 
115 |         void disableBoxes(bool enabled)
116 |         {
117 |             this.textBoxNumOfPages.IsEnabled = enabled;
118 |             this.textBoxFrom.IsEnabled = !enabled;
119 |             this.textBoxTo.IsEnabled = !enabled;
120 |         }
121 | 
122 |         private void radioButtonPages_Checked(object sender, RoutedEventArgs e)
123 |         {
124 |             disableBoxes(false);
125 |         }
126 | 
127 |         private void radioButtonFiles_Checked(object sender, RoutedEventArgs e)
128 |         {
129 |             disableBoxes(true);
130 |         }
131 |     }
132 | }
133 | 


--------------------------------------------------------------------------------
/FindReplaceDialog.xaml.cs:
--------------------------------------------------------------------------------
  1 | // Modified by Quan Nguyen for VietOCR.NET
  2 | // Version: 2.0, 28 September 2018
  3 | // See: http://vietocr.sourceforge.net
  4 | // Change: - Fixed a bug on Search direction, 18 Feb 2003
  5 | // 
  6 | 
  7 | //------------------------------------------------
  8 | // FindReplaceDialog.cs © 2001 by Charles Petzold
  9 | //------------------------------------------------
 10 | 
 11 | using Net.SourceForge.Vietpad.InputMethod;
 12 | using System;
 13 | using System.Windows;
 14 | using System.Windows.Controls;
 15 | 
 16 | namespace VietOCR
 17 | {
 18 |     /// <summary>
 19 |     /// Interaction logic for FindReplaceDialog.xaml
 20 |     /// </summary>
 21 |     public partial class FindReplaceDialog : Window
 22 |     {
 23 |         // Public events
 24 |         public event RoutedEventHandler FindNext;
 25 |         public event RoutedEventHandler Replace;
 26 |         public event RoutedEventHandler ReplaceAll;
 27 |         public event RoutedEventHandler CloseDlg;
 28 | 
 29 |         // Properties
 30 |         public string FindText
 31 |         {
 32 |             set { cbFind.Text = value; }
 33 |             get { return cbFind.Text; }
 34 |         }
 35 |         public string ReplaceText
 36 |         {
 37 |             set { cbReplace.Text = value; }
 38 |             get { return cbReplace.Text; }
 39 |         }
 40 |         public bool MatchCase
 41 |         {
 42 |             set { chkboxMatchCase.IsChecked = value; }
 43 |             get { return chkboxMatchCase.IsChecked.Value; }
 44 |         }
 45 |         public bool? MatchWholeWord
 46 |         {
 47 |             set { chkboxMatchWholeWord.IsChecked = value; }
 48 |             get { return chkboxMatchWholeWord.IsEnabled ? chkboxMatchWholeWord.IsChecked : null; }
 49 |         }
 50 |         public bool MatchDiacritics
 51 |         {
 52 |             set { chkboxMatchDiacritics.IsChecked = value; }
 53 |             get { return chkboxMatchDiacritics.IsChecked.Value; }
 54 |         }
 55 |         public bool MatchRegex
 56 |         {
 57 |             set { this.chkboxMatchRegex.IsChecked = value; }
 58 |             get { return this.chkboxMatchRegex.IsChecked.Value; }
 59 |         }
 60 |         public bool SearchDown
 61 |         {
 62 |             set
 63 |             {
 64 |                 if (value)
 65 |                     radiobtnSearchDown.IsChecked = true;
 66 |                 else
 67 |                     radiobtnSearchUp.IsChecked = true;
 68 |             }
 69 |             get { return radiobtnSearchDown.IsChecked.Value; }
 70 |         }
 71 | 
 72 |         public FindReplaceDialog()
 73 |         {
 74 |             InitializeComponent();
 75 |         }
 76 | 
 77 |         private void btnFindNext_Click(object sender, RoutedEventArgs e)
 78 |         {
 79 |             PopulateComboBox("Find");
 80 |             FindNext?.Invoke(this, e);
 81 |         }
 82 | 
 83 |         private void btnReplace_Click(object sender, RoutedEventArgs e)
 84 |         {
 85 |             PopulateComboBox("Find");
 86 |             PopulateComboBox("Replace");
 87 |             Replace?.Invoke(this, e);
 88 |         }
 89 | 
 90 |         private void btnReplaceAll_Click(object sender, RoutedEventArgs e)
 91 |         {
 92 |             PopulateComboBox("Find");
 93 |             PopulateComboBox("Replace");
 94 |             ReplaceAll?.Invoke(this, e);
 95 |         }
 96 | 
 97 |         private void btnClose_Click(object sender, RoutedEventArgs e)
 98 |         {
 99 |             this.Hide();
100 |             CloseDlg?.Invoke(this, e);
101 |         }
102 | 
103 |         /**
104 |          * Populates the combobox with entries from the corresponding text field
105 |          */
106 |         void PopulateComboBox(string button)
107 |         {
108 |             string text;
109 |             ComboBox comboBox;
110 | 
111 |             if (button == "Find")
112 |             {
113 |                 text = this.FindText;
114 |                 comboBox = this.cbFind;
115 |             }
116 |             else
117 |             {
118 |                 text = this.ReplaceText;
119 |                 comboBox = this.cbReplace;
120 |             }
121 |             if (text == string.Empty) return;
122 | 
123 |             if (!comboBox.Items.Contains(text))
124 |             {
125 |                 comboBox.Items.Insert(0, text);
126 |             }
127 |         }
128 | 
129 |         private void Window_Loaded(object sender, RoutedEventArgs e)
130 |         {
131 |             // integrate Viet Input Method
132 |             new VietKeyHandler(this.cbFind);
133 |             new VietKeyHandler(this.cbReplace);
134 | 
135 |             cbFind.Focus();
136 |         }
137 | 
138 |         private void cbFind_TextChanged(object sender, TextChangedEventArgs e)
139 |         {
140 |             btnFindNext.IsEnabled = btnReplace.IsEnabled = cbFind.Text.Length > 0;
141 |             btnReplaceAll.IsEnabled = cbFind.Text.Length > 0 && !(MatchRegex && !MatchDiacritics);
142 |         }
143 | 
144 |         private void option_Changed(object sender, RoutedEventArgs e)
145 |         {
146 |             if (sender == this.chkboxMatchDiacritics || sender == this.chkboxMatchRegex)
147 |             {
148 |                 btnReplaceAll.IsEnabled = cbFind.Text.Length > 0 && (!MatchRegex || MatchDiacritics);
149 |             }
150 |             if (sender == this.chkboxMatchRegex)
151 |             {
152 |                 this.chkboxMatchWholeWord.IsEnabled = !MatchRegex;
153 |             }
154 |             this.btnFindNext.Focus();
155 |         }
156 |     }
157 | }
158 | 


--------------------------------------------------------------------------------
/GuiWithPSM.cs:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * Copyright @ 2008 Quan Nguyen
  3 |  * 
  4 |  * Licensed under the Apache License, Version 2.0 (the "License");
  5 |  * you may not use this file except in compliance with the License.
  6 |  * You may obtain a copy of the License at
  7 |  *
  8 |  *  http://www.apache.org/licenses/LICENSE-2.0
  9 |  *
 10 |  * Unless required by applicable law or agreed to in writing, software
 11 |  * distributed under the License is distributed on an "AS IS" BASIS,
 12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 13 |  * See the License for the specific language governing permissions and
 14 |  * limitations under the License.
 15 | */
 16 | 
 17 | using System;
 18 | using System.Collections.Generic;
 19 | using System.ComponentModel;
 20 | //using Vietpad.NET.Controls;
 21 | using Microsoft.Win32;
 22 | using Tesseract;
 23 | using System.Windows.Controls;
 24 | using System.Windows;
 25 | 
 26 | namespace VietOCR
 27 | {
 28 |     public class GuiWithPSM : GuiWithBatch
 29 |     {
 30 |         const string strPSM = "PageSegMode";
 31 |         MenuItem psmItemChecked;
 32 | 
 33 |         public GuiWithPSM()
 34 |         {
 35 |             Dictionary<string, string> psmDict = new Dictionary<string, string>();
 36 |             psmDict.Add("OsdOnly", "0 - Orientation and script detection (OSD) only");
 37 |             psmDict.Add("AutoOsd", "1 - Automatic page segmentation with OSD");
 38 |             psmDict.Add("AutoOnly", "2 - Automatic page segmentation, but no OSD, or OCR");
 39 |             psmDict.Add("Auto", "3 - Fully automatic page segmentation, but no OSD (default)");
 40 |             psmDict.Add("SingleColumn", "4 - Assume a single column of text of variable sizes");
 41 |             psmDict.Add("SingleBlockVertText", "5 - Assume a single uniform block of vertically aligned text");
 42 |             psmDict.Add("SingleBlock", "6 - Assume a single uniform block of text");
 43 |             psmDict.Add("SingleLine", "7 - Treat the image as a single text line");
 44 |             psmDict.Add("SingleWord", "8 - Treat the image as a single word");
 45 |             psmDict.Add("CircleWord", "9 - Treat the image as a single word in a circle");
 46 |             psmDict.Add("SingleChar", "10 - Treat the image as a single character");
 47 |             psmDict.Add("SparseText", "11 - Find as much text as possible in no particular order");
 48 |             psmDict.Add("SparseTextOsd", "12 - Sparse text with orientation and script detection");
 49 |             psmDict.Add("RawLine", "13 - Treat the image as a single text line, bypassing hacks that are Tesseract-specific");
 50 |             psmDict.Add("Count", "14 - Number of enum entries");
 51 | 
 52 |             //
 53 |             // Settings PageSegMode submenu
 54 |             //
 55 |             RoutedEventHandler eh = new RoutedEventHandler(MenuPSMOnClick);
 56 | 
 57 |             foreach (string mode in Enum.GetNames(typeof(PageSegMode)))
 58 |             {
 59 |                 if ((PageSegMode)Enum.Parse(typeof(PageSegMode), mode) == PageSegMode.Count)
 60 |                 {
 61 |                     continue;
 62 |                 }
 63 |                 MenuItem psmItem = new MenuItem();
 64 |                 psmItem.Header = psmDict[mode];
 65 |                 psmItem.Tag = mode;
 66 |                 //psmItem.CheckOnClick = true;
 67 |                 psmItem.Click += eh;
 68 |                 this.psmToolStripMenuItem.Items.Add(psmItem);
 69 |             }
 70 |         }
 71 | 
 72 |         protected override void Window_Loaded(object sender, RoutedEventArgs e)
 73 |         {
 74 |             base.Window_Loaded(sender, e);
 75 | 
 76 |             for (int i = 0; i < this.psmToolStripMenuItem.Items.Count; i++)
 77 |             {
 78 |                 if (((MenuItem)this.psmToolStripMenuItem.Items[i]).Tag.ToString() == selectedPSM)
 79 |                 {
 80 |                     // Select PSM last saved
 81 |                     psmItemChecked = (MenuItem)psmToolStripMenuItem.Items[i];
 82 |                     psmItemChecked.IsChecked = true;
 83 |                     break;
 84 |                 }
 85 |             }
 86 | 
 87 |             this.statusLabelPSMvalue.Content = selectedPSM;
 88 |         }
 89 | 
 90 |         void MenuPSMOnClick(object obj, EventArgs ea)
 91 |         {
 92 |             if (psmItemChecked != null)
 93 |             {
 94 |                 psmItemChecked.IsChecked = false;
 95 |             }
 96 |             psmItemChecked = (MenuItem)obj;
 97 |             psmItemChecked.IsChecked = true;
 98 |             selectedPSM = psmItemChecked.Tag.ToString();
 99 |             this.statusLabelPSMvalue.Content = selectedPSM;
100 |         }
101 | 
102 |         protected override void LoadRegistryInfo(RegistryKey regkey)
103 |         {
104 |             base.LoadRegistryInfo(regkey);
105 |             selectedPSM = (string)regkey.GetValue(strPSM, Enum.GetName(typeof(PageSegMode), Tesseract.PageSegMode.Auto));
106 |             try
107 |             {
108 |                 // validate PSM value
109 |                 Tesseract.PageSegMode psm = (PageSegMode)Enum.Parse(typeof(PageSegMode), selectedPSM);
110 |             }
111 |             catch
112 |             {
113 |                 selectedPSM = Enum.GetName(typeof(PageSegMode), Tesseract.PageSegMode.Auto);
114 |             }
115 |         }
116 | 
117 |         protected override void SaveRegistryInfo(RegistryKey regkey)
118 |         {
119 |             base.SaveRegistryInfo(regkey);
120 |             regkey.SetValue(strPSM, selectedPSM);
121 |         }
122 |     }
123 | }
124 | 


--------------------------------------------------------------------------------
/Utilities/FileExtractor.cs:
--------------------------------------------------------------------------------
  1 | ///
  2 | /// http://wiki.sharpdevelop.net/GZip-and-Tar-Samples.ashx
  3 | /// http://wiki.sharpdevelop.net/SharpZipLib-Zip-Samples.ashx#Unpack_a_Zip_with_full_control_over_the_operation_3
  4 | ///
  5 | 
  6 | using System;
  7 | using System.Collections.Generic;
  8 | using System.Text;
  9 | using System.IO;
 10 | using ICSharpCode.SharpZipLib.Tar;
 11 | using ICSharpCode.SharpZipLib.GZip;
 12 | using ICSharpCode.SharpZipLib.Core;
 13 | using ICSharpCode.SharpZipLib.Zip;
 14 | 
 15 | namespace VietOCR.NET.Utilities
 16 | {
 17 |     class FileExtractor
 18 |     {
 19 |         public static void ExtractCompressedFile(string compressedArchiveName, string destFolder) 
 20 |         {
 21 |             if (compressedArchiveName.ToLower().EndsWith(".zip"))
 22 |             {
 23 |                 ExtractZipFile(compressedArchiveName, null, destFolder);
 24 |             }
 25 |             else if (compressedArchiveName.ToLower().EndsWith(".tar.gz"))
 26 |             {
 27 |                 ExtractTGZ(compressedArchiveName, destFolder);
 28 |             }
 29 |             else if (compressedArchiveName.ToLower().EndsWith(".gz"))
 30 |             {
 31 |                 ExtractGZip(compressedArchiveName, destFolder);
 32 |             }
 33 |             else
 34 |             {
 35 |                 string destFile = Path.Combine(destFolder, Path.GetFileName(compressedArchiveName));
 36 |                 // Ensure that the target does not exist
 37 |                 if (File.Exists(destFile))
 38 |                 {
 39 |                     File.Delete(destFile);
 40 |                 }
 41 |                     
 42 |                 File.Move(compressedArchiveName, destFile);
 43 |             }
 44 |         }
 45 |         
 46 |         public static void ExtractTGZ(string gzArchiveName, string destFolder)
 47 |         {
 48 |             Stream inStream = File.OpenRead(gzArchiveName);
 49 |             Stream gzipStream = new GZipInputStream(inStream);
 50 | 
 51 |             TarArchive tarArchive = TarArchive.CreateInputTarArchive(gzipStream);
 52 |             tarArchive.ExtractContents(destFolder);
 53 |             tarArchive.Close();
 54 | 
 55 |             gzipStream.Close();
 56 |             inStream.Close();
 57 |         }
 58 | 
 59 |         public static void ExtractGZip(string gzipFileName, string targetDir)
 60 |         {
 61 |             byte[] dataBuffer = new byte[4096];
 62 | 
 63 |             using (Stream fs = new FileStream(gzipFileName, FileMode.Open, FileAccess.Read))
 64 |             {
 65 |                 using (GZipInputStream gzipStream = new GZipInputStream(fs))
 66 |                 {
 67 |                     string fnOut = Path.Combine(targetDir, Path.GetFileNameWithoutExtension(gzipFileName));
 68 | 
 69 |                     using (FileStream fsOut = File.Create(fnOut))
 70 |                     {
 71 |                         StreamUtils.Copy(gzipStream, fsOut, dataBuffer);
 72 |                     }
 73 |                 }
 74 |             }
 75 |         }
 76 | 
 77 |         public static void ExtractZipFile(string archiveFilenameIn, string password, string outFolder)
 78 |         {
 79 |             ZipFile zf = null;
 80 |             try
 81 |             {
 82 |                 FileStream fs = File.OpenRead(archiveFilenameIn);
 83 |                 zf = new ZipFile(fs);
 84 |                 if (!string.IsNullOrEmpty(password))
 85 |                 {
 86 |                     zf.Password = password;		// AES encrypted entries are handled automatically
 87 |                 }
 88 |                 foreach (ZipEntry zipEntry in zf)
 89 |                 {
 90 |                     if (!zipEntry.IsFile)
 91 |                     {
 92 |                         continue;			// Ignore directories
 93 |                     }
 94 |                     string entryFileName = zipEntry.Name;
 95 |                     // to remove the folder from the entry:- entryFileName = Path.GetFileName(entryFileName);
 96 |                     // Optionally match entrynames against a selection list here to skip as desired.
 97 |                     // The unpacked length is available in the zipEntry.Size property.
 98 | 
 99 |                     byte[] buffer = new byte[4096];		// 4K is optimum
100 |                     Stream zipStream = zf.GetInputStream(zipEntry);
101 | 
102 |                     // Manipulate the output filename here as desired.
103 |                     string fullZipToPath = Path.Combine(outFolder, entryFileName);
104 |                     string directoryName = Path.GetDirectoryName(fullZipToPath);
105 |                     if (directoryName.Length > 0)
106 |                         Directory.CreateDirectory(directoryName);
107 | 
108 |                     // Unzip file in buffered chunks. This is just as fast as unpacking to a buffer the full size
109 |                     // of the file, but does not waste memory.
110 |                     // The "using" will close the stream even if an exception occurs.
111 |                     using (FileStream streamWriter = File.Create(fullZipToPath))
112 |                     {
113 |                         StreamUtils.Copy(zipStream, streamWriter, buffer);
114 |                     }
115 |                 }
116 |             }
117 |             finally
118 |             {
119 |                 if (zf != null)
120 |                 {
121 |                     zf.IsStreamOwner = true; // Makes close also shut the underlying stream
122 |                     zf.Close(); // Ensure we release resources
123 |                 }
124 |             }
125 |         }
126 |     }
127 | }
128 | 


--------------------------------------------------------------------------------
/DownloadDialog.vi.resx:
--------------------------------------------------------------------------------
  1 | <?xml version='1.0' encoding='UTF-8'?>
  2 | <root>
  3 |   <xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema" xmlns:msdata="urn:schemas-microsoft-com:xml-msdata" id="root">
  4 |     <xsd:import namespace="http://www.w3.org/XML/1998/namespace"/>
  5 |     <xsd:element name="root" msdata:IsDataSet="true">
  6 |       <xsd:complexType>
  7 |         <xsd:choice maxOccurs="unbounded">
  8 |           <xsd:element name="metadata">
  9 |             <xsd:complexType>
 10 |               <xsd:sequence>
 11 |                 <xsd:element name="value" type="xsd:string" minOccurs="0"/>
 12 |               </xsd:sequence>
 13 |               <xsd:attribute name="name" use="required" type="xsd:string"/>
 14 |               <xsd:attribute name="type" type="xsd:string"/>
 15 |               <xsd:attribute name="mimetype" type="xsd:string"/>
 16 |               <xsd:attribute ref="xml:space"/>
 17 |             </xsd:complexType>
 18 |           </xsd:element>
 19 |           <xsd:element name="assembly">
 20 |             <xsd:complexType>
 21 |               <xsd:attribute name="alias" type="xsd:string"/>
 22 |               <xsd:attribute name="name" type="xsd:string"/>
 23 |             </xsd:complexType>
 24 |           </xsd:element>
 25 |           <xsd:element name="data">
 26 |             <xsd:complexType>
 27 |               <xsd:sequence>
 28 |                 <xsd:element name="value" type="xsd:string" minOccurs="0" msdata:Ordinal="1"/>
 29 |                 <xsd:element name="comment" type="xsd:string" minOccurs="0" msdata:Ordinal="2"/>
 30 |               </xsd:sequence>
 31 |               <xsd:attribute name="name" type="xsd:string" use="required" msdata:Ordinal="1"/>
 32 |               <xsd:attribute name="type" type="xsd:string" msdata:Ordinal="3"/>
 33 |               <xsd:attribute name="mimetype" type="xsd:string" msdata:Ordinal="4"/>
 34 |               <xsd:attribute ref="xml:space"/>
 35 |             </xsd:complexType>
 36 |           </xsd:element>
 37 |           <xsd:element name="resheader">
 38 |             <xsd:complexType>
 39 |               <xsd:sequence>
 40 |                 <xsd:element name="value" type="xsd:string" minOccurs="0" msdata:Ordinal="1"/>
 41 |               </xsd:sequence>
 42 |               <xsd:attribute name="name" type="xsd:string" use="required"/>
 43 |             </xsd:complexType>
 44 |           </xsd:element>
 45 |         </xsd:choice>
 46 |       </xsd:complexType>
 47 |     </xsd:element>
 48 |   </xsd:schema>
 49 |   <resheader name="resmimetype">
 50 |     <value>text/microsoft-resx</value>
 51 |   </resheader>
 52 |   <resheader name="version">
 53 |     <value>2.0</value>
 54 |   </resheader>
 55 |   <resheader name="reader">
 56 |     <value>System.Resources.ResXResourceReader, System.Windows.Forms, Version=2.0.0.0, Culture=neutral, PublicKeyToken=b77a5c561934e089</value>
 57 |   </resheader>
 58 |   <resheader name="writer">
 59 |     <value>System.Resources.ResXResourceWriter, System.Windows.Forms, Version=2.0.0.0, Culture=neutral, PublicKeyToken=b77a5c561934e089</value>
 60 |   </resheader>
 61 |   <data name="$this.ClientSize" type="System.Drawing.Size, System.Drawing">
 62 |     <value>263, 180</value>
 63 |   </data>
 64 |   <data name="this.Title" xml:space="preserve">
 65 |     <value>Tải dữ liệu ngôn ngữ</value>
 66 |   </data>
 67 |   <data name="buttonCancel.Location" type="System.Drawing.Point, System.Drawing">
 68 |     <value>176, 54</value>
 69 |   </data>
 70 |   <data name="buttonCancel.Size" type="System.Drawing.Size, System.Drawing">
 71 |     <value>75, 23</value>
 72 |   </data>
 73 |   <data name="buttonCancel.Text" xml:space="preserve">
 74 |     <value>Bãi</value>
 75 |   </data>
 76 |   <data name="buttonClose.Location" type="System.Drawing.Point, System.Drawing">
 77 |     <value>176, 109</value>
 78 |   </data>
 79 |   <data name="buttonClose.Size" type="System.Drawing.Size, System.Drawing">
 80 |     <value>75, 23</value>
 81 |   </data>
 82 |   <data name="buttonClose.Text" xml:space="preserve">
 83 |     <value>Đóng</value>
 84 |   </data>
 85 |   <data name="buttonDownload.Location" type="System.Drawing.Point, System.Drawing">
 86 |     <value>176, 25</value>
 87 |   </data>
 88 |   <data name="buttonDownload.Size" type="System.Drawing.Size, System.Drawing">
 89 |     <value>75, 23</value>
 90 |   </data>
 91 |   <data name="buttonDownload.Text" xml:space="preserve">
 92 |     <value>Tải xuống</value>
 93 |   </data>
 94 |   <data name="groupBox1.Location" type="System.Drawing.Point, System.Drawing">
 95 |     <value>6, 6</value>
 96 |   </data>
 97 |   <data name="groupBox1.Size" type="System.Drawing.Size, System.Drawing">
 98 |     <value>158, 142</value>
 99 |   </data>
100 |   <data name="groupBox1.Text" xml:space="preserve">
101 |     <value>Các gói ngôn ngữ hiện có</value>
102 |   </data>
103 |   <data name="listBox1.Location" type="System.Drawing.Point, System.Drawing">
104 |     <value>3, 18</value>
105 |   </data>
106 |   <data name="listBox1.Size" type="System.Drawing.Size, System.Drawing">
107 |     <value>152, 121</value>
108 |   </data>
109 |   <data name="statusStrip1.Location" type="System.Drawing.Point, System.Drawing">
110 |     <value>0, 158</value>
111 |   </data>
112 |   <data name="statusStrip1.Size" type="System.Drawing.Size, System.Drawing">
113 |     <value>263, 22</value>
114 |   </data>
115 |   <data name="statusStrip1.Text" xml:space="preserve">
116 |     <value>statusStrip1</value>
117 |   </data>
118 |   <data name="toolStripProgressBar1.Size" type="System.Drawing.Size, System.Drawing">
119 |     <value>100, 16</value>
120 |   </data>
121 |   <data name="toolStripStatusLabel1.Size" type="System.Drawing.Size, System.Drawing">
122 |     <value>0, 17</value>
123 |   </data>
124 | </root>
125 | 


--------------------------------------------------------------------------------
/GuiWithThumbnail.cs:
--------------------------------------------------------------------------------
  1 | using System;
  2 | using System.ComponentModel;
  3 | using System.Linq;
  4 | using System.Windows;
  5 | using System.Windows.Controls;
  6 | using System.Windows.Controls.Primitives;
  7 | using System.Windows.Media;
  8 | using System.Windows.Media.Imaging;
  9 | using System.Windows.Shapes;
 10 | 
 11 | namespace VietOCR
 12 | {
 13 |     /// <summary>
 14 |     /// GUI layer that shows one thumbnail per page of the loaded image in the thumbnail
 15 |     /// panel. Thumbnails are generated on a <see cref="BackgroundWorker"/> and added to
 16 |     /// the panel as toggle-styled radio buttons, each followed by a marker and a page label.
 17 |     /// </summary>
 18 |     public class GuiWithThumbnail : GuiWithFile
 19 |     {
 20 |         // Size, in pixels, requested for every generated thumbnail.
 21 |         private const int ThumbnailWidth = 85;
 22 |         private const int ThumbnailHeight = 110;
 23 | 
 24 |         private BackgroundWorker backgroundWorkerLoadThumbnail;
 25 |         private Style toggleButtonStyle;
 26 | 
 27 |         // Set when loadThumbnails() is called while a previous run is still busy; that run
 28 |         // is cancelled and a fresh one is started from the RunWorkerCompleted handler.
 29 |         private bool reloadPending;
 30 | 
 31 |         public GuiWithThumbnail()
 32 |         {
 33 |             // Radio-button style based on the ToggleButton style.
 34 |             toggleButtonStyle = new Style(typeof(RadioButton), (Style)FindResource(typeof(ToggleButton)));
 35 |             this.backgroundWorkerLoadThumbnail = new BackgroundWorker();
 36 |             this.backgroundWorkerLoadThumbnail.WorkerReportsProgress = true;
 37 |             this.backgroundWorkerLoadThumbnail.WorkerSupportsCancellation = true;
 38 |             this.backgroundWorkerLoadThumbnail.DoWork += new DoWorkEventHandler(this.backgroundWorkerLoadThumbnail_DoWork);
 39 |             this.backgroundWorkerLoadThumbnail.ProgressChanged += new ProgressChangedEventHandler(this.backgroundWorkerLoadThumbnail_ProgressChanged);
 40 |             this.backgroundWorkerLoadThumbnail.RunWorkerCompleted += BackgroundWorkerLoadThumbnail_RunWorkerCompleted;
 41 |         }
 42 | 
 43 |         /// <summary>
 44 |         /// Clears the thumbnail panel and (re)starts background thumbnail generation.
 45 |         /// </summary>
 46 |         protected override void loadThumbnails()
 47 |         {
 48 |             this.panelThumbnail.Children.Clear();
 49 | 
 50 |             if (this.backgroundWorkerLoadThumbnail.IsBusy)
 51 |             {
 52 |                 // RunWorkerAsync() throws InvalidOperationException while a run is active,
 53 |                 // so cancel the current run and restart once it has completed.
 54 |                 this.reloadPending = true;
 55 |                 this.backgroundWorkerLoadThumbnail.CancelAsync();
 56 |                 return;
 57 |             }
 58 | 
 59 |             this.backgroundWorkerLoadThumbnail.RunWorkerAsync();
 60 |         }
 61 | 
 62 |         /// <summary>
 63 |         /// Checks the thumbnail button whose tag equals <paramref name="index"/>.
 64 |         /// Does nothing when no such button exists (e.g. thumbnails are still loading).
 65 |         /// </summary>
 66 |         /// <param name="index">Zero-based page index stored in the button's Tag.</param>
 67 |         protected override void selectThumbnail(int index)
 68 |         {
 69 |             RadioButton match = this.panelThumbnail.Children.OfType<RadioButton>()
 70 |                 .FirstOrDefault(x => x.Tag is int && (int)x.Tag == index);
 71 |             if (match != null)
 72 |             {
 73 |                 match.IsChecked = true;
 74 |             }
 75 |         }
 76 | 
 77 |         private void backgroundWorkerLoadThumbnail_DoWork(object sender, DoWorkEventArgs e)
 78 |         {
 79 |             // Work on the list that was current when this run started.
 80 |             var pages = imageList;
 81 | 
 82 |             // Create thumbnails; the page index is passed as the progress value.
 83 |             for (int i = 0; i < pages.Count; i++)
 84 |             {
 85 |                 if (this.backgroundWorkerLoadThumbnail.CancellationPending)
 86 |                 {
 87 |                     e.Cancel = true;
 88 |                     return;
 89 |                 }
 90 | 
 91 |                 System.Drawing.Image thumbnail = pages[i].GetThumbnailImage(ThumbnailWidth, ThumbnailHeight, null, IntPtr.Zero);
 92 |                 this.backgroundWorkerLoadThumbnail.ReportProgress(i, thumbnail);
 93 |             }
 94 |         }
 95 | 
 96 |         private void backgroundWorkerLoadThumbnail_ProgressChanged(object sender, ProgressChangedEventArgs e)
 97 |         {
 98 |             System.Drawing.Image thumbnail = (System.Drawing.Image)e.UserState;
 99 |             int pageIndex = e.ProgressPercentage;
100 | 
101 |             if (this.reloadPending)
102 |             {
103 |                 // This thumbnail belongs to a run that is being replaced; discard it.
104 |                 thumbnail.Dispose();
105 |                 return;
106 |             }
107 | 
108 |             // Load thumbnail, selection marker & page label into panel
109 |             RadioButton rb = createThumbnailButton(thumbnail, pageIndex);
110 |             this.panelThumbnail.Children.Add(rb);
111 |             this.panelThumbnail.Children.Add(createSelectionMarker(rb));
112 |             this.panelThumbnail.Children.Add(createPageLabel(pageIndex));
113 |         }
114 | 
115 |         // Builds the toggle-styled radio button that shows the thumbnail of one page.
116 |         // NOTE(review): the GDI+ thumbnail is not disposed after conversion; whether that
117 |         // would be safe depends on ImageConverter.BitmapToImageSource - confirm.
118 |         private RadioButton createThumbnailButton(System.Drawing.Image thumbnail, int pageIndex)
119 |         {
120 |             RadioButton rb = new RadioButton();
121 |             rb.Width = thumbnail.Width;
122 |             rb.Height = thumbnail.Height;
123 |             rb.Style = toggleButtonStyle;
124 |             System.Windows.Controls.Image image = new System.Windows.Controls.Image();
125 |             image.Source = ImageConverter.BitmapToImageSource(thumbnail);
126 |             rb.Content = image;
127 |             rb.HorizontalAlignment = HorizontalAlignment.Center;
128 |             rb.Tag = pageIndex;
129 |             rb.Click += new RoutedEventHandler(this.radioButton_Click);
130 |             return rb;
131 |         }
132 | 
133 |         // Builds the small teal square that is visible only while the given button is checked.
134 |         private Rectangle createSelectionMarker(RadioButton owner)
135 |         {
136 |             Rectangle rect = new Rectangle();
137 |             rect.HorizontalAlignment = HorizontalAlignment.Right;
138 |             rect.Width = 10;
139 |             rect.Height = 10;
140 |             rect.Fill = new SolidColorBrush(System.Windows.Media.Color.FromArgb(255, 0, 128, 128));
141 |             // Negative top margin pulls the marker up by 10 pixels.
142 |             rect.Margin = new Thickness(0, -10, 0, 0);
143 | 
144 |             // Visibility follows owner.IsChecked through BooleanToVisibilityConverter.
145 |             System.Windows.Data.Binding binding = new System.Windows.Data.Binding("IsChecked");
146 |             binding.Converter = new System.Windows.Controls.BooleanToVisibilityConverter();
147 |             binding.Source = owner;
148 |             rect.SetBinding(UIElement.VisibilityProperty, binding);
149 |             return rect;
150 |         }
151 | 
152 |         // Builds the label carrying the 1-based page number of a thumbnail.
153 |         private Label createPageLabel(int pageIndex)
154 |         {
155 |             Label label = new Label();
156 |             label.Content = pageIndex + 1;
157 |             label.HorizontalAlignment = HorizontalAlignment.Center;
158 |             label.Margin = new Thickness(0, -5, 0, 0);
159 |             return label;
160 |         }
161 | 
162 |         private void BackgroundWorkerLoadThumbnail_RunWorkerCompleted(object sender, RunWorkerCompletedEventArgs e)
163 |         {
164 |             if (this.reloadPending)
165 |             {
166 |                 // A newer load was requested while this run was active; start it now.
167 |                 this.reloadPending = false;
168 |                 loadThumbnails();
169 |                 return;
170 |             }
171 | 
172 |             if (e.Error != null)
173 |             {
174 |                 MessageBox.Show(e.Error.Message);
175 |             }
176 |             else if (e.Cancelled)
177 |             {
178 |                 //cancelled
179 |             }
180 |             else
181 |             {
182 |                 selectThumbnail(imageIndex);
183 |             }
184 |         }
185 | 
186 |         // Makes the clicked thumbnail's page current by selecting its 1-based number
187 |         // in the page combo box; clicking the already-current page does nothing.
188 |         private void radioButton_Click(object sender, RoutedEventArgs e)
189 |         {
190 |             int index = (int)((RadioButton)sender).Tag;
191 |             if (imageIndex == index)
192 |             {
193 |                 return;
194 |             }
195 |             imageIndex = index;
196 |             this.comboBoxPageNum.SelectedItem = (imageIndex + 1);
197 |         }
198 | 
199 |         //protected override void splitContainerImage_SplitterMoved(object sender, SplitterEventArgs e)
200 |         //{
201 |         //    foreach (Control con in this.panelThumbnail.Children)
202 |         //    {
203 |         //        int horizontalMargin = (int)(this.panelThumbnail.Width - con.Width) / 2;
204 |         //        con.Margin = new Thickness(horizontalMargin, 0, horizontalMargin, 2);
205 |         //    }
206 |         //}
207 |     }
208 | }
209 | 


--------------------------------------------------------------------------------
/FindReplaceDialog.xaml:
--------------------------------------------------------------------------------
 1 | <Window x:Class="VietOCR.FindReplaceDialog"
 2 |         xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
 3 |         xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
 4 |         xmlns:d="http://schemas.microsoft.com/expression/blend/2008"
 5 |         xmlns:mc="http://schemas.openxmlformats.org/markup-compatibility/2006"
 6 |         xmlns:local="clr-namespace:VietOCR"
 7 |         xmlns:resx="clr-namespace:VietOCR"
 8 |         mc:Ignorable="d"
 9 |         Title="{x:Static resx:FindReplaceDialog.this_Title}" Height="200" Width="410"
10 |         WindowStartupLocation="CenterOwner" ResizeMode="NoResize" Loaded="Window_Loaded"> <!-- Find/Replace dialog. Captions are read from FindReplaceDialog resources via x:Static, except the hard-coded "Options" header. -->
11 |     <Grid HorizontalAlignment="Stretch" VerticalAlignment="Stretch"> <!-- Root grid: two Auto-height rows, two star columns weighted 11:4. -->
12 |         <Grid.RowDefinitions>
13 |             <RowDefinition Height="Auto" />
14 |             <RowDefinition Height="Auto" />
15 |         </Grid.RowDefinitions>
16 |         <Grid.ColumnDefinitions>
17 |             <ColumnDefinition Width="11*" />
18 |             <ColumnDefinition Width="4*" />
19 |         </Grid.ColumnDefinitions>
20 | 
21 |         <Grid Margin="2,10,1,0"  Grid.Column="0" Grid.Row="0"> <!-- Find / Replace editable combo boxes with their labels. -->
22 |             <Grid.Resources>
23 |                 <Style TargetType="{x:Type ComboBox}">
24 |                     <Setter Property="Margin" Value="0,2,0,2" />
25 |                 </Style>
26 |             </Grid.Resources>
27 |             <Grid.RowDefinitions>
28 |                 <RowDefinition Height="Auto" />
29 |                 <RowDefinition Height="Auto" />
30 |             </Grid.RowDefinitions>
31 |             <Grid.ColumnDefinitions>
32 |                 <ColumnDefinition Width="Auto" />
33 |                 <ColumnDefinition Width="*" />
34 |             </Grid.ColumnDefinitions>
35 |             <Label x:Name="labelFind" Content="{x:Static resx:FindReplaceDialog.labelFind_Text}" Target="{Binding ElementName=cbFind}" HorizontalAlignment="Left" VerticalAlignment="Top" Grid.Column="0" Grid.Row="0"/>
36 |             <ComboBox x:Name="cbFind" HorizontalAlignment="Right" Width="190" Grid.Column="1" Grid.Row="0" IsEditable="True" TextBoxBase.TextChanged="cbFind_TextChanged"/>
37 |             <Label x:Name="labelReplace" Content="{x:Static resx:FindReplaceDialog.labelReplace_Text}" Target="{Binding ElementName=cbReplace}" HorizontalAlignment="Left" VerticalAlignment="Top" Grid.Column="0" Grid.Row="1"/>
38 |             <ComboBox x:Name="cbReplace" HorizontalAlignment="Right" Width="190" Grid.Column="1" Grid.Row="1" IsEditable="True" />
39 |         </Grid>
40 | 
41 |         <GroupBox Margin="2,0,0,0" Header="Options" Grid.Column="0" Grid.Row="1" Padding="3"> <!-- NOTE(review): Header is a literal string while the other captions use x:Static resources; consider localizing it. -->
42 |             <Grid Margin="2,0,0,0"> <!-- Search options: 3 rows x 2 columns; every Checked/Unchecked event goes to option_Changed. -->
43 |                 <Grid.Resources>
44 |                     <Style TargetType="{x:Type CheckBox}">
45 |                         <Setter Property="Margin" Value="0,4,0,4" />
46 |                     </Style>
47 |                     <Style TargetType="{x:Type RadioButton}">
48 |                         <Setter Property="Margin" Value="0,4,0,4" />
49 |                     </Style>
50 |                 </Grid.Resources>
51 |                 <Grid.RowDefinitions>
52 |                     <RowDefinition Height="Auto" />
53 |                     <RowDefinition Height="Auto" />
54 |                     <RowDefinition Height="Auto" />
55 |                 </Grid.RowDefinitions>
56 |                 <Grid.ColumnDefinitions>
57 |                     <ColumnDefinition Width="*" />
58 |                     <ColumnDefinition Width="Auto" />
59 |                 </Grid.ColumnDefinitions>
60 |                 <CheckBox x:Name="chkboxMatchCase" Content="{x:Static resx:FindReplaceDialog.chkboxMatchCase_Text}" Grid.Column="0" Grid.Row="0" Checked="option_Changed" Unchecked="option_Changed"/>
61 |                 <CheckBox x:Name="chkboxMatchWholeWord" Content="{x:Static resx:FindReplaceDialog.chkboxMatchWholeWord_Text}"  Grid.Column="0" Grid.Row="1" Checked="option_Changed" Unchecked="option_Changed"/>
62 |                 <CheckBox x:Name="chkboxMatchDiacritics" Content="{x:Static resx:FindReplaceDialog.chkboxMatchDiacritics_Text}"  Grid.Column="0" Grid.Row="2" Checked="option_Changed" Unchecked="option_Changed"/>
63 |                 <RadioButton x:Name="radiobtnSearchUp" Content="{x:Static resx:FindReplaceDialog.radiobtnUp_Text}"  Grid.Column="1" Grid.Row="0" Checked="option_Changed" Unchecked="option_Changed"/>
64 |                 <RadioButton x:Name="radiobtnSearchDown"  Content="{x:Static resx:FindReplaceDialog.radiobtnDown_Text}" Grid.Column="1" Grid.Row="1" Checked="option_Changed" Unchecked="option_Changed"/>
65 |                 <CheckBox x:Name="chkboxMatchRegex" Content="{x:Static resx:FindReplaceDialog.chkboxMatchRegex_Text}" Grid.Column="1" Grid.Row="2" Checked="option_Changed" Unchecked="option_Changed"/>
66 |             </Grid>
67 |         </GroupBox>
68 |         
69 |         <StackPanel VerticalAlignment="Top" Grid.Column="1" Grid.Row="0" Grid.RowSpan="2" Margin="5" > <!-- Button column, spanning both root rows. -->
70 |             <StackPanel.Resources>
71 |                 <Style TargetType="{x:Type Button}">
72 |                     <Setter Property="Margin" Value="5,5,5,0"/>
73 |                 </Style>
74 |             </StackPanel.Resources> <!-- Find Next, Replace and Replace All start disabled (IsEnabled=False); presumably code-behind enables them once there is text to find. TODO confirm. -->
75 |             <Button x:Name="btnFindNext" IsDefault="True" Content="{x:Static resx:FindReplaceDialog.btnFindNext_Text}" Click="btnFindNext_Click" IsEnabled="False"/>
76 |             <Button x:Name="btnReplace" Content="{x:Static resx:FindReplaceDialog.btnReplace_Text}" Click="btnReplace_Click" IsEnabled="False"/>
77 |             <Button x:Name="btnReplaceAll" Content="{x:Static resx:FindReplaceDialog.btnReplaceAll_Text}" Click="btnReplaceAll_Click" IsEnabled="False"/>
78 |             <Button x:Name="btnClose" Content="{x:Static resx:FindReplaceDialog.btnClose_Text}" Click="btnClose_Click"/>
79 |         </StackPanel>
80 | 
81 |     </Grid>
82 | </Window>
83 | 


--------------------------------------------------------------------------------
/Utilities/FormLocalizer.cs:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * Copyright @ 2008 Quan Nguyen
  3 |  * 
  4 |  * Licensed under the Apache License, Version 2.0 (the "License");
  5 |  * you may not use this file except in compliance with the License.
  6 |  * You may obtain a copy of the License at
  7 |  *
  8 |  *  http://www.apache.org/licenses/LICENSE-2.0
  9 |  *
 10 |  * Unless required by applicable law or agreed to in writing, software
 11 |  * distributed under the License is distributed on an "AS IS" BASIS,
 12 |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 13 |  * See the License for the specific language governing permissions and
 14 |  * limitations under the License.
 15 | */
 16 | using System;
 17 | using System.Collections.Generic;
 18 | using System.Text;
 19 | using System.Threading;
 20 | using System.ComponentModel;
 21 | using System.Reflection;
 22 | using System.Globalization;
 23 | using System.Windows;
 24 | using System.Windows.Controls;
 25 | 
 26 | namespace VietOCR.NET.Utilities
 27 | {
 28 |     /// <summary>
 29 |     /// Applies the localized strings of a culture to a window and to the controls held in
 30 |     /// the window type's non-public instance fields, which are discovered by reflection.
 31 |     /// </summary>
 32 |     class FormLocalizer
 33 |     {
 34 |         // Candidate properties, tried in this order; only the first one that exists on a
 35 |         // field's type is used. Entries with the same index belong together.
 36 |         private static readonly string[] PropertyNames = { "Header", "Content", "Text", "ToolTipText" };
 37 |         private static readonly Type[] PropertyTypes = { typeof(object), typeof(object), typeof(string), typeof(string) };
 38 | 
 39 |         // Suffix appended to the field name to build the resource key for each candidate.
 40 |         // NOTE(review): "ToolTipText" looks like a WinForms holdover (WPF elements expose ToolTip) - confirm.
 41 |         private static readonly string[] ResourceSuffixes = { ".Text", ".Text", ".Text", ".ToolTipText" };
 42 | 
 43 |         private Window form;
 44 |         private Type formType;
 45 | 
 46 |         /// <summary>
 47 |         /// Constructor.
 48 |         /// </summary>
 49 |         /// <param name="form">Window whose title and fields receive the localized text.</param>
 50 |         /// <param name="formType">Type whose resources and declared fields are used.</param>
 51 |         /// <exception cref="ArgumentNullException">An argument is null.</exception>
 52 |         public FormLocalizer(Window form, Type formType)
 53 |         {
 54 |             if (form == null)
 55 |                 throw new ArgumentNullException("form");
 56 |             if (formType == null)
 57 |                 throw new ArgumentNullException("formType");
 58 | 
 59 |             this.form = form;
 60 |             this.formType = formType;
 61 |         }
 62 | 
 63 |         /// <summary>
 64 |         /// Update UI elements.
 65 |         /// Original code from http://secure.codeproject.com/KB/locale/ChangeUICulture.aspx
 66 |         /// </summary>
 67 |         /// <param name="culture">Culture to apply; also becomes the current thread's UI culture.</param>
 68 |         public void ApplyCulture(CultureInfo culture)
 69 |         {
 70 |             // Applies culture to current Thread.
 71 |             Thread.CurrentThread.CurrentUICulture = culture;
 72 | 
 73 |             // Create a resource manager for this Form
 74 |             // and determine its fields via reflection.
 75 |             // (The SuspendLayout/ResumeLayout calls of the original article are not used here.)
 76 |             ComponentResourceManager resources = new ComponentResourceManager(formType);
 77 |             FieldInfo[] fieldInfos = formType.GetFields(BindingFlags.Instance |
 78 |                 BindingFlags.DeclaredOnly | BindingFlags.NonPublic);
 79 | 
 80 |             // If available, assign localized text to the window title.
 81 |             string title = resources.GetString("this.Title", culture);
 82 |             if (title != null)
 83 |                 form.Title = title;
 84 | 
 85 |             foreach (FieldInfo fieldInfo in fieldInfos)
 86 |             {
 87 |                 Type fieldType = fieldInfo.FieldType;
 88 |                 if (!fieldType.IsSubclassOf(typeof(Control)) && !fieldType.IsSubclassOf(typeof(MenuItem)))
 89 |                     continue;
 90 | 
 91 |                 // A declared but unassigned field has nothing to localize.
 92 |                 object target = fieldInfo.GetValue(form);
 93 |                 if (target == null)
 94 |                     continue;
 95 | 
 96 |                 ApplyLocalizedText(target, fieldType, fieldInfo.Name, resources, culture);
 97 |             }
 98 |         }
 99 | 
100 |         // Sets the first candidate property that targetType offers to the resource string
101 |         // named fieldName + suffix, when such a string exists for the culture.
102 |         private static void ApplyLocalizedText(object target, Type targetType, string fieldName,
103 |             ComponentResourceManager resources, CultureInfo culture)
104 |         {
105 |             for (int i = 0; i < PropertyNames.Length; i++)
106 |             {
107 |                 PropertyInfo property = targetType.GetProperty(PropertyNames[i], PropertyTypes[i]);
108 |                 if (property == null)
109 |                     continue;
110 | 
111 |                 string text = resources.GetString(fieldName + ResourceSuffixes[i], culture);
112 |                 // Skip properties without a public setter instead of throwing.
113 |                 if (text != null && property.GetSetMethod() != null)
114 |                     property.SetValue(target, text, null);
115 | 
116 |                 // Behaves like an else-if chain: stop at the first property the type
117 |                 // offers, even when no resource string exists for it.
118 |                 return;
119 |             }
120 |         }
121 |     }
122 | }
123 | 


--------------------------------------------------------------------------------
/readme_cs_ja.html:
--------------------------------------------------------------------------------
 1 | <html>
 2 | <head>
 3 | <meta http-equiv="Content-Type" content="text/html; charset=utf-8">
 4 | <title>VietOCR.NET - Tesseract OCRの.NET WPF 製GUIフロントエンド</title>
 5 | </head>
 6 | <body>
 7 |     <div>
 8 |         <h2 align="center">VietOCR.NET</h2>
 9 |         <h3>概要</h3>
10 |         <p><a href="http://vietocr.sourceforge.net/">VietOCR.NET</a>は.NET WPF で書かれた<a href="https://github.com/tesseract-ocr">Tesseract OCRエンジン</a>のGUIフロントエンドです。一般的な画像形式やマルチページTIFF形式の文字認識をサポートします。このプログラムはOCR処理につきまとう誤認識を修正する後処理をし、認識結果の正解率を向上させます。コマンドラインから実行すればコンソールアプリケーションとしても機能します。</p>
11 |         <p>バッチ処理がサポートされるようになりました。プログラムは監視フォルダ内の新しい画像ファイルを監視し、OCRエンジンを通して自動処理し出力フォルダに認識結果を出力します。</p>
12 |         <h3>システム要件</h3>
13 |         <p><a href="https://dotnet.microsoft.com/download/dotnet-framework/net48">Microsoft .NET Framework 4.8 再配布可能パッケージ</a>。</p>
14 |         <p>
15 |             If you encounter &quot;<i>Exception has been thrown by the target of an invocation</i>&quot; errors, please install
16 |             <a href="https://visualstudio.microsoft.com/downloads/">Microsoft Visual C++ 2022 Redistributable Package</a>.
17 |         </p>
18 |         <h3>インストール</h3>
19 |         <p>
20 |             If you do not have permission to install under the <code>C:\Program Files</code> folder,
21 |             you can specify another folder in the installer&#39;s Installation Folder dialog.
22 |         </p>
23 |         <p>Scanning support is provided via the Windows Image Acquisition Library v2.0.</p>
24 |         <p>
25 |             PDF support is provided via <a href="http://www.ghostscript.com/">GPL Ghostscript</a>. After installing the library, please ensure the dynamic-link
26 |             library <code>gsdll64.dll</code> is in the search path by setting the <code>Path</code>
27 |             environment variable, which is accessible through Windows&#39; Control Panel &gt;
28 |             System &gt; Advanced tab &gt; Environment Variables. For instance, append the following
29 |             to <code>Path</code> variable value for GS version 10.06.0:
30 |         </p>
31 |         <blockquote>
32 |             <p><code>;C:\Program Files\gs\gs10.06.0\bin</code></p>
33 |         </blockquote>
34 |         <p>
35 |             Spellcheck functionality is available through Hunspell, whose <a href="http://wiki.services.openoffice.org/wiki/Dictionaries">
36 |                 dictionary
37 |             </a> files (<code>.aff</code>, <code>.dic</code>) should be placed in <code>dict</code>
38 |             folder of VietOCR.
39 |         </p>
40 |         <h3>説明</h3>
41 |         <p>
42 |             <a href="https://github.com/tesseract-ocr/tessdata">Language data packs</a>
43 |             for Tesseract should be decompressed into the <code>tesseract</code> installation folder;
44 |             the data files, whose names start with ISO639-3 codes, will be placed in the <code>tessdata</code>
45 |             subdirectory. VietOCR also provides support for downloading and installing selected
46 |             language packs via <em>Download Language Data</em> menu item. Depending on the location
47 |             of the <code>tessdata</code> folder, you may be required to run the program as admin
48 |             to be able to install the downloaded data into the folder if it is inside a system
49 |             folder, such as in <code>C:\Program Files</code>.
50 |         </p>
51 |         <p>ベトナム語の言語データはTimes New Roman、Arial、Verdana、Courier Newのフォントで生成されています。そのためよく似たフォントグリフを持つ画像ではより良い認識成功率を示すでしょう。サポートしているフォントと違った見かけのフォントグリフを持つ画像をOCRするには、一般的に、特別にそれらの書体をTesseractに<a href="https://github.com/tesseract-ocr/tesseract/wiki/TrainingTesseract">学習</a>させた別の言語データパックを生成してください。一部のVNI、TCVN3(ABC)フォントの言語データも最新バージョンにバンドルされています。</p>
52 |         <p>
53 |             Images to be OCRed should be scanned at a resolution between 200 and 400 DPI (dots per
54 |             inch) in monochrome (black&amp;white) or grayscale. Scanning at higher
55 |             resolutions will not necessarily result in better recognition accuracy, which currently
56 |             can be higher than 97% for Vietnamese, and the next release of Tesseract may improve
57 |             it even further. Even so, the actual rates still depend greatly on the quality of
58 |             the scanned image. The typical settings for scanning are 300 DPI and 1 bpp (bits
59 |             per pixel) black&amp;white or 8 bpp grayscale, in uncompressed TIFF or PNG format.
60 |         </p>
61 |         <p><em>スクリーンショット モード</em>は低解像度の画像に対して、スクリーン プリントのように300dpiで再スケーリングし認識率を向上させます。</p>
62 |         <p>
63 |             In addition to the built-in text postprocessing algorithm, you can add your own
64 |             custom text replacement scheme via a UTF-8-encoded tab-delimited text file named <code>x.DangAmbigs.txt</code>,
65 |             where x is the ISO639-3 language code. Both plain and Regex text replacements are supported.
66 |         </p>
67 |         <p>
68 |             You can put init-only and non-init control parameters in <code>tessdata/configs/tess_configs</code>
69 |             and <code>tess_configvars</code> files, respectively, to modify Tesseract&#39;s
70 |             behaviour.
71 |         </p>
72 |         <p>組込みのツールにはOCR操作が便利になるように複数の画像やPDFファイルを単一のものに結合したり、メモリ不足例外が発生しそうな大きなPDFファイルを小さく分割したりする機能があります。</p>
73 |         <h3>後処理</h3>
74 |         <p>誤認識は一般的に3つのカテゴリに分類できます。誤認識の多くは文字の大文字/小文字に関係し（例 HOA、nhắC）、一般的なUnicode用テキストエディタで簡単に修正できます。他の多くの誤認識は、ダイアクリティカルマークの欠落、似ている形状の間違った文字など（huu – hưu、mang – marg、h0a – hoa、la – 1a、uhìu - nhìn）のOCR処理結果です。またこれらはスペルチェッカプログラムによって簡単に修正できます。組込みの後処理機能は前述の誤りの多くを修正するのに役立ちます。</p>
75 |         <p>誤認識の最後のカテゴリはセマンティックエラーであり、検出するのが最も困難です。これはその単語が辞書内では有効なエントリですが、文脈としては間違っていることを意味します。（例 tinh – tình、vân – vấn）これらのエラーはエディタを通して読み、元画像に応じてそれらを手作業で修正する必要があります。</p>
76 |         <p>組込み機能を使用してOCR誤認識の最初の2つのカテゴリを修正する方法は次のとおりです。</p>
77 |         <ol style="margin-top: 0in" start="1" type="1">
78 |             <li>行をグループ化します。各行が別々の1行段落としてOCRされるように、行が属する段落にグループ化してください。<i>書式</i>メニュー下の<i>改行を削除</i>機能を使用します。詩ではこの操作が必要ない場合があるので注意してください。</li>
79 |             <li>文字ケースエラーの大部分を修正するために、同じく<i>書式</i>メニュー下の<i>文字ケースを変更</i>を選択し<i>［センテンスケース］</i>を選択します。残った文字ケースエラーの部分を見つけて修正します。</li>
80 |             <li>統合<i>スペルチェック</i>を使用してスペルミスエラーを修正します。</li>
81 |         </ol>
82 |         <p>以上の処理により一般的な誤認識の大部分を除去できます。残るセマンティックエラーは少ないですが、人間がエディタを通して読み、スキャン元の文書のようにその文書を編集する必要があります。</p>
83 |         <p>質問がある場合は <a href="http://sourceforge.net/projects/vietocr/forums">VietOCRフォーラム</a>に投稿してください。</p>
84 |         <hr>
85 |     </div>
86 | </body>
87 | </html>
88 | 


--------------------------------------------------------------------------------