This repository has been archived by the owner on May 7, 2024. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun_dcr_prod.bat
162 lines (137 loc) · 5.27 KB
/
run_dcr_prod.bat
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
@echo off
rem ----------------------------------------------------------------------------
rem
rem run_dcr_prod.bat: Document Content Recognition - Production Environment.
rem
rem Usage: run_dcr_prod[.bat] [action]
rem        Without an action a menu is shown and the action is read from
rem        the console.
rem
rem ----------------------------------------------------------------------------

rem Keep every variable change local to this script. Delayed expansion is
rem required for the exclamation-mark variable references used inside the
rem parenthesised blocks further down.
setlocal EnableDelayedExpansion

rem Quoted assignments make the end of each value explicit.
set "DCR_CHOICE_ACTION_DEFAULT=db_u"
set "DCR_ENVIRONMENT_TYPE=prod"
set "PYTHONPATH=src"
rem Determine the action to run. It is taken from the first command line
rem argument, with surrounding quotes removed. Without an argument the menu is
rem shown and the action is read from the console.
rem
rem SET /P leaves its variable untouched when the user only presses Enter, so
rem the variable is cleared before prompting. Otherwise a value inherited from
rem the calling environment would silently win over the default.
if "%~1" == "" (
    echo =========================================================
    echo all - Run the complete core processing of all new documents.
    echo ---------------------------------------------------------
    echo p_i - 1. Process the inbox directory.
    echo p_2_i - 2. Convert pdf documents to image files: pdf2image / Poppler.
    echo ocr - 3. Convert image files to pdf documents: Tesseract OCR / Tex Live.
    echo n_2_p - 2. Convert non-pdf documents to pdf documents: Pandoc
    echo ---------------------------------------------------------
    echo tet - 4. Extract text and metadata from pdf documents: PDFlib TET.
    echo s_p_j - 5. Store the parser result in a JSON file.
    echo tkn - 6. Create qualified document tokens. SpaCy.
    echo ---------------------------------------------------------
    echo db_c - Create the database.
    echo db_u - Upgrade the database.
    echo ---------------------------------------------------------
    echo e_lt - Export the line type rules.
    echo ---------------------------------------------------------
    echo m_p - Run the installation of the necessary 3rd party packages for production and compile all packages and modules.
    echo ---------------------------------------------------------
    set "DCR_CHOICE_ACTION="
    set /P DCR_CHOICE_ACTION="Enter the desired action [default: %DCR_CHOICE_ACTION_DEFAULT%] "
    if not defined DCR_CHOICE_ACTION (
        set "DCR_CHOICE_ACTION=%DCR_CHOICE_ACTION_DEFAULT%"
    )
) else (
    set "DCR_CHOICE_ACTION=%~1"
)
rem Announce the start and remove the log file left behind by a previous run.
echo.
echo Script %0 is now running
if exist logging_dcr.log del /f /q logging_dcr.log

rem Start banner listing the effective settings. The TIME line pipes an empty
rem line into TIME, so the current time is printed and the prompt for a new
rem time is answered with blank input.
echo =======================================================================
echo Start %0
echo -----------------------------------------------------------------------
echo DCR - Document Content Recognition.
echo -----------------------------------------------------------------------
echo CHOICE_ACTION : %DCR_CHOICE_ACTION%
echo ENVIRONMENT_TYPE : %DCR_ENVIRONMENT_TYPE%
echo PYTHONPATH : %PYTHONPATH%
echo -----------------------------------------------------------------------
echo:| TIME
echo =======================================================================
rem _CHOICE is assigned further down only when the action is a known launcher
rem action, so it starts out empty.
set _CHOICE=

rem Action m_p: install the 3rd party packages for production and compile all
rem packages and modules through make, then finish without calling the launcher.
rem Each failure message names the make target that actually failed.
if ["%DCR_CHOICE_ACTION%"] EQU ["m_p"] (
    make pipenv-prod
    if ERRORLEVEL 1 (
        echo Processing of the script: %0 - step: 'make pipenv-prod' was aborted
        exit -1073741510
    )
    make compileall
    if ERRORLEVEL 1 (
        echo Processing of the script: %0 - step: 'make compileall' was aborted
        exit -1073741510
    )
    goto normal_exit
)
rem Accept the action only if it is one of the launcher actions. On a match
rem _CHOICE receives the action; otherwise _CHOICE is left unchanged.
for %%A in (all db_c db_u e_lt n_2_p ocr p_i p_2_i s_p_j tet tkn) do (
    if ["%DCR_CHOICE_ACTION%"] EQU ["%%A"] set _CHOICE=%DCR_CHOICE_ACTION%
)
rem Run the launcher for a validated action. An action that is a step of the
rem document pipeline is prefixed with all preceding steps, each step listed
rem exactly once. Every other action is passed on unchanged.
rem
rem The percent-style references to DCR_CHOICE_ACTION inside this block are
rem substituted once, when the whole block is parsed, so every test sees the
rem action as originally chosen. Only the exclamation-mark references see the
rem expanded step list, which is why the launcher call and the failure message
rem both use that form.
if ["!_CHOICE!"] EQU ["%DCR_CHOICE_ACTION%"] (
    if ["%DCR_CHOICE_ACTION%"] EQU ["p_2_i"] set DCR_CHOICE_ACTION=p_i p_2_i
    if ["%DCR_CHOICE_ACTION%"] EQU ["ocr"] set DCR_CHOICE_ACTION=p_i p_2_i ocr
    if ["%DCR_CHOICE_ACTION%"] EQU ["n_2_p"] set DCR_CHOICE_ACTION=p_i p_2_i ocr n_2_p
    if ["%DCR_CHOICE_ACTION%"] EQU ["tet"] set DCR_CHOICE_ACTION=p_i p_2_i ocr n_2_p tet
    if ["%DCR_CHOICE_ACTION%"] EQU ["s_p_j"] set DCR_CHOICE_ACTION=p_i p_2_i ocr n_2_p tet s_p_j
    if ["%DCR_CHOICE_ACTION%"] EQU ["tkn"] set DCR_CHOICE_ACTION=p_i p_2_i ocr n_2_p tet s_p_j tkn
    pipenv run python src\dcr\launcher.py !DCR_CHOICE_ACTION!
    if ERRORLEVEL 1 (
        echo Processing of the script: %0 - step: 'python src\dcr\launcher.py !DCR_CHOICE_ACTION!' was aborted
        exit -1073741510
    )
    goto normal_exit
)
rem Reached only when the action was handled by none of the blocks above, since
rem those either jump to normal_exit or exit. Print the usage line and stop.
rem EXIT without /B also ends the calling cmd.exe session.
rem NOTE review: -1073741510 equals 0xC000013A as an unsigned 32-bit value,
rem which looks like the NTSTATUS code for termination by Ctrl+C - confirm
rem that this exit code is intended.
echo Usage: "run_dcr_prod[.bat] all | db_c | db_u | e_lt | m_p | n_2_p | ocr | p_i | p_2_i | s_p_j | tet | tkn"
exit -1073741510
rem Common successful end: closing banner with the current time.
:normal_exit
echo -----------------------------------------------------------------------
echo:| TIME
echo -----------------------------------------------------------------------
echo End %0
echo =======================================================================