-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathunshred_main.cpp
More file actions
130 lines (113 loc) · 3.48 KB
/
unshred_main.cpp
File metadata and controls
130 lines (113 loc) · 3.48 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
//////////////////////////////////////////////////////////////////////////////////////////
//
// Naming conventions used in source files and header files.
//
// Let's assume the following text content to be unshredded by this programme.
//
// a1|a2|a3
// b1|b2|b3
// c1|c2|c3
// d1|d2|d3
//
// In above example, a1, a2 or b1, etc. is a string with same width, "|" is the delimiter
// used by programme.
//
// In the programme, above data will be stored into following 2 dimensional vector:
// {
// {a1,b1,c1,d1},
// {a2,b2,c2,d2},
// {a3,b3,c3,d3}
// }
//
// A text strip refers to {a1,b1,c1,d1}, or {a2,b2,c2,d2}, etc.
// A "column" is often used to refer a text strip in data members or variables in the programme.
//
//////////////////////////////////////////////////////////////////////////////////////////
#include <boost/algorithm/string/classification.hpp>
#include <boost/algorithm/string/trim.hpp>
#include <thread>
#include <iostream>
#include "singleton_diction.h"
#include "thread_controller.h"
#include "common_classes.h"
#include "text_unshredder.h"
using namespace std;
#ifndef UTFLAG
// Main function
int main()
#else
int UTmain(const string str_infile, const string str_outfile, bool b_thread_abnormal_flag)
#endif
{
try
{
// Singleton class
SingletonDiction & singleton_dict = SingletonDiction::GetInstance();
singleton_dict.Init();
singleton_dict.BuildWordPiece();
const int max_thread_number = 10;
thread unshred_thread[max_thread_number];
TextUnshredder text_unshredder;
// Populate Populate vec_text_columns_ from input file
#ifndef UTFLAG
text_unshredder.GetInput("shredded_text.ascii");
#else
text_unshredder.GetInput(str_infile);
#endif
for (int i = 0; i < max_thread_number; ++i)
{
unshred_thread[i] = thread(ThreadController::DoTextUnshredderInThread,text_unshredder);
}
for (int i = 0; i < max_thread_number; ++i)
unshred_thread[i].join();
#ifndef UTFLAG
if (ThreadController::n_thread_abnormals_ > 0)
#else
if (b_thread_abnormal_flag == true)
#endif
{
string s_abormals_count = to_string(ThreadController::n_thread_abnormals_);
string s_threads_count = to_string(max_thread_number);
string s_error_message = s_abormals_count + " out of " + s_threads_count + " threads threw abormal errors!";
throw runtime_error(s_error_message);
}
if (ThreadController::vec_final_merged_text_.empty())
{
throw runtime_error("Abnormal error occured!");
}
else
{
for ( int i = 0; i < ThreadController::vec_final_merged_text_.size(); ++i)
{
boost::trim_right_if (ThreadController::vec_final_merged_text_[i], boost::is_any_of(" "));
}
#ifndef UTFLAG
TextFileOperation::WriteText("restored_text.ascii", ThreadController::vec_final_merged_text_);
#else
TextFileOperation::WriteText(str_outfile, ThreadController::vec_final_merged_text_);
#endif
}
if (ThreadController::b_premature_flag_ == true)
{
#ifndef UTFLAG
cout <<"Partially restored! Number of "<< ThreadController::n_premature_column_count_ << " text strips cannot be restored successfully and just append to the right side!" << endl;
#endif
return 1;
}
else
{
#ifndef UTFLAG
cout <<"Successfully restored!" << endl;
#endif
return 0;
}
}
catch(exception & ref_exception)
{
#ifndef UTFLAG
cout << ref_exception.what() << endl;
cout << "Error occured. Abort!" << endl;
#endif
return 2;
}
}