Add document edge-cropping (Dewarp) project

kangtan committed 1 year ago
parent
commit
df4c0d4310
46 changed files with 2,896 additions and 0 deletions
  1. .gitignore (+8 -0)
  2. Dewarp/LICENSE (+201 -0)
  3. Dewarp/README.md (+93 -0)
  4. Dewarp/corner_data_generator.py (+68 -0)
  5. Dewarp/csv_convert.py (+40 -0)
  6. Dewarp/data.csv (+4 -0)
  7. Dewarp/data_augmentor/augmentData.py (+67 -0)
  8. Dewarp/data_augmentor/cornerData.py (+63 -0)
  9. Dewarp/data_augmentor/label.py (+32 -0)
  10. Dewarp/data_augmentor/testData.py (+21 -0)
  11. Dewarp/dataprocessor/__init__.py (+4 -0)
  12. Dewarp/dataprocessor/dataloaders.py (+117 -0)
  13. Dewarp/dataprocessor/dataset.py (+207 -0)
  14. Dewarp/dataprocessor/datasetfactory.py (+19 -0)
  15. Dewarp/dataprocessor/loaderfactory.py (+21 -0)
  16. Dewarp/dataset_intro.md (+24 -0)
  17. Dewarp/demo.py (+72 -0)
  18. Dewarp/document_data_generator.py (+72 -0)
  19. Dewarp/evaluate.py (+69 -0)
  20. Dewarp/evaluation/__init__.py (+6 -0)
  21. Dewarp/evaluation/corner_extractor.py (+72 -0)
  22. Dewarp/evaluation/corner_refiner.py (+84 -0)
  23. Dewarp/experiment/__init__.py (+1 -0)
  24. Dewarp/experiment/experiment.py (+53 -0)
  25. Dewarp/json_to_csv.py (+28 -0)
  26. Dewarp/model/__init__.py (+1 -0)
  27. Dewarp/model/cornerModel.py (+78 -0)
  28. Dewarp/model/modelfactory.py (+37 -0)
  29. Dewarp/model/res_utils.py (+37 -0)
  30. Dewarp/model/resnet32.py (+184 -0)
  31. Dewarp/plotter/__init__.py (+1 -0)
  32. Dewarp/plotter/plotter.py (+88 -0)
  33. Dewarp/pytorch2onnx.py (+10 -0)
  34. Dewarp/pytorch2paddle.py (+19 -0)
  35. Dewarp/results/qualitativeResults.jpg (BIN)
  36. Dewarp/smartdoc_data_processor/video_to_image.py (+41 -0)
  37. Dewarp/train_model.py (+157 -0)
  38. Dewarp/train_seg_model.py (+149 -0)
  39. Dewarp/trainer/__init__.py (+2 -0)
  40. Dewarp/trainer/evaluator.py (+63 -0)
  41. Dewarp/trainer/trainer.py (+111 -0)
  42. Dewarp/utils/__init__.py (+2 -0)
  43. Dewarp/utils/colorer.py (+114 -0)
  44. Dewarp/utils/utils.py (+296 -0)
  45. Dewarp/video_to_images.py (+40 -0)
  46. Dewarp/write_json.py (+20 -0)

+ 8 - 0
.gitignore

@@ -27,6 +27,14 @@ __pycache__/
 /output/
 /inference_model/
 /output_inference/
+/Dewarp/convert_result/
+/Dewarp/datasets/
+/Dewarp/outputs/
+/Dewarp/test_data/
+/Dewarp/test_imgs/
+/Dewarp/imgs_result/
+/Dewarp/video/
+/Dewarp/video_frame/
 /parts/
 /sdist/
 /var/

+ 201 - 0
Dewarp/LICENSE

@@ -0,0 +1,201 @@
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "{}"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright {yyyy} {name of copyright owner}
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.

+ 93 - 0
Dewarp/README.md

Diff omitted because the file is too large

+ 68 - 0
Dewarp/corner_data_generator.py

@@ -0,0 +1,68 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import os
+import cv2
+import numpy as np
+
+import dataprocessor
+from utils import utils
+
+
+def args_processor():
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-i", "--input-dir", help="Path to data files (extract images using video_to_image.py first)")
+    parser.add_argument("-o", "--output-dir", help="Directory to store results")
+    parser.add_argument("--dataset", default="smartdoc", help="'smartdoc' or 'selfcollected' dataset")
+    return parser.parse_args()
+
+
+if __name__ == '__main__':
+    args = args_processor()
+    input_directory = args.input_dir
+    if not os.path.isdir(args.output_dir):
+        os.mkdir(args.output_dir)
+    import csv
+
+    # Dataset iterator
+    if args.dataset=="smartdoc":
+        dataset_test = dataprocessor.dataset.SmartDocDirectories(input_directory)
+    elif args.dataset=="selfcollected":
+        dataset_test = dataprocessor.dataset.SelfCollectedDataset(input_directory)
+    else:
+        print ("Incorrect dataset type; please choose between smartdoc or selfcollected")
+        assert(False)
+    with open(os.path.join(args.output_dir, 'gt.csv'), 'a', newline='') as csvfile:
+        spamwriter = csv.writer(csvfile, delimiter=',',
+                                quotechar='|')
+        # Counter for file naming
+        counter = 0
+        for data_elem in dataset_test.myData:
+
+            img_path = data_elem[0]
+            target = data_elem[1].reshape((4, 2))
+            img = cv2.imread(img_path)
+            if args.dataset=="selfcollected":
+                target = target / (img.shape[1], img.shape[0])
+                target = target * (1920, 1920)
+                img = cv2.resize(img, (1920, 1920))
+            corner_cords = target
+
+            for angle in range(0, 90, 1):
+                print(angle)
+                img_rotate, gt_rotate = utils.rotate(img, corner_cords, angle)
+                for random_crop in range(0, 1):
+                    img_list, gt_list = utils.get_corners(img_rotate, gt_rotate)
+                    for a in range(0, 4):
+                        counter += 1
+                        f_name = str(counter).zfill(8)
+                        print(gt_list[a])
+                        gt_store = list(np.array(gt_list[a]) / (300, 300))
+                        img_store = cv2.resize(img_list[a], (64, 64))
+                        # cv2.circle(img_store, tuple(list((np.array(gt_store)*64).astype(int))), 2, (255, 0, 0), 2)
+
+                        cv2.imwrite(os.path.join(args.output_dir, f_name + ".jpg"),
+                                    img_store, [int(cv2.IMWRITE_JPEG_QUALITY), 80])
+                        spamwriter.writerow((f_name + ".jpg", tuple(gt_store)))
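
For reference, the gt.csv written above can be read back with the same csv settings. A minimal sketch, assuming each row is (filename, "(x, y)") with coordinates normalized to [0, 1]; the path is hypothetical:

    import ast
    import csv

    # Mirror the writer: comma-delimited with '|' as the quote character.
    with open("gt.csv", newline="") as f:
        for name, raw in csv.reader(f, delimiter=",", quotechar="|"):
            # raw looks like "(0.123, 0.456)"; strip any numpy "array"
            # wrapper, as dataset.SmartDocCorner does for the same file.
            x, y = ast.literal_eval(raw.replace("array", ""))
            print(name, x, y)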

+ 40 - 0
Dewarp/csv_convert.py

@@ -0,0 +1,40 @@
+import argparse
+import csv
+import os
+from tqdm import tqdm
+
+
+def run(csv_path, save_folder):
+    if not os.path.exists(csv_path):
+        print(csv_path, 'not exist')
+        return
+    if not os.path.exists(save_folder):
+        os.makedirs(save_folder)
+    csv_file = csv.reader(open(csv_path, 'r'))
+    cnt = 1
+    for line in tqdm(csv_file):
+        # file name
+        name = line[0].split('/')[-1]
+        print(name)
+        if cnt != 1:
+            with open(save_folder + '/' + name + '.csv', 'a', encoding='utf-8') as fp:
+                # write out the four corner-point coordinates
+                ll = line[7:]
+                height = int(ll[4].split(':')[-1])
+                width = int(ll[5][16:-1])
+                # print(height*width)
+                for i in range(0, 24, 6):
+                    x = float(ll[i].split(':')[-1])
+                    y = float(ll[i+1].split(':')[-1])
+                    text = str(width*x/100) + ' ' + str(height*y/100) + '\n'
+                    fp.write(text)
+            fp.close()
+        cnt += 1
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser()
+    parser.add_argument('--csv_path', type=str, default='my_data_1.0.1.csv')
+    parser.add_argument('--save_folder', type=str, default='./convert_result')
+    args = parser.parse_args()
+    run(args.csv_path, args.save_folder)

+ 4 - 0
Dewarp/data.csv

@@ -0,0 +1,4 @@
+470.909090909091 511.27272727272725
+1905.0 568.0909090909091
+373.18181818181824 2618.090909090909
+2066.3636363636365 2638.5454545454545
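
data.csv above is a sample per-image annotation: one "x y" corner per line, in image pixels, in the same space-delimited format SelfCollectedDataset parses. A minimal loading sketch under that assumption:

    import numpy as np

    def load_corners(path):
        # Four whitespace-separated "x y" rows -> a (4, 2) float32 array.
        return np.loadtxt(path, dtype=np.float32).reshape(4, 2)

    print(load_corners("Dewarp/data.csv"))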

+ 67 - 0
Dewarp/data_augmentor/augmentData.py

@@ -0,0 +1,67 @@
+import os
+
+import cv2
+import numpy as np
+
+import utils
+
+
+def argsProcessor():
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-i", "--dataPath", help="DataPath")
+    parser.add_argument("-o", "--outputFiles", help="outputFiles", default="bar")
+    return parser.parse_args()
+
+args = argsProcessor()
+
+output_dir = args.outputFiles
+if (not os.path.isdir(output_dir)):
+    os.mkdir(output_dir)
+
+dir = args.dataPath
+import csv
+
+with open(output_dir+"/gt.csv", 'a') as csvfile:
+    spamwriter_1 = csv.writer(csvfile, delimiter=',',
+                                quotechar='|', quoting=csv.QUOTE_MINIMAL)
+    for image in os.listdir(dir):
+        if image.endswith("jpg") or image.endswith("JPG"):
+            if os.path.isfile(dir+"/"+image+".csv"):
+                with open(dir+"/"+image+ ".csv", 'r') as csvfile:
+                    spamwriter = csv.reader(csvfile, delimiter=' ',
+                                            quotechar='|', quoting=csv.QUOTE_MINIMAL)
+                    img = cv2.imread(dir +"/"+ image)
+                    print (image)
+                    gt= []
+                    for row in spamwriter:
+                        gt.append(row)
+                        # img = cv2.circle(img, (int(float(row[0])), int(float(row[1]))), 2,(255,0,0),90)
+                    gt =np.array(gt).astype(np.float32)
+                    gt = gt / (img.shape[1], img.shape[0])
+                    gt = gt * (1080, 1080)
+                    img = cv2.resize(img, (1080, 1080))
+
+
+                    print (gt)
+
+                    for angle in range(0,271,90):
+                        img_rotate, gt_rotate = utils.rotate(img, gt, angle)
+                        for random_crop in range(0,16):
+                            img_crop, gt_crop = utils.random_crop(img_rotate, gt_rotate)
+                            mah_size = img_crop.shape
+                            img_crop = cv2.resize(img_crop, (64, 64))
+                            gt_crop = np.array(gt_crop)
+
+                            # gt_crop = gt_crop*(1.0 / mah_size[1],1.0 / mah_size[0])
+
+                            # for a in range(0,4):
+                            # no=0
+                            # for a in range(0,4):
+                            #     no+=1
+                            #     cv2.circle(img_crop, tuple(((gt_crop[a]*64).astype(int))), 2,(255-no*60,no*60,0),9)
+                            # # # cv2.imwrite("asda.jpg", img)
+
+                            cv2.imwrite(output_dir + "/" +str(angle)+str(random_crop)+ image, img_crop)
+                            spamwriter_1.writerow((str(angle)+str(random_crop)+ image, tuple(list(gt_crop))))
+

+ 63 - 0
Dewarp/data_augmentor/cornerData.py

@@ -0,0 +1,63 @@
+import os
+
+import cv2
+import numpy as np
+
+import utils
+
+def argsProcessor():
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-i", "--dataPath", help="DataPath")
+    parser.add_argument("-o", "--outputFiles", help="outputFiles", default="bar")
+    return parser.parse_args()
+
+args = argsProcessor()
+
+output_dir = args.outputFiles
+if (not os.path.isdir(output_dir)):
+    os.mkdir(output_dir)
+
+dir = args.dataPath
+import csv
+
+with open(output_dir+"/gt.csv", 'a') as csvfile:
+    spamwriter_1 = csv.writer(csvfile, delimiter=',',
+                                quotechar='|', quoting=csv.QUOTE_MINIMAL)
+    for image in os.listdir(dir):
+        if image.endswith("jpg"):
+            if os.path.isfile(dir+"/"+image+".csv"):
+                with open(dir+"/"+image+ ".csv", 'r') as csvfile:
+                    spamwriter = csv.reader(csvfile, delimiter=' ',
+                                            quotechar='|', quoting=csv.QUOTE_MINIMAL)
+                    img = cv2.imread(dir +"/"+ image)
+                    print (image)
+                    gt= []
+                    for row in spamwriter:
+                        gt.append(row)
+                        # img = cv2.circle(img, (int(float(row[0])), int(float(row[1]))), 2,(255,0,0),90)
+                    gt =np.array(gt).astype(np.float32)
+
+
+                    # print gt
+                    gt = gt / (img.shape[1], img.shape[0])
+
+                    gt = gt * (1080, 1080)
+
+                    img = cv2.resize(img, ( 1080,1080))
+                    # for a in range(0,4):
+                    #     img = cv2.circle(img, tuple((gt[a].astype(int))), 2, (255, 0, 0), 9)
+                    # cv2.imwrite("asda.jpg", img)
+                    # 0/0
+                    for angle in range(0,271,90):
+                        img_rotate, gt_rotate = utils.rotate(img, gt, angle)
+                        for random_crop in range(0,16):
+                            img_list, gt_list = utils.getCorners(img_rotate, gt_rotate)
+                            for a in range(0,4):
+                                print (gt_list[a])
+                                gt_store = list(np.array(gt_list[a])/(300,300))
+                                img_store = cv2.resize(img_list[a], (64,64))
+                                print (tuple(list(np.array(gt_store)*64)))
+                                # cv2.circle(img_store, tuple(list((np.array(gt_store)*64).astype(int))), 2, (255, 0, 0), 2)
+                                cv2.imwrite( output_dir+"/"+image + str(angle) +str(random_crop) + str(a) +".jpg", img_store)
+                                spamwriter_1.writerow(( image + str(angle) +str(random_crop) + str(a) +".jpg", tuple(gt_store)))

+ 32 - 0
Dewarp/data_augmentor/label.py

@@ -0,0 +1,32 @@
+import os
+
+import matplotlib.image as mpimg
+import matplotlib.pyplot as plt
+
+current_file = None
+
+
+def onclick(event):
+    if event.dblclick:
+        print('button=%d, x=%d, y=%d, xdata=%f, ydata=%f' %
+              (event.button, event.x, event.y, event.xdata, event.ydata))
+        import csv
+        with open(current_file + ".csv", 'a') as csvfile:
+            spamwriter = csv.writer(csvfile, delimiter=' ',
+                                    quotechar='|', quoting=csv.QUOTE_MINIMAL)
+            spamwriter.writerow([str(event.xdata), str(event.ydata)])
+
+
+dir = "../data1/"
+for image in os.listdir(dir):
+    if image.endswith("jpg") or image.endswith("JPG"):
+        if os.path.isfile(dir + image + ".csv"):
+            pass
+        else:
+            fig = plt.figure()
+            cid = fig.canvas.mpl_connect('button_press_event', onclick)
+            print(dir + image)
+            current_file = dir + image
+            img = mpimg.imread(dir + image)
+            plt.imshow(img)
+            plt.show()

+ 21 - 0
Dewarp/data_augmentor/testData.py

@@ -0,0 +1,21 @@
+import os
+import numpy as np
+import cv2
+import csv
+
+dir = "../data1/"
+for image in os.listdir(dir):
+    if image.endswith("jpg") or image.endswith("JPG"):
+        if os.path.isfile(dir+image+".csv"):
+            with open(dir+image+ ".csv", 'r') as csvfile:
+                spamwriter = csv.reader(csvfile, delimiter=' ',
+                                        quotechar='|', quoting=csv.QUOTE_MINIMAL)
+                img = cv2.imread(dir + image)
+                no = 0
+                for row in spamwriter:
+                    no+=1
+                    print (row)
+                    img = cv2.circle(img, (int(float(row[0])), int(float(row[1]))), 2,(255-no*60,no*60,0),90)
+                img = cv2.resize(img, (300,300))
+                cv2.imshow("a",img)
+                cv2.waitKey(0)

+ 4 - 0
Dewarp/dataprocessor/__init__.py

@@ -0,0 +1,4 @@
+from dataprocessor.datasetfactory import *
+from dataprocessor.dataloaders import *
+from dataprocessor.loaderfactory import *
+from dataprocessor.dataset import *

+ 117 - 0
Dewarp/dataprocessor/dataloaders.py

@@ -0,0 +1,117 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import logging
+
+import PIL
+import torch.utils.data as td
+import tqdm
+from PIL import Image
+
+logger = logging.getLogger('iCARL')
+
+
+class HddLoader(td.Dataset):
+    def __init__(self, data, transform=None, cuda=False):
+        self.data = data
+
+        self.transform = transform
+        self.cuda = cuda
+        self.len = len(data[0])
+
+    def __len__(self):
+        return self.len
+
+    def __getitem__(self, index):
+        '''
+        Return the (image, target) pair at the given index.
+        :param index: sample index
+        :return: (img, target) tuple
+        '''
+        assert (index < len(self.data[0]))
+        assert (index < self.len)
+        img = Image.open(self.data[0][index])
+        target = self.data[1][index]
+        if self.transform is not None:
+            img = self.transform(img)
+
+        return img, target
+
+class RamLoader(td.Dataset):
+    def __init__(self, data, transform=None, cuda=False):
+        self.data = data
+
+        self.transform = transform
+        self.cuda = cuda
+        self.len = len(data[0])
+        self.loadInRam()
+
+    def loadInRam(self):
+        self.loaded_data = []
+        logger.info("Loading data in RAM")
+        for i in tqdm.tqdm(self.data[0]):
+            img = Image.open(i)
+            if self.transform is not None:
+                img = self.transform(img)
+            self.loaded_data.append(img)
+
+    def __len__(self):
+        return self.len
+
+    def __getitem__(self, index):
+        '''
+        Return the (image, target) pair at the given index.
+        :param index: sample index
+        :return: (img, target) tuple
+        '''
+        assert (index < len(self.data[0]))
+        assert (index < self.len)
+        target = self.data[1][index]
+        img = self.loaded_data[index]
+        return img, target
+
+
+
+class SingleFolderLoaderResized(td.Dataset):
+    '''
+    This loader resizes every image to 32x32 on disk up front, so per-item decoding stays cheap.
+    '''
+
+    def __init__(self, data, transform=None, cuda=False):
+
+        self.data = data
+
+        self.transform = transform
+        self.cuda = cuda
+        self.len = len(data)
+        self.decodeImages()
+
+    def decodeImages(self):
+        self.loaded_data = []
+        logger.info("Resizing Images")
+        for i in tqdm.tqdm(self.data):
+            i = i[0]
+            img = Image.open(i)
+            img = img.resize((32, 32), PIL.Image.LANCZOS)  # Image.ANTIALIAS was removed in Pillow 10
+            img.save(i)
+
+    def __len__(self):
+        return self.len
+
+    def __getitem__(self, index):
+        '''
+        Return the (image, target) pair at the given index.
+        :param index: sample index
+        :return: (img, target) tuple
+        '''
+        assert (index < len(self.data))
+        assert (index < self.len)
+
+        img = Image.open(self.data[index][0])
+        target = self.data[index][1]
+        if self.transform is not None:
+            img = self.transform(img)
+
+        return img, target
+

+ 207 - 0
Dewarp/dataprocessor/dataset.py

@@ -0,0 +1,207 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import csv
+import logging
+import os
+import xml.etree.ElementTree as ET
+
+import numpy as np
+from torchvision import transforms
+
+import utils.utils as utils
+
+# To include a new dataset, inherit from Dataset and add all the dataset-specific parameters here.
+# Goal : Remove any data specific parameters from the rest of the code
+
+logger = logging.getLogger('iCARL')
+
+
+class Dataset():
+    '''
+    Base class to represent a dataset
+    '''
+
+    def __init__(self, name):
+        self.name = name
+        self.data = []
+        self.labels = []
+
+
+class SmartDoc(Dataset):
+    '''
+    SmartDoc dataset: reads gt.csv files of full-document corner labels (8 values per image)
+    '''
+
+    def __init__(self, directory="data"):
+        super().__init__("smartdoc")
+        self.data = []
+        self.labels = []
+        for d in directory:
+            self.directory = d
+            self.train_transform = transforms.Compose([transforms.Resize([32, 32]),
+                                                       transforms.ColorJitter(1.5, 1.5, 0.9, 0.5),
+                                                       transforms.ToTensor()])
+
+            self.test_transform = transforms.Compose([transforms.Resize([32, 32]),
+                                                      transforms.ToTensor()])
+
+            logger.info("Pass train/test data paths here")
+
+            self.classes_list = {}
+
+            file_names = []
+            print (self.directory, "gt.csv")
+            with open(os.path.join(self.directory, "gt.csv"), 'r') as csvfile:
+                spamreader = csv.reader(csvfile, delimiter=',', quotechar='|', quoting=csv.QUOTE_MINIMAL)
+                import ast
+                for row in spamreader:
+                    file_names.append(row[0])
+                    self.data.append(os.path.join(self.directory, row[0]))
+                    test = row[1].replace("array", "")
+                    self.labels.append((ast.literal_eval(test)))
+        self.labels = np.array(self.labels)
+
+        self.labels = np.reshape(self.labels, (-1, 8))
+        logger.debug("Ground Truth Shape: %s", str(self.labels.shape))
+        logger.debug("Data shape %s", str(len(self.data)))
+
+        self.myData = [self.data, self.labels]
+
+
+class SmartDocDirectories(Dataset):
+    '''
+    Walks a SmartDoc directory tree, pairing each frame image with its .gt XML annotation
+    '''
+
+    def __init__(self, directory="data"):
+        super().__init__("smartdoc")
+        self.data = []
+        self.labels = []
+
+        for folder in os.listdir(directory):
+            if (os.path.isdir(directory + "/" + folder)):
+                for file in os.listdir(directory + "/" + folder):
+                    images_dir = directory + "/" + folder + "/" + file
+                    if (os.path.isdir(images_dir)):
+
+                        list_gt = []
+                        tree = ET.parse(images_dir + "/" + file + ".gt")
+                        root = tree.getroot()
+                        for a in root.iter("frame"):
+                            list_gt.append(a)
+
+                        im_no = 0
+                        for image in os.listdir(images_dir):
+                            if image.endswith(".jpg"):
+                                # print(im_no)
+                                im_no += 1
+
+                                # Now we have opened the file and GT. Write code to create multiple files and scale gt
+                                list_of_points = {}
+
+                                # img = cv2.imread(images_dir + "/" + image)
+                                self.data.append(os.path.join(images_dir, image))
+
+                                for point in list_gt[int(float(image[0:-4])) - 1].iter("point"):
+                                    myDict = point.attrib
+
+                                    list_of_points[myDict["name"]] = (
+                                        int(float(myDict['x'])), int(float(myDict['y'])))
+
+                                ground_truth = np.asarray(
+                                    (list_of_points["tl"], list_of_points["tr"], list_of_points["br"],
+                                     list_of_points["bl"]))
+                                ground_truth = utils.sort_gt(ground_truth)
+                                self.labels.append(ground_truth)
+
+        self.labels = np.array(self.labels)
+
+        self.labels = np.reshape(self.labels, (-1, 8))
+        logger.debug("Ground Truth Shape: %s", str(self.labels.shape))
+        logger.debug("Data shape %s", str(len(self.data)))
+
+        self.myData = []
+        for a in range(len(self.data)):
+            self.myData.append([self.data[a], self.labels[a]])
+
+class SelfCollectedDataset(Dataset):
+    '''
+    Self-collected dataset: images with per-image corner coordinates in sidecar .csv files
+    '''
+
+    def __init__(self, directory="data"):
+        super().__init__("smartdoc")
+        self.data = []
+        self.labels = []
+
+        for image in os.listdir(directory):
+            # print (image)
+            if image.endswith("jpg") or image.endswith("JPG"):
+                if os.path.isfile(os.path.join(directory, image + ".csv")):
+                    with open(os.path.join(directory, image + ".csv"), 'r') as csvfile:
+                        spamwriter = csv.reader(csvfile, delimiter=' ',
+                                                quotechar='|', quoting=csv.QUOTE_MINIMAL)
+
+                        img_path = os.path.join(directory, image)
+
+                        gt = []
+                        for row in spamwriter:
+                            gt.append(row)
+                        gt = np.array(gt).astype(np.float32)
+                        ground_truth = utils.sort_gt(gt)
+                        self.labels.append(ground_truth)
+                        self.data.append(img_path)
+
+        self.labels = np.array(self.labels)
+
+        self.labels = np.reshape(self.labels, (-1, 8))
+        logger.debug("Ground Truth Shape: %s", str(self.labels.shape))
+        logger.debug("Data shape %s", str(len(self.data)))
+
+        self.myData = []
+        for a in range(len(self.data)):
+            self.myData.append([self.data[a], self.labels[a]])
+
+
+
+
+class SmartDocCorner(Dataset):
+    '''
+    SmartDoc corner-patch dataset: reads gt.csv files with one corner point per patch
+    '''
+
+    def __init__(self, directory="data"):
+        super().__init__("smartdoc")
+        self.data = []
+        self.labels = []
+        for d in directory:
+            self.directory = d
+            self.train_transform = transforms.Compose([transforms.Resize([32, 32]),
+                                                       transforms.ColorJitter(0.5, 0.5, 0.5, 0.5),
+                                                       transforms.ToTensor()])
+
+            self.test_transform = transforms.Compose([transforms.Resize([32, 32]),
+                                                      transforms.ToTensor()])
+
+            logger.info("Pass train/test data paths here")
+
+            self.classes_list = {}
+
+            file_names = []
+            with open(os.path.join(self.directory, "gt.csv"), 'r') as csvfile:
+                spamreader = csv.reader(csvfile, delimiter=',', quotechar='|', quoting=csv.QUOTE_MINIMAL)
+                import ast
+                for row in spamreader:
+                    file_names.append(row[0])
+                    self.data.append(os.path.join(self.directory, row[0]))
+                    test = row[1].replace("array", "")
+                    self.labels.append((ast.literal_eval(test)))
+        self.labels = np.array(self.labels)
+
+        self.labels = np.reshape(self.labels, (-1, 2))
+        logger.debug("Ground Truth Shape: %s", str(self.labels.shape))
+        logger.debug("Data shape %s", str(len(self.data)))
+
+        self.myData = [self.data, self.labels]

+ 19 - 0
Dewarp/dataprocessor/datasetfactory.py

@@ -0,0 +1,19 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import dataprocessor.dataset as data
+import torchvision
+
+class DatasetFactory:
+    def __init__(self):
+        pass
+
+    @staticmethod
+    def get_dataset(directory, type="document"):
+        if type=="document":
+            return data.SmartDoc(directory)
+        elif type =="corner":
+            return data.SmartDocCorner(directory)
+        elif type=="CIFAR":
+            return torchvision.datasets.CIFAR100(root='./data', train=True, download=True, transform=torchvision.transforms.ToTensor())

+ 21 - 0
Dewarp/dataprocessor/loaderfactory.py

@@ -0,0 +1,21 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+
+
+import dataprocessor.dataloaders as loader
+
+
+class LoaderFactory:
+    def __init__(self):
+        pass
+
+    @staticmethod
+    def get_loader(type, data, transform=None, cuda=False):
+        if type=="hdd":
+            return loader.HddLoader(data, transform=transform,
+                                    cuda=cuda)
+        elif type =="ram":
+            return loader.RamLoader(data, transform=transform,
+                                    cuda=cuda)

+ 24 - 0
Dewarp/dataset_intro.md

@@ -0,0 +1,24 @@
+### Edge-crop augmentation dataset for document images
+
+| **Data object**                                                 | **Tilted** |            **Scene**            | **Notes**                                                               | **Example**                                          |
+|:----------------------------------------------------------------|:----------:|:-------------------------------:|:------------------------------------------------------------------------|------------------------------------------------------|
+| <font color="#006600">Light, all four corners visible</font>    |     No     | Desk, carpet, sofa, chair, etc. | Résumés, receipts, etc. lying on a desk                                 | <img src="test_data/001.jpg" width="64" height="64"> |
+| <font color="#006600">**Dark, all four corners visible**</font> |     No     |                                 | Book covers                                                              |                                                      |
+| <font color="#dd0000">Light, corners incomplete</font>          |     No     |                                 | One pair of corners (top, bottom, left, or right two) outside the image | <img src="test_data/002.jpg" width="64" height="64"> |
+| <font color="#dd0000">Light, corners incomplete</font>          |     No     |                                 | Three corners outside the image                                          | <img src="test_data/003.jpg" width="64" height="64"> |
+| <font color="#dd0000">Light, corners incomplete</font>          |     No     |                                 | All four corners outside the image                                       | <img src="test_data/004.jpg" width="64" height="64"> |
+| <font color="#dd0000">**Dark, corners incomplete**</font>       |     No     |                                 | One pair of corners (top, bottom, left, or right two) outside the image |                                                      |
+| <font color="#dd0000">**Dark, corners incomplete**</font>       |     No     |                                 | Three corners outside the image                                          |                                                      |
+| <font color="#dd0000">**Dark, corners incomplete**</font>       |     No     |                                 | All four corners outside the image                                       |                                                      |
+| <font color="#006600">Light, all four corners visible</font>    | <font color="#150CFF">Yes</font> | |                                                                          |                                                      |
+| <font color="#006600">**Dark, all four corners visible**</font> | <font color="#150CFF">Yes</font> | |                                                                          |                                                      |
+| <font color="#dd0000">Light, corners incomplete</font>          | <font color="#150CFF">Yes</font> | | One corner outside the image                                             | <img src="test_data/005.jpg" width="64" height="64"> |
+| <font color="#dd0000">Light, corners incomplete</font>          | <font color="#150CFF">Yes</font> | | Two corners outside the image                                            | <img src="test_data/006.jpg" width="64" height="64"> |
+| <font color="#dd0000">Light, corners incomplete</font>          | <font color="#150CFF">Yes</font> | | Three corners outside the image                                          | <img src="test_data/007.jpg" width="64" height="64"> |
+| <font color="#dd0000">Light, corners incomplete</font>          | <font color="#150CFF">Yes</font> | | All four corners outside the image                                       | <img src="test_data/008.jpg" width="64" height="64"> |
+| <font color="#dd0000">**Dark, corners incomplete**</font>       | <font color="#150CFF">Yes</font> | | One corner outside the image                                             |                                                      |
+| <font color="#dd0000">**Dark, corners incomplete**</font>       | <font color="#150CFF">Yes</font> | | Two corners outside the image                                            |                                                      |
+| <font color="#dd0000">**Dark, corners incomplete**</font>       | <font color="#150CFF">Yes</font> | | Three corners outside the image                                          |                                                      |
+| <font color="#dd0000">**Dark, corners incomplete**</font>       | <font color="#150CFF">Yes</font> | | All four corners outside the image                                       |                                                      |
+
+

+ 72 - 0
Dewarp/demo.py

@@ -0,0 +1,72 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+import math
+
+import cv2
+import numpy as np
+
+import evaluation
+
+
+def args_processor():
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-i", "--imagePath", default="../058.jpg", help="Path to the document image")
+    parser.add_argument("-o", "--outputPath", default="../output.jpg", help="Path to store the result")
+    parser.add_argument("-rf", "--retainFactor", help="Floating point in range (0,1) specifying retain factor",
+                        default="0.85")
+    parser.add_argument("-cm", "--cornerModel", help="Model for corner point refinement",
+                        default="../cornerModelWell")
+    parser.add_argument("-dm", "--documentModel", help="Model for document corners detection",
+                        default="../documentModelWell")
+    return parser.parse_args()
+
+
+if __name__ == "__main__":
+    args = args_processor()
+
+    corners_extractor = evaluation.corner_extractor.GetCorners(args.documentModel)
+    corner_refiner = evaluation.corner_refiner.corner_finder(args.cornerModel)
+
+    img = cv2.imread(args.imagePath)
+
+    oImg = img
+
+    extracted_corners = corners_extractor.get(oImg)
+    corner_address = []
+    # Refine the detected corners using corner refiner
+    image_name = 0
+    for corner in extracted_corners:
+        image_name += 1
+        corner_img = corner[0]
+        refined_corner = np.array(corner_refiner.get_location(corner_img, 0.85))
+
+        # Converting from local co-ordinate to global co-ordinates of the image
+        refined_corner[0] += corner[1]
+        refined_corner[1] += corner[2]
+
+        # Final results
+        corner_address.append(refined_corner)
+    print(corner_address)
+    width = int(math.sqrt(math.pow(corner_address[1][0]-corner_address[0][0], 2) + math.pow(corner_address[1][1]-corner_address[0][1], 2)))
+    height = int(math.sqrt(math.pow(corner_address[2][0]-corner_address[1][0], 2) + math.pow(corner_address[2][1]-corner_address[1][1], 2)))
+    print(width, height)
+    # if width > height:
+    #     t = width
+    #     width = height
+    #     height = t
+    # print(width, height)
+    pts1 = np.float32([[corner_address[0][0], corner_address[0][1]], [corner_address[1][0], corner_address[1][1]], [corner_address[3][0], corner_address[3][1]], [corner_address[2][0], corner_address[2][1]]])
+    pts2 = np.float32([[0, 0], [width, 0], [0, height], [width, height]])
+    M = cv2.getPerspectiveTransform(pts1, pts2)
+    warped = cv2.warpPerspective(img, M, (width, height))
+    # cv2.imshow('ww', warped)
+    # cv2.waitKey()
+    # cv2.destroyAllWindows()
+    cv2.imwrite(str(args.outputPath).split('.')[0] + '_warped.png', warped)
+
+    for a in range(0, len(extracted_corners)):
+        cv2.line(oImg, tuple(corner_address[a % 4]), tuple(corner_address[(a + 1) % 4]), (255, 0, 0), 4)
+
+    cv2.imwrite(args.outputPath, oImg)

+ 72 - 0
Dewarp/document_data_generator.py

@@ -0,0 +1,72 @@
+import os
+from tqdm import tqdm
+
+import cv2
+import numpy as np
+import utils
+import dataprocessor
+
+def args_processor():
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-i", "--input-dir", help="Path to data files (extract images using video_to_image.py first)")
+    parser.add_argument("-o", "--output-dir", help="Directory to store results")
+    parser.add_argument("--dataset", default="smartdoc", help="'smartdoc' or 'selfcollected' dataset")
+    return parser.parse_args()
+
+
+if __name__ == '__main__':
+        args = args_processor()
+        input_directory = args.input_dir
+        if not os.path.isdir(args.output_dir):
+            os.mkdir(args.output_dir)
+        import csv
+
+
+        # Dataset iterator
+        if args.dataset == "smartdoc":
+            dataset_test = dataprocessor.dataset.SmartDocDirectories(input_directory)
+        elif args.dataset == "selfcollected":
+            dataset_test = dataprocessor.dataset.SelfCollectedDataset(input_directory)
+        else:
+            print("Incorrect dataset type; please choose between smartdoc or selfcollected")
+            assert (False)
+        with open(os.path.join(args.output_dir, 'gt.csv'), 'a', newline='') as csvfile:
+            spamwriter = csv.writer(csvfile, delimiter=',',
+                                    quotechar='|')
+            # Counter for file naming
+            counter = 0
+            for data_elem in tqdm(dataset_test.myData):
+
+                img_path = data_elem[0]
+                target = data_elem[1].reshape((4, 2))
+                img = cv2.imread(img_path)
+
+                if args.dataset == "selfcollected":
+                    target = target / (img.shape[1], img.shape[0])
+                    target = target * (1920, 1920)
+                    img = cv2.resize(img, (1920, 1920))
+
+                corner_cords = target
+
+                for angle in range(0, 271, 90):
+                    img_rotate, gt_rotate = utils.utils.rotate(img, corner_cords, angle)
+                    for random_crop in range(0, 16):
+                        counter += 1
+                        f_name = str(counter).zfill(8)
+
+                        img_crop, gt_crop = utils.utils.random_crop(img_rotate, gt_rotate)
+                        mah_size = img_crop.shape
+                        img_crop = cv2.resize(img_crop, (64, 64))
+                        gt_crop = np.array(gt_crop)
+
+                        # no=0
+                        # for a in range(0,4):
+                        #     no+=1
+                        #     cv2.circle(img_crop, tuple(((gt_crop[a]*64).astype(int))), 2,(255-no*60,no*60,0),9)
+                        # # cv2.imwrite("asda.jpg", img)
+
+                        cv2.imwrite(os.path.join(args.output_dir, f_name+".jpg"), img_crop)
+                        spamwriter.writerow((f_name+".jpg", tuple(list(gt_crop))))
+                        print(tuple(list(gt_crop)))

+ 69 - 0
Dewarp/evaluate.py

@@ -0,0 +1,69 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import argparse
+import time
+
+import numpy as np
+import torch
+from PIL import Image
+
+import dataprocessor
+import evaluation
+
+from utils import utils
+
+parser = argparse.ArgumentParser(description='iCarl2.0')
+
+parser.add_argument("-i", "--data-dir", default="/Users/khurramjaved96/bg5",
+                    help="input Directory of test data")
+
+args = parser.parse_args()
+args.cuda = torch.cuda.is_available()
+if __name__ == '__main__':
+    corners_extractor = evaluation.corner_extractor.GetCorners("../documentModelWell")
+    corner_refiner = evaluation.corner_refiner.corner_finder("../cornerModelWell")
+    test_set_dir = args.data_dir
+    iou_results = []
+    my_results = []
+    dataset_test = dataprocessor.dataset.SmartDocDirectories(test_set_dir)
+    for data_elem in dataset_test.myData:
+
+        img_path = data_elem[0]
+        # print(img_path)
+        target = data_elem[1].reshape((4, 2))
+        img_array = np.array(Image.open(img_path))
+        computation_start_time = time.perf_counter()  # time.clock() was removed in Python 3.8
+        extracted_corners = corners_extractor.get(img_array)
+        temp_time = time.perf_counter()
+        corner_address = []
+        # Refine the detected corners using corner refiner
+        counter=0
+        for corner in extracted_corners:
+            counter+=1
+            corner_img = corner[0]
+            refined_corner = np.array(corner_refiner.get_location(corner_img, 0.85))
+
+            # Converting from local co-ordinate to global co-ordinate of the image
+            refined_corner[0] += corner[1]
+            refined_corner[1] += corner[2]
+
+            # Final results
+            corner_address.append(refined_corner)
+        computation_end_time = time.perf_counter()
+        print("TOTAL TIME : ", computation_end_time - computation_start_time)
+        r2 = utils.intersection_with_corection_smart_doc_implementation(target, np.array(corner_address), img_array)
+        r3 = utils.intersection_with_corection(target, np.array(corner_address), img_array)
+
+        if r3 - r2 > 0.1:
+            print ("Image Name", img_path)
+            print ("Prediction", np.array(corner_address), target)
+            0/0
+        assert (r2 > 0 and r2 < 1)
+        iou_results.append(r2)
+        my_results.append(r3)
+        print("MEAN CORRECTED JI: ", np.mean(np.array(iou_results)))
+        print("MEAN CORRECTED MY: ", np.mean(np.array(my_results)))
+
+    print(np.mean(np.array(iou_results)))

+ 6 - 0
Dewarp/evaluation/__init__.py

@@ -0,0 +1,6 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import evaluation.corner_extractor
+import evaluation.corner_refiner

+ 72 - 0
Dewarp/evaluation/corner_extractor.py

@@ -0,0 +1,72 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import numpy as np
+import torch
+from PIL import Image
+from torchvision import transforms
+
+import model
+
+
+class GetCorners:
+    def __init__(self, checkpoint_dir):
+        self.model = model.ModelFactory.get_model("resnet", 'document')
+        self.model.load_state_dict(torch.load(checkpoint_dir, map_location='cpu'))
+        if torch.cuda.is_available():
+            self.model.cuda()
+        self.model.eval()
+
+    def get(self, pil_image):
+        with torch.no_grad():
+            image_array = np.copy(pil_image)
+            pil_image = Image.fromarray(pil_image)
+            test_transform = transforms.Compose([transforms.Resize([32, 32]),
+                                                 transforms.ToTensor()])
+            img_temp = test_transform(pil_image)
+
+            img_temp = img_temp.unsqueeze(0)
+            if torch.cuda.is_available():
+                img_temp = img_temp.cuda()
+
+            model_prediction = self.model(img_temp).cpu().data.numpy()[0]
+
+            model_prediction = np.array(model_prediction)
+
+            x_cords = model_prediction[[0, 2, 4, 6]]
+            y_cords = model_prediction[[1, 3, 5, 7]]
+
+            x_cords = x_cords * image_array.shape[1]
+            y_cords = y_cords * image_array.shape[0]
+
+            # Extract the four corners of the image. Read "Region Extractor" in Section III of the paper for an explanation.
+
+            top_left = image_array[
+                       max(0, int(2 * y_cords[0] - (y_cords[3] + y_cords[0]) / 2)):int((y_cords[3] + y_cords[0]) / 2),
+                       max(0, int(2 * x_cords[0] - (x_cords[1] + x_cords[0]) / 2)):int((x_cords[1] + x_cords[0]) / 2)]
+
+            top_right = image_array[
+                        max(0, int(2 * y_cords[1] - (y_cords[1] + y_cords[2]) / 2)):int((y_cords[1] + y_cords[2]) / 2),
+                        int((x_cords[1] + x_cords[0]) / 2):min(image_array.shape[1] - 1,
+                                                               int(x_cords[1] + (x_cords[1] - x_cords[0]) / 2))]
+
+            bottom_right = image_array[int((y_cords[1] + y_cords[2]) / 2):min(image_array.shape[0] - 1, int(
+                y_cords[2] + (y_cords[2] - y_cords[1]) / 2)),
+                           int((x_cords[2] + x_cords[3]) / 2):min(image_array.shape[1] - 1,
+                                                                  int(x_cords[2] + (x_cords[2] - x_cords[3]) / 2))]
+
+            bottom_left = image_array[int((y_cords[0] + y_cords[3]) / 2):min(image_array.shape[0] - 1, int(
+                y_cords[3] + (y_cords[3] - y_cords[0]) / 2)),
+                          max(0, int(2 * x_cords[3] - (x_cords[2] + x_cords[3]) / 2)):int(
+                              (x_cords[3] + x_cords[2]) / 2)]
+
+            top_left = (top_left, max(0, int(2 * x_cords[0] - (x_cords[1] + x_cords[0]) / 2)),
+                        max(0, int(2 * y_cords[0] - (y_cords[3] + y_cords[0]) / 2)))
+            top_right = (
+            top_right, int((x_cords[1] + x_cords[0]) / 2), max(0, int(2 * y_cords[1] - (y_cords[1] + y_cords[2]) / 2)))
+            bottom_right = (bottom_right, int((x_cords[2] + x_cords[3]) / 2), int((y_cords[1] + y_cords[2]) / 2))
+            bottom_left = (bottom_left, max(0, int(2 * x_cords[3] - (x_cords[2] + x_cords[3]) / 2)),
+                           int((y_cords[0] + y_cords[3]) / 2))
+
+            return top_left, top_right, bottom_right, bottom_left

+ 84 - 0
Dewarp/evaluation/corner_refiner.py

@@ -0,0 +1,84 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import numpy as np
+import torch
+from PIL import Image
+from torchvision import transforms
+
+import model
+
+
+class corner_finder():
+    def __init__(self, CHECKPOINT_DIR):
+
+        self.model = model.ModelFactory.get_model("resnet", "corner")
+        self.model.load_state_dict(torch.load(CHECKPOINT_DIR, map_location='cpu'))
+        if torch.cuda.is_available():
+            self.model.cuda()
+        self.model.eval()
+
+    def get_location(self, img, retainFactor=0.85):
+        with torch.no_grad():
+            ans_x = 0.0
+            ans_y = 0.0
+
+            o_img = np.copy(img)
+
+            y = [0, 0]
+            x_start = 0
+            y_start = 0
+            up_scale_factor = (img.shape[1], img.shape[0])
+
+            myImage = np.copy(o_img)
+
+            test_transform = transforms.Compose([transforms.Resize([32, 32]),
+                                                 transforms.ToTensor()])
+
+            CROP_FRAC = retainFactor
+            while (myImage.shape[0] > 10 and myImage.shape[1] > 10):
+
+                img_temp = Image.fromarray(myImage)
+                img_temp = test_transform(img_temp)
+                img_temp = img_temp.unsqueeze(0)
+
+                if torch.cuda.is_available():
+                    img_temp = img_temp.cuda()
+                response = self.model(img_temp).cpu().data.numpy()
+                response = response[0]
+
+                response_up = response
+
+                response_up = response_up * up_scale_factor
+                y = response_up + (x_start, y_start)
+                x_loc = int(y[0])
+                y_loc = int(y[1])
+
+                if x_loc > myImage.shape[1] / 2:
+                    start_x = min(x_loc + int(round(myImage.shape[1] * CROP_FRAC / 2)), myImage.shape[1]) - int(round(
+                        myImage.shape[1] * CROP_FRAC))
+                else:
+                    start_x = max(x_loc - int(myImage.shape[1] * CROP_FRAC / 2), 0)
+                if y_loc > myImage.shape[0] / 2:
+                    start_y = min(y_loc + int(myImage.shape[0] * CROP_FRAC / 2), myImage.shape[0]) - int(
+                        myImage.shape[0] * CROP_FRAC)
+                else:
+                    start_y = max(y_loc - int(myImage.shape[0] * CROP_FRAC / 2), 0)
+
+                ans_x += start_x
+                ans_y += start_y
+
+                myImage = myImage[start_y:start_y + int(myImage.shape[0] * CROP_FRAC),
+                          start_x:start_x + int(myImage.shape[1] * CROP_FRAC)]
+                img = img[start_y:start_y + int(img.shape[0] * CROP_FRAC),
+                      start_x:start_x + int(img.shape[1] * CROP_FRAC)]
+                up_scale_factor = (img.shape[1], img.shape[0])
+
+            ans_x += y[0]
+            ans_y += y[1]
+            return (int(round(ans_x)), int(round(ans_y)))
+
+
+if __name__ == "__main__":
+    pass

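Note: get_location repeatedly re-predicts the corner on a crop that keeps retainFactor of the current window around the last prediction, accumulating the crop offsets until the window shrinks below 10 px. A hypothetical usage sketch (the checkpoint path and image file are assumptions, not part of the repo):

    import cv2
    from evaluation.corner_refiner import corner_finder

    refiner = corner_finder("outputs/corner_resnet.pth")  # hypothetical checkpoint
    crop = cv2.imread("corner_crop.jpg")                  # one corner region as a numpy array
    x, y = refiner.get_location(crop, retainFactor=0.85)  # refined corner inside the crop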
+ 1 - 0
Dewarp/experiment/__init__.py

@@ -0,0 +1 @@
+from experiment.experiment import *

+ 53 - 0
Dewarp/experiment/experiment.py

@@ -0,0 +1,53 @@
+''' Incremental-Classifier Learning 
+ Authors : Khurram Javed, Muhammad Talha Paracha
+ Maintainer : Khurram Javed
+ Lab : TUKL-SEECS R&D Lab
+ Email : 14besekjaved@seecs.edu.pk '''
+
+import json
+import os
+import subprocess
+
+
+class experiment:
+    '''
+    Class to store results of any experiment 
+    '''
+
+    def __init__(self, name, args, output_dir="../"):
+        # self.gitHash = subprocess.check_output(['git', 'rev-parse', 'HEAD']).decode("utf-8")
+        # print(self.gitHash)
+        if args is not None:
+            self.name = name
+            self.params = vars(args)
+            self.results = {}
+            self.dir = output_dir
+
+            import datetime
+            now = datetime.datetime.now()
+            rootFolder = str(now.day) + str(now.month) + str(now.year)
+            if not os.path.exists(output_dir + rootFolder):
+                os.makedirs(output_dir + rootFolder)
+            self.name = rootFolder + "/" + self.name
+            ver = 0
+
+            while os.path.exists(output_dir + self.name + "_" + str(ver)):
+                ver += 1
+
+            os.makedirs(output_dir + self.name + "_" + str(ver))
+            self.path = output_dir + self.name + "_" + str(ver) + "/" + name
+
+            self.results["Temp Results"] = [[1, 2, 3, 4], [5, 6, 2, 6]]
+
+    def store_json(self):
+        with open(self.path + "JSONDump.txt", 'w') as outfile:
+            json.dump(json.dumps(self.__dict__), outfile)
+
+
+import argparse
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description='iCarl2.0')
+    args = parser.parse_args()
+    e = experiment("TestExperiment", args)
+    e.store_json()

+ 28 - 0
Dewarp/json_to_csv.py

@@ -0,0 +1,28 @@
+import argparse
+import json
+import os
+
+
+def work(json_fold):
+    json_list = os.listdir(json_fold)
+    for json_path in json_list:
+        path = json_fold + '/' + json_path
+            # Only process .json files
+        if str(path).endswith('.json'):
+            with open(path, "r", encoding="utf-8") as f:
+                content = json.load(f)
+            # Write the labeled points to a CSV file next to the image
+            csv_path = str(path).replace('.json', '.jpg') + '.csv'
+            with open(csv_path, mode='w', newline='') as csv_file:
+                # One "x y" line per labeled point
+                for point in content['shapes']:
+                    line = str(point['points'][0][0]) + ' ' + str(point['points'][0][1]) + '\n'
+                    print(line)
+                    csv_file.write(line)
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser()
+    parser.add_argument('--json_fold', type=str, default='./my_dataset_origin')
+    args = parser.parse_args()
+    work(args.json_fold)

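Note: the script assumes labelme-style JSON where each shape carries a single point; each point becomes one space-separated line in <image>.jpg.csv. An illustrative round trip with hypothetical coordinates:

    content = {"shapes": [{"points": [[12.0, 34.0]]},
                          {"points": [[560.0, 30.0]]},
                          {"points": [[555.0, 780.0]]},
                          {"points": [[10.0, 775.0]]}]}
    for point in content["shapes"]:
        print(str(point["points"][0][0]) + " " + str(point["points"][0][1]))
    # 12.0 34.0
    # 560.0 30.0
    # ...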
+ 1 - 0
Dewarp/model/__init__.py

@@ -0,0 +1 @@
+from model.modelfactory import *

+ 78 - 0
Dewarp/model/cornerModel.py

@@ -0,0 +1,78 @@
+# Reference : Taken from https://github.com/kuangliu/pytorch-cifar
+
+# License
+# MIT License
+#
+# Copyright (c) 2017 liukuang
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in all
+# copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+# SOFTWARE.
+
+
+'''MobileNet in PyTorch.
+See the paper "MobileNets: Efficient Convolutional Neural Networks for Mobile Vision Applications"
+for more details.
+'''
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+
+
+class Block(nn.Module):
+    '''Depthwise conv + Pointwise conv'''
+    def __init__(self, in_planes, out_planes, stride=1):
+        super(Block, self).__init__()
+        self.conv1 = nn.Conv2d(in_planes, in_planes, kernel_size=3, stride=stride, padding=1, groups=in_planes, bias=False)
+        self.bn1 = nn.BatchNorm2d(in_planes)
+        self.conv2 = nn.Conv2d(in_planes, out_planes, kernel_size=1, stride=1, padding=0, bias=False)
+        self.bn2 = nn.BatchNorm2d(out_planes)
+
+    def forward(self, x):
+        out = F.relu(self.bn1(self.conv1(x)))
+        out = F.relu(self.bn2(self.conv2(out)))
+        return out
+
+
+class MobileNet(nn.Module):
+    # (128,2) means conv planes=128, conv stride=2, by default conv stride=1
+    cfg = [64, (128,2), 128, (256,2), 256, (512,2), 512, 512, 512, 512, 512, (1024,2), 1024]
+
+    def __init__(self, num_classes=10):
+        super(MobileNet, self).__init__()
+        self.conv1 = nn.Conv2d(3, 32, kernel_size=3, stride=1, padding=1, bias=False)
+        self.bn1 = nn.BatchNorm2d(32)
+        self.layers = self._make_layers(in_planes=32)
+        self.linear = nn.Linear(1024, num_classes)
+
+    def _make_layers(self, in_planes):
+        layers = []
+        for x in self.cfg:
+            out_planes = x if isinstance(x, int) else x[0]
+            stride = 1 if isinstance(x, int) else x[1]
+            layers.append(Block(in_planes, out_planes, stride))
+            in_planes = out_planes
+        return nn.Sequential(*layers)
+
+    def forward(self, x, pretrain=False):
+        out = F.relu(self.bn1(self.conv1(x)))
+        out = self.layers(out)
+        out = F.avg_pool2d(out, 2)
+        out = out.view(out.size(0), -1)
+        out = self.linear(out)
+        return out
+

+ 37 - 0
Dewarp/model/modelfactory.py

@@ -0,0 +1,37 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import model.resnet32 as resnet
+import model.cornerModel as tm
+import torchvision.models as models
+
+class ModelFactory():
+    def __init__(self):
+        pass
+
+    @staticmethod
+    def get_model(model_type, dataset):
+        if model_type == "resnet":
+            if dataset == 'document':
+                return resnet.resnet20(8)
+            elif dataset == 'corner':
+                return resnet.resnet20(2)
+        if model_type == "resnet8":
+            if dataset == 'document':
+                return resnet.resnet8(8)
+            elif dataset == 'corner':
+                return resnet.resnet8(2)
+        elif model_type == 'shallow':
+            if dataset == 'document':
+                return tm.MobileNet(8)
+            elif dataset == 'corner':
+                return tm.MobileNet(2)
+        elif model_type =="squeeze":
+            if dataset == 'document':
+                return models.squeezenet1_1(True)
+            elif dataset == 'corner':
+                return models.squeezenet1_1(True)
+        else:
+            print("Unsupported model; either implement the model in model/ModelFactory or choose a different model")
+            assert (False)

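Note: as a sanity check, the "document" variants regress 8 values (four x, y corner pairs) and the "corner" variants 2 values (one point); squeezenet1_1(True) above is returned with its 1000-class ImageNet head unchanged. A minimal sketch:

    import torch
    import model

    net = model.ModelFactory.get_model("resnet", "corner")
    out = net(torch.randn(1, 3, 32, 32))
    print(out.shape)  # expected: torch.Size([1, 2])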
+ 37 - 0
Dewarp/model/res_utils.py

@@ -0,0 +1,37 @@
+import torch
+import torch.nn as nn
+
+
+class DownsampleA(nn.Module):
+    def __init__(self, nIn, nOut, stride):
+        super(DownsampleA, self).__init__()
+        assert stride == 2
+        self.avg = nn.AvgPool2d(kernel_size=1, stride=stride)
+
+    def forward(self, x):
+        x = self.avg(x)
+        return torch.cat((x, x.mul(0)), 1)
+
+
+class DownsampleC(nn.Module):
+    def __init__(self, nIn, nOut, stride):
+        super(DownsampleC, self).__init__()
+        assert stride != 1 or nIn != nOut
+        self.conv = nn.Conv2d(nIn, nOut, kernel_size=1, stride=stride, padding=0, bias=False)
+
+    def forward(self, x):
+        x = self.conv(x)
+        return x
+
+
+class DownsampleD(nn.Module):
+    def __init__(self, nIn, nOut, stride):
+        super(DownsampleD, self).__init__()
+        assert stride == 2
+        self.conv = nn.Conv2d(nIn, nOut, kernel_size=2, stride=stride, padding=0, bias=False)
+        self.bn = nn.BatchNorm2d(nOut)
+
+    def forward(self, x):
+        x = self.conv(x)
+        x = self.bn(x)
+        return x

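Note: DownsampleA is the parameter-free "option A" ResNet shortcut: a stride-2, kernel-1 average pool halves the spatial size, and concatenating a zeroed copy of the result doubles the channel count (nOut is implicitly assumed to be 2 * nIn). A quick sketch:

    import torch

    ds = DownsampleA(16, 32, stride=2)
    x = torch.randn(2, 16, 32, 32)
    print(ds(x).shape)  # torch.Size([2, 32, 16, 16])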
+ 184 - 0
Dewarp/model/resnet32.py

@@ -0,0 +1,184 @@
+# This is someone else's implementation of ResNet optimized for CIFAR; I can't seem to find the repository again to reference the work.
+# I will keep on looking.
+import math
+
+import torch.nn as nn
+import torch.nn.functional as F
+from torch.nn import init
+
+from .res_utils import DownsampleA
+
+
+class ResNetBasicblock(nn.Module):
+    """
+    ResNet basicblock (https://github.com/facebook/fb.resnet.torch/blob/master/models/resnet.lua)
+    """
+    expansion = 1
+
+    def __init__(self, inplanes, planes, stride=1, downsample=None):
+        super(ResNetBasicblock, self).__init__()
+
+        self.conv_a = nn.Conv2d(inplanes, planes, kernel_size=3, stride=stride, padding=1, bias=False)
+        self.bn_a = nn.BatchNorm2d(planes)
+
+        self.conv_b = nn.Conv2d(planes, planes, kernel_size=3, stride=1, padding=1, bias=False)
+        self.bn_b = nn.BatchNorm2d(planes)
+
+        self.downsample = downsample
+        self.featureSize = 64
+
+    def forward(self, x):
+        residual = x
+
+        basicblock = self.conv_a(x)
+        basicblock = self.bn_a(basicblock)
+        basicblock = F.relu(basicblock, inplace=True)
+
+        basicblock = self.conv_b(basicblock)
+        basicblock = self.bn_b(basicblock)
+
+        if self.downsample is not None:
+            residual = self.downsample(x)
+
+        return F.relu(residual + basicblock, inplace=True)
+
+
+class CifarResNet(nn.Module):
+    """
+    ResNet optimized for the Cifar Dataset, as specified in
+    https://arxiv.org/abs/1512.03385.pdf
+    """
+
+    def __init__(self, block, depth, num_classes, channels=3):
+        """ Constructor
+        Args:
+          depth: number of layers.
+          num_classes: number of classes
+          base_width: base width
+        """
+        super(CifarResNet, self).__init__()
+
+        self.featureSize = 64
+        # Model type specifies number of layers for CIFAR-10 and CIFAR-100 model
+        assert (depth - 2) % 6 == 0, 'depth should be one of 20, 32, 44, 56, 110'
+        layer_blocks = (depth - 2) // 6
+
+        self.num_classes = num_classes
+
+        self.conv_1_3x3 = nn.Conv2d(channels, 16, kernel_size=3, stride=1, padding=1, bias=False)
+        self.bn_1 = nn.BatchNorm2d(16)
+
+        self.inplanes = 16
+        self.stage_1 = self._make_layer(block, 16, layer_blocks, 1)
+        self.stage_2 = self._make_layer(block, 32, layer_blocks, 2)
+        self.stage_3 = self._make_layer(block, 64, layer_blocks, 2)
+        self.avgpool = nn.AvgPool2d(8)
+        self.fc = nn.Linear(64 * block.expansion, num_classes)
+        self.fc2 = nn.Linear(64 * block.expansion, 100)
+
+        for m in self.modules():
+            if isinstance(m, nn.Conv2d):
+                n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
+                m.weight.data.normal_(0, math.sqrt(2. / n))
+                # m.bias.data.zero_()
+            elif isinstance(m, nn.BatchNorm2d):
+                m.weight.data.fill_(1)
+                m.bias.data.zero_()
+            elif isinstance(m, nn.Linear):
+                init.kaiming_normal_(m.weight)
+                m.bias.data.zero_()
+
+    def _make_layer(self, block, planes, blocks, stride=1):
+        downsample = None
+        if stride != 1 or self.inplanes != planes * block.expansion:
+            downsample = DownsampleA(self.inplanes, planes * block.expansion, stride)
+
+        layers = []
+        layers.append(block(self.inplanes, planes, stride, downsample))
+        self.inplanes = planes * block.expansion
+        for i in range(1, blocks):
+            layers.append(block(self.inplanes, planes))
+
+        return nn.Sequential(*layers)
+
+    def forward(self, x, pretrain=False):
+
+        x = self.conv_1_3x3(x)
+        x = F.relu(self.bn_1(x), inplace=True)
+        x = self.stage_1(x)
+        x = self.stage_2(x)
+        x = self.stage_3(x)
+        x = self.avgpool(x)
+        x = x.view(x.size(0), -1)
+        if pretrain:
+            return self.fc2(x)
+        x = self.fc(x)
+        return x
+
+
+def resnet20(num_classes=10):
+    """Constructs a ResNet-20 model for CIFAR-10 (by default)
+    Args:
+      num_classes (uint): number of classes
+    """
+    model = CifarResNet(ResNetBasicblock, 20, num_classes)
+    return model
+
+
+def resnet8(num_classes=10):
+    """Constructs a ResNet-20 model for CIFAR-10 (by default)
+    Args:
+      num_classes (uint): number of classes
+    """
+    model = CifarResNet(ResNetBasicblock, 8, num_classes, 3)
+    return model
+
+
+def resnet20mnist(num_classes=10):
+    """Constructs a ResNet-20 model for CIFAR-10 (by default)
+    Args:
+      num_classes (uint): number of classes
+    """
+    model = CifarResNet(ResNetBasicblock, 20, num_classes, 1)
+    return model
+
+
+def resnet32mnist(num_classes=10, channels=1):
+    model = CifarResNet(ResNetBasicblock, 32, num_classes, channels)
+    return model
+
+
+def resnet32(num_classes=10):
+    """Constructs a ResNet-32 model for CIFAR-10 (by default)
+    Args:
+      num_classes (uint): number of classes
+    """
+    model = CifarResNet(ResNetBasicblock, 32, num_classes)
+    return model
+
+
+def resnet44(num_classes=10):
+    """Constructs a ResNet-44 model for CIFAR-10 (by default)
+    Args:
+      num_classes (uint): number of classes
+    """
+    model = CifarResNet(ResNetBasicblock, 44, num_classes)
+    return model
+
+
+def resnet56(num_classes=10):
+    """Constructs a ResNet-56 model for CIFAR-10 (by default)
+    Args:
+      num_classes (uint): number of classes
+    """
+    model = CifarResNet(ResNetBasicblock, 56, num_classes)
+    return model
+
+
+def resnet110(num_classes=10):
+    """Constructs a ResNet-110 model for CIFAR-10 (by default)
+    Args:
+      num_classes (uint): number of classes
+    """
+    model = CifarResNet(ResNetBasicblock, 110, num_classes)
+    return model

+ 1 - 0
Dewarp/plotter/__init__.py

@@ -0,0 +1 @@
+from plotter.plotter import *

+ 88 - 0
Dewarp/plotter/plotter.py

@@ -0,0 +1,88 @@
+''' Incremental-Classifier Learning 
+ Authors : Khurram Javed, Muhammad Talha Paracha
+ Maintainer : Khurram Javed
+ Lab : TUKL-SEECS R&D Lab
+ Email : 14besekjaved@seecs.edu.pk '''
+
+import matplotlib
+import matplotlib.pyplot as plt
+
+plt.switch_backend('agg')
+
+MEDIUM_SIZE = 18
+
+font = {'family': 'sans-serif',
+        'weight': 'bold'}
+
+matplotlib.rc('xtick', labelsize=MEDIUM_SIZE)
+matplotlib.rc('ytick', labelsize=MEDIUM_SIZE)
+plt.rc('axes', labelsize=MEDIUM_SIZE)  # fontsize of the x and y labels
+
+# matplotlib.rc('font', **font)
+from matplotlib import rcParams
+
+rcParams.update({'figure.autolayout': True})
+
+
+class Plotter():
+    def __init__(self):
+        import itertools
+        # plt.figure(figsize=(12, 9))
+        self.marker = itertools.cycle(('o', '+', "v", "^", "8", '.', '*'))
+        self.handles = []
+        self.lines = itertools.cycle(('--', '-.', '-', ':'))
+
+    def plot(self, x, y, xLabel="Number of Classes", yLabel="Accuracy %", legend="none", title=None, error=None):
+        self.x = x
+        self.y = y
+        plt.grid(color='0.89', linestyle='--', linewidth=1.0)
+        if error is None:
+            l, = plt.plot(x, y, linestyle=next(self.lines), marker=next(self.marker), label=legend, linewidth=3.0)
+        else:
+            l = plt.errorbar(x, y, yerr=error, capsize=4.0, capthick=2.0, linestyle=next(self.lines),
+                             marker=next(self.marker), label=legend, linewidth=3.0)
+
+        self.handles.append(l)
+        self.x_label = xLabel
+        self.y_label = yLabel
+        if title is not None:
+            plt.title(title)
+
+    def save_fig(self, path, xticks=105, title=None, yStart=0, xRange=0, yRange=10):
+        if title is not None:
+            plt.title(title)
+        plt.legend(handles=self.handles)
+        plt.ylim((yStart, 100 + 0.2))
+        plt.xlim((0, xticks + .2))
+        plt.ylabel(self.y_label)
+        plt.xlabel(self.x_label)
+        plt.yticks(list(range(yStart, 101, yRange)))
+        print(list(range(yStart, 105, yRange)))
+        plt.xticks(list(range(0, xticks + 1, xRange + int(xticks / 10))))
+        plt.savefig(path + ".eps", format='eps')
+        plt.gcf().clear()
+
+    def save_fig2(self, path, xticks=105):
+        plt.legend(handles=self.handles)
+        plt.xlabel("Memory Budget")
+        plt.ylabel("Average Incremental Accuracy")
+        plt.savefig(path + ".jpg")
+        plt.gcf().clear()
+
+    def plotMatrix(self, epoch, path, img):
+
+        plt.imshow(img, cmap='plasma', interpolation='nearest')
+        plt.colorbar()
+        plt.savefig(path + str(epoch) + ".svg", format='svg')
+        plt.gcf().clear()
+
+    def saveImage(self, img, path, epoch):
+        from PIL import Image
+        im = Image.fromarray(img)
+        im.save(path + str(epoch) + ".jpg")
+
+
+if __name__ == "__main__":
+    pl = Plotter()
+    pl.plot([1, 2, 3, 4], [2, 3, 6, 2])
+    pl.save_fig("test.jpg")

+ 10 - 0
Dewarp/pytorch2onnx.py

@@ -0,0 +1,10 @@
+import torch
+import model
+
+
+myModel = model.ModelFactory.get_model('resnet', 'document')
+myModel.load_state_dict(torch.load('outputs/doc552023/doc_0505_0/doc_0505document_resnet.pth'))
+myModel.eval()
+
+dummy_input = torch.randn(1, 3, 32, 32)
+torch.onnx.export(myModel, dummy_input, "document_1.0.0.onnx", do_constant_folding=False)

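Note: a reasonable follow-up, assuming onnxruntime is installed, is to check that the exported graph matches the PyTorch model on the same input; this continues from the variables in the script above:

    import numpy as np
    import onnxruntime as ort

    sess = ort.InferenceSession("document_1.0.0.onnx", providers=["CPUExecutionProvider"])
    feed = {sess.get_inputs()[0].name: dummy_input.numpy().astype(np.float32)}
    onnx_out = sess.run(None, feed)[0]
    torch_out = myModel(dummy_input).detach().numpy()
    print(np.allclose(onnx_out, torch_out, atol=1e-4))  # expected: True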
+ 19 - 0
Dewarp/pytorch2paddle.py

@@ -0,0 +1,19 @@
+import torch
+import numpy as np
+
+# Build the input
+import model
+
+input_data = np.random.rand(1, 3, 32, 32).astype("float32")
+# Get the PyTorch module
+
+myModel = model.ModelFactory.get_model('resnet', 'corner')
+myModel.load_state_dict(torch.load('outputs/corner552023/corner_0505_1/corner_0505corner_resnet.pth'))
+# Switch to eval mode
+myModel.eval()
+# Run the conversion
+from x2paddle.convert import pytorch2paddle
+pytorch2paddle(myModel,
+               save_dir="pd_model_trace1",
+               jit_type="trace",
+               input_examples=[torch.tensor(input_data)])

BIN
Dewarp/results/qualitativeResults.jpg


+ 41 - 0
Dewarp/smartdoc_data_processor/video_to_image.py

@@ -0,0 +1,41 @@
+import os
+
+
+def argsProcessor():
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-d", "--dataPath", help="path to main data folder")
+    parser.add_argument("-o", "--outputPath", help="output data")
+    return parser.parse_args()
+
+
+if __name__ == '__main__':
+    args = argsProcessor()
+    dir = args.dataPath
+    output = args.outputPath
+    print(dir)
+    if not os.path.isdir(output):
+        os.mkdir(output)
+
+    for folder in os.listdir(dir):
+        if os.path.isdir(dir + "/" + folder):
+            dir_temp = dir + '/' + folder + "/"
+            for file in os.listdir(dir_temp):
+                print(file)
+                from subprocess import call
+
+                if file.endswith(".mp4"):
+                    call("mkdir " + output + folder, shell=True)
+                    if os.path.isdir(output + folder + "/" + file):
+                        print("Folder already exist")
+                    else:
+                        call("cd " + output + folder + " && mkdir " + file, shell=True)
+                        call("ls", shell=True)
+
+                        location = dir + "/" + folder + "/" + file
+                        gt_address = "cp " + location[
+                                             0:-4] + ".gt.xml " + output + folder + "/" + file + "/" + file + ".gt"
+                        call(gt_address, shell=True)
+                        command = "ffmpeg -i " + location + " " + output + folder + "/" + file + "/%3d.jpg"
+                        print(command)
+                        call(command, shell=True)

+ 157 - 0
Dewarp/train_model.py

@@ -0,0 +1,157 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+from __future__ import print_function
+
+import argparse
+
+import torch
+import torch.utils.data as td
+
+import dataprocessor
+import experiment as ex
+import model
+import trainer
+import utils
+
+parser = argparse.ArgumentParser(description='Recursive-CNNs')
+parser.add_argument('--batch-size', type=int, default=32, metavar='N',
+                    help='input batch size for training (default: 32)')
+parser.add_argument('--eval_interval', type=int, default=5)
+parser.add_argument('--lr', type=float, default=0.005, metavar='LR',
+                    help='learning rate (default: 0.005)')
+parser.add_argument('--schedule', type=int, nargs='+', default=[10, 20, 30],
+                    help='Decrease learning rate at these epochs.')
+parser.add_argument('--gammas', type=float, nargs='+', default=[0.2, 0.2, 0.2],
+                    help='LR is multiplied by gamma[k] on schedule[k], number of gammas should be equal to schedule')
+parser.add_argument('--momentum', type=float, default=0.9, metavar='M',
+                    help='SGD momentum (default: 0.9)')
+parser.add_argument('--no-cuda', action='store_true', default=False,
+                    help='disables CUDA training')
+parser.add_argument('--pretrain', action='store_true', default=False,
+                    help='Pretrain the model on CIFAR dataset?')
+parser.add_argument('--load-ram', action='store_true', default=False,
+                    help='Load data in ram: TODO : Remove this')
+parser.add_argument('--debug', action='store_true', default=True,
+                    help='Debug messages')
+parser.add_argument('--seed', type=int, default=2323,
+                    help='Seeds values to be used')
+parser.add_argument('--log-interval', type=int, default=5, metavar='N',
+                    help='how many batches to wait before logging training status')
+parser.add_argument('--model-type', default="resnet",
+                    help='model type to be used. Example : resnet32, resnet20, densenet, test')
+parser.add_argument('--name', default="noname",
+                    help='Name of the experiment')
+parser.add_argument('--output-dir', default="./",
+                    help='Directory to store the results; a new folder "DDMMYYYY" will be created '
+                         'in the specified directory to save the results.')
+parser.add_argument('--decay', type=float, default=0.00001, help='Weight decay (L2 penalty).')
+parser.add_argument('--epochs', type=int, default=100, help='Number of epochs for training')
+parser.add_argument('--dataset', default="document", help='Dataset to be used; example document, corner')
+parser.add_argument('--loader', default="hdd", 
+                    help='Loader to load data; hdd for reading from the hdd and ram for loading all data in the memory')
+parser.add_argument("-i", "--data-dirs", nargs='+', default="/Users/khurramjaved96/documentTest64",
+                    help="input Directory of train data")
+parser.add_argument("-v", "--validation-dirs", nargs='+', default="/Users/khurramjaved96/documentTest64",
+                    help="input Directory of val data")
+
+args = parser.parse_args()
+
+# Define an experiment.
+my_experiment = ex.experiment(args.name, args, args.output_dir)
+
+# Add logging support
+logger = utils.utils.setup_logger(my_experiment.path)
+
+args.cuda = not args.no_cuda and torch.cuda.is_available()
+
+dataset = dataprocessor.DatasetFactory.get_dataset(args.data_dirs, args.dataset)
+
+dataset_val = dataprocessor.DatasetFactory.get_dataset(args.validation_dirs, args.dataset)
+
+# Fix the seed.
+seed = args.seed
+torch.manual_seed(seed)
+if args.cuda:
+    torch.cuda.manual_seed(seed)
+
+train_dataset_loader = dataprocessor.LoaderFactory.get_loader(args.loader, dataset.myData,
+                                                              transform=dataset.train_transform,
+                                                              cuda=args.cuda)
+# Loader used for validation data
+val_dataset_loader = dataprocessor.LoaderFactory.get_loader(args.loader, dataset_val.myData,
+                                                            transform=dataset.test_transform,
+                                                            cuda=args.cuda)
+kwargs = {'num_workers': 1, 'pin_memory': True} if args.cuda else {}
+
+# Iterator to iterate over training data.
+train_iterator = torch.utils.data.DataLoader(train_dataset_loader,
+                                             batch_size=args.batch_size, shuffle=True, **kwargs)
+# Iterator to iterate over validation data.
+val_iterator = torch.utils.data.DataLoader(val_dataset_loader,
+                                           batch_size=args.batch_size, shuffle=True, **kwargs)
+
+# Get the required model
+myModel = model.ModelFactory.get_model(args.model_type, args.dataset)
+if args.cuda:
+    myModel.cuda()
+
+# Should I pretrain the model on CIFAR?
+if args.pretrain:
+    trainset = dataprocessor.DatasetFactory.get_dataset(None, "CIFAR")
+    train_iterator_cifar = torch.utils.data.DataLoader(trainset, batch_size=32, shuffle=True, num_workers=2)
+
+    # Define the optimizer used in the experiment
+    cifar_optimizer = torch.optim.SGD(myModel.parameters(), args.lr, momentum=args.momentum,
+                                      weight_decay=args.decay, nesterov=True)
+
+    # Trainer object used for training
+    cifar_trainer = trainer.CIFARTrainer(train_iterator_cifar, myModel, args.cuda, cifar_optimizer)
+
+    for epoch in range(0, 70):
+        logger.info("Epoch : %d", epoch)
+        cifar_trainer.update_lr(epoch, [30, 45, 60], args.gammas)
+        cifar_trainer.train(epoch)
+
+    # Freeze the model
+    counter = 0
+    for name, param in myModel.named_parameters():
+        # Getting the length of total layers so I can freeze x% of layers
+        gen_len = sum(1 for _ in myModel.parameters())
+        if counter < int(gen_len * 0.5):
+            param.requires_grad = False
+            logger.warning(name)
+        else:
+            logger.info(name)
+        counter += 1
+
+# Define the optimizer used in the experiment
+optimizer = torch.optim.SGD(filter(lambda p: p.requires_grad, myModel.parameters()), args.lr,
+                            momentum=args.momentum,
+                            weight_decay=args.decay, nesterov=True)
+
+# Trainer object used for training
+my_trainer = trainer.Trainer(train_iterator, myModel, args.cuda, optimizer)
+
+# Evaluator
+my_eval = trainer.EvaluatorFactory.get_evaluator("rmse", args.cuda)
+# Run the training epochs
+cnt = 1
+best_loss = 100
+for epoch in range(0, args.epochs):
+    logger.info("Epoch : %d", epoch)
+    my_trainer.update_lr(epoch, args.schedule, args.gammas)
+    l = my_trainer.train(epoch)
+    loss = float(l)
+    if loss < best_loss:
+        torch.save(myModel.state_dict(), my_experiment.path + "_" + args.dataset + "_" + args.model_type + "_best.pth")
+        logger.info("best model saved, avg_loss is %s", l)
+        best_loss = loss
+    logger.info("best avg_loss so far is %s", best_loss)
+    if cnt % args.eval_interval == 0:
+        my_eval.evaluate(my_trainer.model, val_iterator)
+    cnt += 1
+torch.save(myModel.state_dict(), my_experiment.path + "_" + args.dataset + "_" + args.model_type+ "_final.pth")
+# torch.save(myModel, my_experiment.path + args.dataset + "_" + args.model_type+ ".pth")
+my_experiment.store_json()

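Note: for reference, a typical invocation (all paths hypothetical) looks like: python train_model.py --name corner_exp --dataset corner --loader ram -i ./datasets/train -v ./datasets/val --output-dir ./outputs/ ; the best checkpoint is then written inside the dated experiment folder with the _best.pth suffix.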
+ 149 - 0
Dewarp/train_seg_model.py

@@ -0,0 +1,149 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+from __future__ import print_function
+
+import argparse
+
+import torch
+import torch.utils.data as td
+
+import dataprocessor
+import experiment as ex
+import model
+import trainer
+import utils
+
+parser = argparse.ArgumentParser(description='Recursive-CNNs')
+parser.add_argument('--batch-size', type=int, default=32, metavar='N',
+                    help='input batch size for training (default: 32)')
+parser.add_argument('--lr', type=float, default=0.005, metavar='LR',
+                    help='learning rate (default: 0.005)')
+parser.add_argument('--schedule', type=int, nargs='+', default=[10, 20, 30],
+                    help='Decrease learning rate at these epochs.')
+parser.add_argument('--gammas', type=float, nargs='+', default=[0.2, 0.2, 0.2],
+                    help='LR is multiplied by gamma on schedule, number of gammas should be equal to schedule')
+parser.add_argument('--momentum', type=float, default=0.9, metavar='M',
+                    help='SGD momentum (default: 0.9)')
+parser.add_argument('--no-cuda', action='store_true', default=False,
+                    help='disables CUDA training')
+parser.add_argument('--pretrain', action='store_true', default=False,
+                    help='Pretrain the model on CIFAR dataset?')
+parser.add_argument('--load-ram', action='store_true', default=False,
+                    help='Load data in ram')
+parser.add_argument('--debug', action='store_true', default=True,
+                    help='Debug messages')
+parser.add_argument('--seed', type=int, default=2323,
+                    help='Seeds values to be used')
+parser.add_argument('--log-interval', type=int, default=5, metavar='N',
+                    help='how many batches to wait before logging training status')
+parser.add_argument('--model-type', default="resnet",
+                    help='model type to be used. Example : resnet32, resnet20, densenet, test')
+parser.add_argument('--name', default="noname",
+                    help='Name of the experiment')
+parser.add_argument('--output-dir', default="../",
+                    help='Directory to store the results; a new folder "DDMMYYYY" will be created '
+                         'in the specified directory to save the results.')
+parser.add_argument('--decay', type=float, default=0.00001, help='Weight decay (L2 penalty).')
+parser.add_argument('--epochs', type=int, default=40, help='Number of epochs for training')
+parser.add_argument('--dataset', default="document", help='Dataset to be used; example document, corner')
+parser.add_argument('--loader', default="hdd",
+                    help='Loader to load data; hdd for reading from the hdd and ram for loading all data in the memory')
+parser.add_argument("-i", "--data-dirs", nargs='+', default="/Users/khurramjaved96/documentTest64",
+                    help="input Directory of train data")
+parser.add_argument("-v", "--validation-dirs", nargs='+', default="/Users/khurramjaved96/documentTest64",
+                    help="input Directory of val data")
+
+args = parser.parse_args()
+
+# Define an experiment.
+my_experiment = ex.experiment(args.name, args, args.output_dir)
+
+# Add logging support
+logger = utils.utils.setup_logger(my_experiment.path)
+
+args.cuda = not args.no_cuda and torch.cuda.is_available()
+
+dataset = dataprocessor.DatasetFactory.get_dataset(args.data_dirs, args.dataset)
+
+dataset_val = dataprocessor.DatasetFactory.get_dataset(args.validation_dirs, args.dataset)
+
+# Fix the seed.
+seed = args.seed
+torch.manual_seed(seed)
+if args.cuda:
+    torch.cuda.manual_seed(seed)
+
+train_dataset_loader = dataprocessor.LoaderFactory.get_loader(args.loader, dataset.myData,
+                                                              transform=dataset.train_transform,
+                                                              cuda=args.cuda)
+# Loader used for validation data
+val_dataset_loader = dataprocessor.LoaderFactory.get_loader(args.loader, dataset_val.myData,
+                                                            transform=dataset.test_transform,
+                                                            cuda=args.cuda)
+kwargs = {'num_workers': 1, 'pin_memory': True} if args.cuda else {}
+
+# Iterator to iterate over training data.
+train_iterator = torch.utils.data.DataLoader(train_dataset_loader,
+                                             batch_size=args.batch_size, shuffle=True, **kwargs)
+# Iterator to iterate over validation data.
+val_iterator = torch.utils.data.DataLoader(val_dataset_loader,
+                                           batch_size=args.batch_size, shuffle=True, **kwargs)
+
+# Get the required model
+myModel = model.ModelFactory.get_model(args.model_type, args.dataset)
+if args.cuda:
+    myModel.cuda()
+
+# Should I pretrain the model on CIFAR?
+if args.pretrain:
+    trainset = dataprocessor.DatasetFactory.get_dataset(None, "CIFAR")
+    train_iterator_cifar = torch.utils.data.DataLoader(trainset, batch_size=32, shuffle=True, num_workers=2)
+
+    # Define the optimizer used in the experiment
+    cifar_optimizer = torch.optim.SGD(myModel.parameters(), args.lr, momentum=args.momentum,
+                                      weight_decay=args.decay, nesterov=True)
+
+    # Trainer object used for training
+    cifar_trainer = trainer.CIFARTrainer(train_iterator_cifar, myModel, args.cuda, cifar_optimizer)
+
+    for epoch in range(0, 70):
+        logger.info("Epoch : %d", epoch)
+        cifar_trainer.update_lr(epoch, [30, 45, 60], args.gammas)
+        cifar_trainer.train(epoch)
+
+    # Freeze the model
+    counter = 0
+    for name, param in myModel.named_parameters():
+        # Getting the length of total layers so I can freeze x% of layers
+        gen_len = sum(1 for _ in myModel.parameters())
+        if counter < int(gen_len * 0.5):
+            param.requires_grad = False
+            logger.warning(name)
+        else:
+            logger.info(name)
+        counter += 1
+
+# Define the optimizer used in the experiment
+optimizer = torch.optim.SGD(filter(lambda p: p.requires_grad, myModel.parameters()), args.lr,
+                            momentum=args.momentum,
+                            weight_decay=args.decay, nesterov=True)
+
+# Trainer object used for training
+my_trainer = trainer.Trainer(train_iterator, myModel, args.cuda, optimizer)
+
+# Evaluator
+my_eval = trainer.EvaluatorFactory.get_evaluator("rmse", args.cuda)
+# Run the training epochs
+for epoch in range(0, args.epochs):
+    logger.info("Epoch : %d", epoch)
+    my_trainer.update_lr(epoch, args.schedule, args.gammas)
+    my_trainer.train(epoch)
+    my_eval.evaluate(my_trainer.model, val_iterator)
+
+torch.save(myModel.state_dict(), my_experiment.path + args.dataset + "_" + args.model_type+ ".pb")
+my_experiment.store_json()

+ 2 - 0
Dewarp/trainer/__init__.py

@@ -0,0 +1,2 @@
+from trainer.evaluator import *
+from trainer.trainer import *

+ 63 - 0
Dewarp/trainer/evaluator.py

@@ -0,0 +1,63 @@
+''' Incremental-Classifier Learning 
+ Authors : Khurram Javed, Muhammad Talha Paracha
+ Maintainer : Khurram Javed
+ Lab : TUKL-SEECS R&D Lab
+ Email : 14besekjaved@seecs.edu.pk '''
+
+import logging
+
+import numpy as np
+import torch
+import torch.nn.functional as F
+from torch.autograd import Variable
+from tqdm import tqdm
+
+logger = logging.getLogger('iCARL')
+
+
+class EvaluatorFactory():
+    '''
+    This class is used to get different versions of evaluators
+    '''
+    def __init__(self):
+        pass
+
+    @staticmethod
+    def get_evaluator(testType="rmse", cuda=True):
+        if testType == "rmse":
+            return DocumentMseEvaluator(cuda)
+
+
+
+class DocumentMseEvaluator():
+    '''
+    Evaluator for document corner regression (RMSE)
+    '''
+    def __init__(self, cuda):
+        self.cuda = cuda
+
+
+    def evaluate(self, model, iterator):
+        model.eval()
+        lossAvg = None
+        with torch.no_grad():
+            for img, target in tqdm(iterator):
+                if self.cuda:
+                    img, target = img.cuda(), target.cuda()
+
+                response = model(Variable(img))
+                # print (response[0])
+                # print (target[0])
+                loss = F.mse_loss(response, Variable(target.float()))
+                loss = torch.sqrt(loss)
+                if lossAvg is None:
+                    lossAvg = loss
+                else:
+                    lossAvg += loss
+                # logger.debug("Cur loss %s", str(loss))
+
+        lossAvg /= len(iterator)
+        logger.info("Avg Val Loss %s", str((lossAvg).cpu().data.numpy()))
+
+

+ 111 - 0
Dewarp/trainer/trainer.py

@@ -0,0 +1,111 @@
+''' Pytorch Recursive CNN Trainer
+ Authors : Khurram Javed
+ Maintainer : Khurram Javed
+ Lab : TUKL-SEECS R&D Lab
+ Email : 14besekjaved@seecs.edu.pk '''
+
+from __future__ import print_function
+
+import logging
+
+from torch.autograd import Variable
+
+logger = logging.getLogger('iCARL')
+import torch.nn.functional as F
+import torch
+from tqdm import tqdm
+
+
+class GenericTrainer:
+    '''
+    Base class for trainer; to implement a new training routine, inherit from this. 
+    '''
+
+    def __init__(self):
+        pass
+
+
+
+class Trainer(GenericTrainer):
+    def __init__(self, train_iterator, model, cuda, optimizer):
+        super().__init__()
+        self.cuda = cuda
+        self.train_iterator = train_iterator
+        self.model = model
+        self.optimizer = optimizer
+
+    def update_lr(self, epoch, schedule, gammas):
+        for temp in range(0, len(schedule)):
+            if schedule[temp] == epoch:
+                for param_group in self.optimizer.param_groups:
+                    self.current_lr = param_group['lr']
+                    param_group['lr'] = self.current_lr * gammas[temp]
+                    logger.debug("Changing learning rate from %0.9f to %0.9f", self.current_lr,
+                                 self.current_lr * gammas[temp])
+                    self.current_lr *= gammas[temp]
+
+    def train(self, epoch):
+        self.model.train()
+        lossAvg = None
+        for img, target in tqdm(self.train_iterator):
+            if self.cuda:
+                img, target = img.cuda(), target.cuda()
+            self.optimizer.zero_grad()
+            response = self.model(Variable(img))
+            # print (response[0])
+            # print (target[0])
+            loss = F.mse_loss(response, Variable(target.float()))
+            loss = torch.sqrt(loss)
+            if lossAvg is None:
+                lossAvg = loss
+            else:
+                lossAvg += loss
+            # logger.debug("Cur loss %s", str(loss))
+            loss.backward()
+            self.optimizer.step()
+
+        lossAvg /= len(self.train_iterator)
+        logger.info("Avg Loss %s", str((lossAvg).cpu().data.numpy()))
+        return str((lossAvg).cpu().data.numpy())
+
+
+class CIFARTrainer(GenericTrainer):
+    def __init__(self, train_iterator, model, cuda, optimizer):
+        super().__init__()
+        self.cuda = cuda
+        self.train_iterator = train_iterator
+        self.model = model
+        self.optimizer = optimizer
+        self.criterion = torch.nn.CrossEntropyLoss()
+
+    def update_lr(self, epoch, schedule, gammas):
+        for temp in range(0, len(schedule)):
+            if schedule[temp] == epoch:
+                for param_group in self.optimizer.param_groups:
+                    self.current_lr = param_group['lr']
+                    param_group['lr'] = self.current_lr * gammas[temp]
+                    logger.debug("Changing learning rate from %0.9f to %0.9f", self.current_lr,
+                                 self.current_lr * gammas[temp])
+                    self.current_lr *= gammas[temp]
+
+    def train(self, epoch):
+        self.model.train()
+        train_loss = 0
+        correct = 0
+        total = 0
+        for inputs, targets in tqdm(self.train_iterator):
+            if self.cuda:
+                inputs, targets = inputs.cuda(), targets.cuda()
+            self.optimizer.zero_grad()
+            outputs = self.model(Variable(inputs), pretrain=True)
+            loss = self.criterion(outputs, Variable(targets))
+            loss.backward()
+            self.optimizer.step()
+
+            train_loss += loss.item()
+            _, predicted = outputs.max(1)
+            total += targets.size(0)
+            correct += predicted.eq(targets).sum().item()
+
+        logger.info("Accuracy : %s", str((correct * 100) / total))
+        return correct / total

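Note: to make the schedule concrete, update_lr multiplies the current learning rate by gammas[k] when epoch equals schedule[k]; with the training defaults (lr 0.005, schedule [10, 20, 30], gammas [0.2, 0.2, 0.2]) the rate steps down to 1e-3, 2e-4 and finally 4e-5. A standalone sketch of the same arithmetic:

    lr = 0.005
    schedule, gammas = [10, 20, 30], [0.2, 0.2, 0.2]
    for epoch in range(40):
        for k, s in enumerate(schedule):
            if s == epoch:
                lr *= gammas[k]
    print(lr)  # ~4e-05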
+ 2 - 0
Dewarp/utils/__init__.py

@@ -0,0 +1,2 @@
+from utils import utils
+from utils import colorer

+ 114 - 0
Dewarp/utils/colorer.py

@@ -0,0 +1,114 @@
+#!/usr/bin/env python
+# encoding: utf-8
+import logging
+
+# Source : # http://stackoverflow.com/questions/384076/how-can-i-color-python-logging-output
+
+# now we patch Python code to add color support to logging.StreamHandler
+def add_coloring_to_emit_windows(fn):
+    # add methods we need to the class
+    def _out_handle(self):
+        import ctypes
+        return ctypes.windll.kernel32.GetStdHandle(self.STD_OUTPUT_HANDLE)
+
+    out_handle = property(_out_handle)
+
+    def _set_color(self, code):
+        import ctypes
+        # Constants from the Windows API
+        self.STD_OUTPUT_HANDLE = -11
+        hdl = ctypes.windll.kernel32.GetStdHandle(self.STD_OUTPUT_HANDLE)
+        ctypes.windll.kernel32.SetConsoleTextAttribute(hdl, code)
+
+    setattr(logging.StreamHandler, '_set_color', _set_color)
+
+    def new(*args):
+        FOREGROUND_BLUE = 0x0001  # text color contains blue.
+        FOREGROUND_GREEN = 0x0002  # text color contains green.
+        FOREGROUND_RED = 0x0004  # text color contains red.
+        FOREGROUND_INTENSITY = 0x0008  # text color is intensified.
+        FOREGROUND_WHITE = FOREGROUND_BLUE | FOREGROUND_GREEN | FOREGROUND_RED
+        # winbase.h
+        STD_INPUT_HANDLE = -10
+        STD_OUTPUT_HANDLE = -11
+        STD_ERROR_HANDLE = -12
+
+        # wincon.h
+        FOREGROUND_BLACK = 0x0000
+        FOREGROUND_BLUE = 0x0001
+        FOREGROUND_GREEN = 0x0002
+        FOREGROUND_CYAN = 0x0003
+        FOREGROUND_RED = 0x0004
+        FOREGROUND_MAGENTA = 0x0005
+        FOREGROUND_YELLOW = 0x0006
+        FOREGROUND_GREY = 0x0007
+        FOREGROUND_INTENSITY = 0x0008  # foreground color is intensified.
+
+        BACKGROUND_BLACK = 0x0000
+        BACKGROUND_BLUE = 0x0010
+        BACKGROUND_GREEN = 0x0020
+        BACKGROUND_CYAN = 0x0030
+        BACKGROUND_RED = 0x0040
+        BACKGROUND_MAGENTA = 0x0050
+        BACKGROUND_YELLOW = 0x0060
+        BACKGROUND_GREY = 0x0070
+        BACKGROUND_INTENSITY = 0x0080  # background color is intensified.
+
+        levelno = args[1].levelno
+        if (levelno >= 50):
+            color = BACKGROUND_YELLOW | FOREGROUND_RED | FOREGROUND_INTENSITY | BACKGROUND_INTENSITY
+        elif (levelno >= 40):
+            color = FOREGROUND_RED | FOREGROUND_INTENSITY
+        elif (levelno >= 30):
+            color = FOREGROUND_YELLOW | FOREGROUND_INTENSITY
+        elif (levelno >= 20):
+            color = FOREGROUND_GREEN
+        elif (levelno >= 10):
+            color = FOREGROUND_MAGENTA
+        else:
+            color = FOREGROUND_WHITE
+        args[0]._set_color(color)
+
+        ret = fn(*args)
+        args[0]._set_color(FOREGROUND_WHITE)
+        # print "after"
+        return ret
+
+    return new
+
+
+def add_coloring_to_emit_ansi(fn):
+    # add methods we need to the class
+    def new(*args):
+        levelno = args[1].levelno
+        if (levelno >= 50):
+            color = '\x1b[31m'  # red
+        elif (levelno >= 40):
+            color = '\x1b[31m'  # red
+        elif (levelno >= 30):
+            color = '\x1b[33m'  # yellow
+        elif (levelno >= 20):
+            color = '\x1b[32m'  # green
+        elif (levelno >= 10):
+            color = '\x1b[35m'  # pink
+        else:
+            color = '\x1b[0m'  # normal
+        args[1].msg = color + args[1].msg + '\x1b[0m'  # normal
+        # print "after"
+        return fn(*args)
+
+    return new
+
+
+import platform
+
+if platform.system() == 'Windows':
+    # Windows does not support ANSI escapes and we are using API calls to set the console color
+    logging.StreamHandler.emit = add_coloring_to_emit_windows(logging.StreamHandler.emit)
+else:
+    # all non-Windows platforms are supporting ANSI escapes so we use them
+    logging.StreamHandler.emit = add_coloring_to_emit_ansi(logging.StreamHandler.emit)
+    # log = logging.getLogger()
+    # log.addFilter(log_filter())
+    # //hdlr = logging.StreamHandler()
+    # //hdlr.setFormatter(formatter())

+ 296 - 0
Dewarp/utils/utils.py

@@ -0,0 +1,296 @@
+''' Document Localization using Recursive CNN
+ Maintainer : Khurram Javed
+ Email : kjaved@ualberta.ca '''
+
+import random
+
+import cv2
+import numpy as np
+import Polygon
+
+def unison_shuffled_copies(a, b):
+    assert len(a) == len(b)
+    p = np.random.permutation(len(a))
+    return a[p], b[p]
+
+
+def intersection(a, b, img):
+    img1 = np.zeros_like(img)
+
+    cv2.fillConvexPoly(img1, a, (255, 0, 0))
+    img1 = np.sum(img1, axis=2)
+
+    img1 = img1 / 255
+
+    img2 = np.zeros_like(img)
+    cv2.fillConvexPoly(img2, b, (255, 0, 0))
+    img2 = np.sum(img2, axis=2)
+    img2 = img2 / 255
+
+    inte = img1 * img2
+    union = np.logical_or(img1, img2)
+    iou = np.sum(inte) / np.sum(union)
+    print(iou)
+    return iou
+
+
+def intersection_with_correction(a, b, img):
+    img1 = np.zeros_like(img)
+    cv2.fillConvexPoly(img1, a, (255, 0, 0))
+
+    img2 = np.zeros_like(img)
+    cv2.fillConvexPoly(img2, b, (255, 0, 0))
+    min_x = min(a[0][0], a[1][0], a[2][0], a[3][0])
+    min_y = min(a[0][1], a[1][1], a[2][1], a[3][1])
+    max_x = max(a[0][0], a[1][0], a[2][0], a[3][0])
+    max_y = max(a[0][1], a[1][1], a[2][1], a[3][1])
+
+    dst = np.array(((min_x, min_y), (max_x, min_y), (max_x, max_y), (min_x, max_y)))
+    mat = cv2.getPerspectiveTransform(a.astype(np.float32), dst.astype(np.float32))
+    # cv2.warpPerspective expects dsize as (width, height)
+    img1 = cv2.warpPerspective(img1, mat, (img.shape[1], img.shape[0]))
+    img2 = cv2.warpPerspective(img2, mat, (img.shape[1], img.shape[0]))
+
+    img1 = np.sum(img1, axis=2)
+    img1 = img1 / 255
+    img2 = np.sum(img2, axis=2)
+    img2 = img2 / 255
+
+    inte = img1 * img2
+    union = np.logical_or(img1, img2)
+    iou = np.sum(inte) / np.sum(union)
+    return iou
+
+def intersection_with_correction_smart_doc_implementation(gt, prediction, img):
+
+    # Reference : https://github.com/jchazalon/smartdoc15-ch1-eval
+
+    gt = sort_gt(gt)
+    prediction = sort_gt(prediction)
+    img1 = np.zeros_like(img)
+    cv2.fillConvexPoly(img1, gt, (255, 0, 0))
+
+    target_width = 2100
+    target_height = 2970
+    # Referential: (0,0) at TL, x > 0 toward right and y > 0 toward bottom
+    # Corner order: TL, BL, BR, TR
+    # object_coord_target = np.float32([[0, 0], [0, target_height], [target_width, target_height], [target_width, 0]])
+    object_coord_target = np.array(np.float32([[0, 0], [target_width, 0], [target_width, target_height],[0, target_height]]))
+    # print (gt, object_coord_target)
+    H = cv2.getPerspectiveTransform(gt.astype(np.float32).reshape(-1, 1, 2), object_coord_target.reshape(-1, 1, 2))
+
+    # 2/ Apply to test result to project in target referential
+    test_coords = cv2.perspectiveTransform(prediction.astype(np.float32).reshape(-1, 1, 2), H)
+
+    # 3/ Compute intersection between target region and test result region
+    # poly = Polygon.Polygon([(0,0),(1,0),(0,1)])
+    poly_target = Polygon.Polygon(object_coord_target.reshape(-1, 2))
+    poly_test = Polygon.Polygon(test_coords.reshape(-1, 2))
+    poly_inter = poly_target & poly_test
+
+    area_target = poly_target.area()
+    area_test = poly_test.area()
+    area_inter = poly_inter.area()
+
+    area_union = area_test + area_target - area_inter
+    # Little hack to cope with float precision issues when dealing with polygons:
+    #   If intersection area is close enough to target area or GT area, but slightly >,
+    #   then fix it, assuming it is due to rounding issues.
+    area_min = min(area_target, area_test)
+    if area_min < area_inter and area_min * 1.0000000001 > area_inter:
+        area_inter = area_min
+        print("Capping area_inter.")
+
+    jaccard_index = area_inter / area_union
+    return jaccard_index
+
+
+
+def __rotateImage(image, angle):
+    rot_mat = cv2.getRotationMatrix2D((image.shape[1] / 2, image.shape[0] / 2), angle, 1)
+    result = cv2.warpAffine(image, rot_mat, (image.shape[1], image.shape[0]), flags=cv2.INTER_LINEAR)
+    return result, rot_mat
+
+
+def rotate(img, gt, angle):
+    img, mat = __rotateImage(img, angle)
+    gt = gt.astype(np.float64)
+    for a in range(0, 4):
+        gt[a] = np.dot(mat[..., 0:2], gt[a]) + mat[..., 2]
+    return img, gt
+
+
+def random_crop(img, gt):
+    ptr1 = (min(gt[0][0], gt[1][0], gt[2][0], gt[3][0]),
+            min(gt[0][1], gt[1][1], gt[2][1], gt[3][1]))
+
+    ptr2 = ((max(gt[0][0], gt[1][0], gt[2][0], gt[3][0]),
+             max(gt[0][1], gt[1][1], gt[2][1], gt[3][1])))
+
+    start_x = np.random.randint(0, int(max(ptr1[0] - 1, 1)))
+    start_y = np.random.randint(0, int(max(ptr1[1] - 1, 1)))
+
+    end_x = np.random.randint(int(min(ptr2[0] + 1, img.shape[1] - 1)), img.shape[1])
+    end_y = np.random.randint(int(min(ptr2[1] + 1, img.shape[0] - 1)), img.shape[0])
+
+    img = img[start_y:end_y, start_x:end_x]
+
+    myGt = gt - (start_x, start_y)
+    myGt = myGt * (1.0 / img.shape[1], 1.0 / img.shape[0])
+
+    myGtTemp = myGt * myGt
+    sum_array = myGtTemp.sum(axis=1)
+    tl_index = np.argmin(sum_array)
+    tl = myGt[tl_index]
+    tr = myGt[(tl_index + 1) % 4]
+    br = myGt[(tl_index + 2) % 4]
+    bl = myGt[(tl_index + 3) % 4]
+
+    return img, (tl, tr, br, bl)
+
+
+def get_corners(img, gt):
+    gt = gt.astype(int)
+    list_of_points = {}
+    myGt = gt
+
+    myGtTemp = myGt * myGt
+    sum_array = myGtTemp.sum(axis=1)
+
+    tl_index = np.argmin(sum_array)
+    tl = myGt[tl_index]
+    tr = myGt[(tl_index + 1) % 4]
+    br = myGt[(tl_index + 2) % 4]
+    bl = myGt[(tl_index + 3) % 4]
+
+    list_of_points["tr"] = tr
+    list_of_points["tl"] = tl
+    list_of_points["br"] = br
+    list_of_points["bl"] = bl
+    gt_list = []
+    images_list = []
+    for k, v in list_of_points.items():
+
+        if (k == "tl"):
+            cords_x = __get_cords(v[0], 0, list_of_points["tr"][0], buf=10, size=abs(list_of_points["tr"][0] - v[0]))
+            cords_y = __get_cords(v[1], 0, list_of_points["bl"][1], buf=10, size=abs(list_of_points["bl"][1] - v[1]))
+            # print cords_y, cords_x
+            gt = (v[0] - cords_x[0], v[1] - cords_y[0])
+
+            cut_image = img[cords_y[0]:cords_y[1], cords_x[0]:cords_x[1]]
+
+        if (k == "tr"):
+            cords_x = __get_cords(v[0], list_of_points["tl"][0], img.shape[1], buf=10,
+                                  size=abs(list_of_points["tl"][0] - v[0]))
+            cords_y = __get_cords(v[1], 0, list_of_points["br"][1], buf=10, size=abs(list_of_points["br"][1] - v[1]))
+            # print cords_y, cords_x
+            gt = (v[0] - cords_x[0], v[1] - cords_y[0])
+
+            cut_image = img[cords_y[0]:cords_y[1], cords_x[0]:cords_x[1]]
+
+        if (k == "bl"):
+            cords_x = __get_cords(v[0], 0, list_of_points["br"][0], buf=10,
+                                  size=abs(list_of_points["br"][0] - v[0]))
+            cords_y = __get_cords(v[1], list_of_points["tl"][1], img.shape[0], buf=10,
+                                  size=abs(list_of_points["tl"][1] - v[1]))
+            # print cords_y, cords_x
+            gt = (v[0] - cords_x[0], v[1] - cords_y[0])
+
+            cut_image = img[cords_y[0]:cords_y[1], cords_x[0]:cords_x[1]]
+
+        if (k == "br"):
+            cords_x = __get_cords(v[0], list_of_points["bl"][0], img.shape[1], buf=10,
+                                  size=abs(list_of_points["bl"][0] - v[0]))
+            cords_y = __get_cords(v[1], list_of_points["tr"][1], img.shape[0], buf=10,
+                                  size=abs(list_of_points["tr"][1] - v[1]))
+            # print cords_y, cords_x
+            gt = (v[0] - cords_x[0], v[1] - cords_y[0])
+
+            cut_image = img[cords_y[0]:cords_y[1], cords_x[0]:cords_x[1]]
+
+        # cv2.circle(cut_image, gt, 2, (255, 0, 0), 6)
+        mah_size = cut_image.shape
+        cut_image = cv2.resize(cut_image, (300, 300))
+        a = int(gt[0] * 300 / mah_size[1])
+        b = int(gt[1] * 300 / mah_size[0])
+        images_list.append(cut_image)
+        gt_list.append((a, b))
+    return images_list, gt_list
+
+
+def __get_cords(cord, min_start, max_end, size=299, buf=5, random_scale=True):
+    # size = max(abs(cord-min_start), abs(cord-max_end))
+    iter = 0
+    if (random_scale):
+        size /= random.randint(1, 4)
+    while (max_end - min_start) < size:
+        size = size * .9
+    temp = -1
+    while (temp < 1):
+        temp = random.normalvariate(size / 2, size / 6)
+    x_start = max(cord - temp, min_start)
+    x_start = int(x_start)
+    if x_start >= cord:
+        print("XSTART AND CORD", x_start, cord)
+    # assert (x_start < cord)
+    while ((x_start < min_start) or (x_start + size > max_end) or (x_start + size <= cord)):
+        # x_start = random.randint(int(min(max(min_start, int(cord - size + buf)), cord - buf - 1)), cord - buf)
+        temp = -1
+        while (temp < 1):
+            temp = random.normalvariate(size / 2, size / 6)
+        temp = max(temp, 1)
+        x_start = max(cord - temp, min_start)
+        x_start = int(x_start)
+        size = size * .995
+        iter += 1
+        if (iter == 1000):
+            x_start = int(cord - (size / 2))
+            print("Gets here")
+            break
+    assert (x_start >= 0)
+    if x_start >= cord:
+        print("XSTART AND CORD", x_start, cord)
+    # assert (x_start < cord)
+    # assert (x_start + size <= max_end)
+    # assert (x_start + size > cord)
+    return (x_start, int(x_start + size))
+
+
+def setup_logger(path):
+    import logging
+    logger = logging.getLogger('iCARL')
+    logger.setLevel(logging.DEBUG)
+
+    fh = logging.FileHandler(path + ".log")
+    fh.setLevel(logging.DEBUG)
+
+    fh2 = logging.FileHandler("../temp.log")
+    fh2.setLevel(logging.DEBUG)
+
+    ch = logging.StreamHandler()
+    ch.setLevel(logging.DEBUG)
+
+    formatter = logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s')
+    fh.setFormatter(formatter)
+    fh2.setFormatter(formatter)
+
+    logger.addHandler(fh)
+    logger.addHandler(fh2)
+    logger.addHandler(ch)
+    return logger
+
+
+def sort_gt(gt):
+    '''
+    Sort the ground-truth labels so that TL is the corner with the smallest distance from the origin
+    :param gt: array of four (x, y) corner points
+    :return: sorted gt as (tl, tr, br, bl)
+    '''
+    myGtTemp = gt * gt
+    sum_array = myGtTemp.sum(axis=1)
+    tl_index = np.argmin(sum_array)
+    tl = gt[tl_index]
+    tr = gt[(tl_index + 1) % 4]
+    br = gt[(tl_index + 2) % 4]
+    bl = gt[(tl_index + 3) % 4]
+
+    return np.asarray((tl, tr, br, bl))

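Note: a worked example for sort_gt: the corner with the smallest squared distance from the origin becomes TL, and the remaining corners follow in the stored cyclic order (so the input is assumed to list the quadrilateral in order):

    import numpy as np

    gt = np.array([[500, 40], [520, 700], [30, 710], [25, 35]])
    print(sort_gt(gt))
    # [[ 25  35]
    #  [500  40]
    #  [520 700]
    #  [ 30 710]]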
+ 40 - 0
Dewarp/video_to_images.py

@@ -0,0 +1,40 @@
+import argparse
+import os
+import uuid
+import datetime
+import cv2
+from tqdm import tqdm
+
+
+def work(video_folder, output_folder, interval):
+    if not os.path.exists(output_folder):
+        os.makedirs(output_folder)
+    video_list = os.listdir(video_folder)
+    num = 1
+    cnt = 1
+    for video in tqdm(video_list):
+        video_path = video_folder + '/' + video
+        vid = cv2.VideoCapture(video_path)
+        time = datetime.datetime.now()
+        t = str(time.year).zfill(4) + '-' + str(time.month).zfill(2) + '-' + str(time.day).zfill(2)
+        while vid.isOpened():
+            is_read, frame = vid.read()
+            if is_read:
+                if num % interval == 0:
+                    file_name = '%04d' % cnt
+                    cv2.imwrite(output_folder + '/' + 'kdan_' + t + '_' + str(file_name) + '_' + str(uuid.uuid1())[0:4] + '.jpg', frame)
+                    # e.g. 00000111.jpg denotes frame 111
+                    cv2.waitKey(1)
+                    cnt += 1
+                num += 1
+            else:
+                break
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser()
+    parser.add_argument('--video_folder', type=str, default='./video/01')
+    parser.add_argument('--output_folder', type=str, default='./video_frame')
+    parser.add_argument('--interval', type=int, default=10, help='frame sampling interval')
+    args = parser.parse_args()
+    work(args.video_folder, args.output_folder, args.interval)

+ 20 - 0
Dewarp/write_json.py

@@ -0,0 +1,20 @@
+import json
+from base64 import b64encode
+
+
+def make_json(img_fold, json_file_path, shapes_list, image_path, image_height, image_width):
+    flags = {}
+    # Read the image as binary to get its raw bytes
+    with open(str(img_fold) + '\\' + image_path, 'rb') as jpg_file:
+        byte_content = jpg_file.read()
+    # Encode the raw bytes as base64
+    base64_bytes = b64encode(byte_content)
+    # Decode the base64 bytes into a utf-8 string
+    base64_string = base64_bytes.decode('utf-8')
+    data = {'version': '5.0.1', 'flags': flags, 'shapes': shapes_list, 'imagePath': image_path, 'imageData': base64_string,
+            'imageHeight': image_height, 'imageWidth': image_width}
+    with open(str(img_fold) + '\\' + json_file_path, 'w') as fp:
+        json.dump(data, fp, sort_keys=False, indent=2)
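Note: a hypothetical call, with labelme-style shape fields assumed and an existing image at the given Windows-style path, would be:

    shapes = [{"label": "corner", "points": [[25.0, 35.0]], "group_id": None,
               "shape_type": "point", "flags": {}}]
    make_json("D:\\data", "img_0001.json", shapes, "img_0001.jpg", 960, 540)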