Commit 1595917: "readme" (author: github, 0 parents)

File tree: 181 files changed, +81052 -0 lines

Errorchcker_config.yml (+108)

@@ -0,0 +1,108 @@
!!python/object/new:easydict.EasyDict
dictitems:
  dataset: &id002 !!python/object/new:easydict.EasyDict
    dictitems:
      id_end: 1
      id_pad: 3
      id_start: 0
      id_unk: 2
      prepared_folder: &id001
      - ./data/errorchecker_dataset/prepared
      vocabulary_file: ./data/errorchecker_dataset/prepared/properties.npy
    state:
      id_end: 1
      id_pad: 3
      id_start: 0
      id_unk: 2
      prepared_folder: *id001
      vocabulary_file: ./data/errorchecker_dataset/prepared/properties.npy
  model: &id003 !!python/object/new:easydict.EasyDict
    dictitems:
      MaxPredictLength: 200
      att_dim: 256
      batch_size: 16
      beam_size: 5
      ckpt_dir: /home/xiaofeng/data/image2latex/ErrorCheck/model_saved/Prenet/ckpt
      ckpt_name: ErrorCheck
      clip_value: 5
      decoding: beams_search
      display_iter: 100
      div_gamma: 1
      div_prob: 0
      droupout: 0.3
      errche_decoder_name: DecoderAtt_errche
      errche_embeding_dims_source: 128
      errche_embeding_dims_target: 128
      errche_encoder_name: Encode_errche
      errche_encoder_type: Prenet
      errche_rnn_decoder_dim: 256
      errche_rnn_encoder_dim: 128
      eval_dir: /home/xiaofeng/data/image2latex/ErrorCheck/model_saved/Prenet/eval
      gpu_fraction: 0.48
      learning_decay_rate: 0.94
      learning_decay_step: 8000
      learning_init: 0.1
      learning_type: exponential
      log_dir: /home/xiaofeng/code/image2katex/log
      log_file_name: ErrorChecker.log
      log_name: ErrorChecker
      metric_val: perplexity
      model_saved: /home/xiaofeng/data/image2latex/ErrorCheck/model_saved/Prenet
      n_epochs: 1000
      optimizer: momentum
      save_iter: 500
      summary_dir: /home/xiaofeng/data/image2latex/ErrorCheck/model_saved/Prenet/summary
      test_batch_size: 1
    state:
      MaxPredictLength: 200
      att_dim: 256
      batch_size: 16
      beam_size: 5
      ckpt_dir: /home/xiaofeng/data/image2latex/ErrorCheck/model_saved/Prenet/ckpt
      ckpt_name: ErrorCheck
      clip_value: 5
      decoding: beams_search
      display_iter: 100
      div_gamma: 1
      div_prob: 0
      droupout: 0.3
      errche_decoder_name: DecoderAtt_errche
      errche_embeding_dims_source: 128
      errche_embeding_dims_target: 128
      errche_encoder_name: Encode_errche
      errche_encoder_type: Prenet
      errche_rnn_decoder_dim: 256
      errche_rnn_encoder_dim: 128
      eval_dir: /home/xiaofeng/data/image2latex/ErrorCheck/model_saved/Prenet/eval
      gpu_fraction: 0.48
      learning_decay_rate: 0.94
      learning_decay_step: 8000
      learning_init: 0.1
      learning_type: exponential
      log_dir: /home/xiaofeng/code/image2katex/log
      log_file_name: ErrorChecker.log
      log_name: ErrorChecker
      metric_val: perplexity
      model_saved: /home/xiaofeng/data/image2latex/ErrorCheck/model_saved/Prenet
      n_epochs: 1000
      optimizer: momentum
      save_iter: 500
      summary_dir: /home/xiaofeng/data/image2latex/ErrorCheck/model_saved/Prenet/summary
      test_batch_size: 1
  predict: &id004 !!python/object/new:easydict.EasyDict
    dictitems:
      npy_path: ./static/npy
      preprocess_dir: ./static/preprocess
      render_path: ./static/render
      temp_path: ./static
      web_path: ./templates
    state:
      npy_path: ./static/npy
      preprocess_dir: ./static/preprocess
      render_path: ./static/render
      temp_path: ./static
      web_path: ./templates
state:
  dataset: *id002
  model: *id003
  predict: *id004
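
This file is a PyYAML dump of an `easydict.EasyDict` object (note the `!!python/object/new:easydict.EasyDict` tags and the `&id...`/`*id...` anchors), so a plain `yaml.safe_load` will refuse to parse it. Below is a minimal loading sketch, assuming PyYAML >= 5.1 and `easydict` are installed; how the repository itself loads the config is not shown in this commit.

```python
# Hypothetical loader sketch; the repository may construct its config differently.
import yaml  # PyYAML >= 5.1 provides yaml.unsafe_load

CONFIG_PATH = "Errorchcker_config.yml"  # path taken from this commit's file tree

with open(CONFIG_PATH, "r", encoding="utf-8") as f:
    # unsafe_load is needed because the python/object/new tags reconstruct
    # easydict.EasyDict instances; only use it on config files you trust.
    cfg = yaml.unsafe_load(f)

# The dumped "state" restores attribute-style access on the EasyDict objects.
print(cfg.model.batch_size)  # 16
print(cfg.dataset.id_unk)    # 2
```

The same approach applies to `Im2Katex_config.yml` below.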

Im2Katex_config.yml (+115)

@@ -0,0 +1,115 @@
!!python/object/new:easydict.EasyDict
dictitems:
  dataset: &id003 !!python/object/new:easydict.EasyDict
    dictitems:
      id_end: 1
      id_pad: 3
      id_start: 0
      id_unk: 2
      image_folder: &id001
      - /home/xiaofeng/data/image2latex/handwritten/process/img_padding
      - /home/xiaofeng/data/image2latex/original/process/img_padding
      prepared_folder: &id002
      - ./data/im2latex_dataset/merged/prepared/handwritten/
      - ./data/im2latex_dataset/merged/prepared/original/
      vocabulary_file: ./data/im2latex_dataset/merged/prepared/handwritten/properties.npy
    state:
      id_end: 1
      id_pad: 3
      id_start: 0
      id_unk: 2
      image_folder: *id001
      prepared_folder: *id002
      vocabulary_file: ./data/im2latex_dataset/merged/prepared/handwritten/properties.npy
  model: &id004 !!python/object/new:easydict.EasyDict
    dictitems:
      MaxPredictLength: 200
      att_dim: 512
      batch_size: 16
      beam_size: 5
      ckpt_dir: /home/xiaofeng/data/image2latex/merged/model_saved/conv/ckpt
      ckpt_name: seq2seqAtt
      clip_value: 5
      decoder_name: DecoderAtt
      decoding: beams_search
      display_iter: 100
      div_gamma: 1
      div_prob: 0
      droupout: 0.3
      embeding_dims: 80
      encoder_cnn: vanilla
      encoder_name: Encode
      encoder_type: conv
      eval_dir: /home/xiaofeng/data/image2latex/merged/model_saved/conv/eval
      gpu_fraction: 0.48
      learning_decay_rate: 0.94
      learning_decay_step: 8000
      learning_init: 0.1
      learning_type: exponential
      log_dir: /home/xiaofeng/code/image2katex/log
      log_file_name: Im2Katex.log
      log_name: Im2Katex
      metric_val: perplexity
      model_saved: /home/xiaofeng/data/image2latex/merged/model_saved/conv
      n_epochs: 1000
      optimizer: momentum
      positional_embeddings: true
      rnn_decoder_dim: 512
      rnn_encoder_dim: 256
      save_iter: 500
      summary_dir: /home/xiaofeng/data/image2latex/merged/model_saved/conv/summary
      test_batch_size: 1
    state:
      MaxPredictLength: 200
      att_dim: 512
      batch_size: 16
      beam_size: 5
      ckpt_dir: /home/xiaofeng/data/image2latex/merged/model_saved/conv/ckpt
      ckpt_name: seq2seqAtt
      clip_value: 5
      decoder_name: DecoderAtt
      decoding: beams_search
      display_iter: 100
      div_gamma: 1
      div_prob: 0
      droupout: 0.3
      embeding_dims: 80
      encoder_cnn: vanilla
      encoder_name: Encode
      encoder_type: conv
      eval_dir: /home/xiaofeng/data/image2latex/merged/model_saved/conv/eval
      gpu_fraction: 0.48
      learning_decay_rate: 0.94
      learning_decay_step: 8000
      learning_init: 0.1
      learning_type: exponential
      log_dir: /home/xiaofeng/code/image2katex/log
      log_file_name: Im2Katex.log
      log_name: Im2Katex
      metric_val: perplexity
      model_saved: /home/xiaofeng/data/image2latex/merged/model_saved/conv
      n_epochs: 1000
      optimizer: momentum
      positional_embeddings: true
      rnn_decoder_dim: 512
      rnn_encoder_dim: 256
      save_iter: 500
      summary_dir: /home/xiaofeng/data/image2latex/merged/model_saved/conv/summary
      test_batch_size: 1
  predict: &id005 !!python/object/new:easydict.EasyDict
    dictitems:
      npy_path: ./static/npy
      preprocess_dir: ./static/preprocess
      render_path: ./static/render
      temp_path: ./static
      web_path: ./templates
    state:
      npy_path: ./static/npy
      preprocess_dir: ./static/preprocess
      render_path: ./static/render
      temp_path: ./static
      web_path: ./templates
state:
  dataset: *id003
  model: *id004
  predict: *id005
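
The `dataset` section of both configs defines special token ids (`id_start: 0`, `id_end: 1`, `id_unk: 2`, `id_pad: 3`). The code that applies them is not part of this commit excerpt, so the sketch below is only an assumed illustration of how such ids are typically used to encode and pad a LaTeX token sequence.

```python
# Illustrative only: the repository's own encoding utilities are not shown here.
import numpy as np

ID_START, ID_END, ID_UNK, ID_PAD = 0, 1, 2, 3  # values from the dataset sections above

def encode_formula(tokens, vocab, max_len):
    """Map LaTeX tokens to ids, add start/end markers, and pad to max_len."""
    ids = [ID_START] + [vocab.get(t, ID_UNK) for t in tokens] + [ID_END]
    ids = ids[:max_len]
    return np.array(ids + [ID_PAD] * (max_len - len(ids)), dtype=np.int32)

toy_vocab = {"x": 5, "^": 6, "{": 7, "}": 8, "2": 9}  # hypothetical vocabulary
print(encode_formula(["x", "^", "{", "2", "}"], toy_vocab, max_len=10))
# -> [0 5 6 7 9 8 1 3 3 3]
```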

LICENSE (+21)

@@ -0,0 +1,21 @@
MIT License

Copyright (c) 2019 xiaofeng

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.

README_en.md (+120)

@@ -0,0 +1,120 @@
# Convert Img To Katex

## Abstract

**Implement an attention model that takes an image of a PDF math formula and outputs the characters of the LaTeX source that generates the formula.**

This is a TensorFlow implementation of the HarvardNLP paper "What You Get Is What You See: A Visual Markup Decompiler". The model architecture is shown below:

<p align="center"><img src="http://lstm.seas.harvard.edu/latex/network.png" width="300"></p>

An example input is a rendered LaTeX formula:

<p align="center"><img src="http://lstm.seas.harvard.edu/latex/results/website/images/119b93a445-orig.png"></p>

The goal is to infer the LaTeX formula that can render such an image:

```
d s _ { 1 1 } ^ { 2 } = d x ^ { + } d x ^ { - } + l _ { p } ^ { 9 } \frac { p _ { - } } { r ^ { 7 } } \delta ( x ^ { - } ) d x ^ { - } d x ^ { - } + d x _ { 1 } ^ { 2 } + \; \cdots \; + d x _ { 9 } ^ { 2 }
```

## Prerequisites

Most of the code is written in TensorFlow, with Python for preprocessing.

#### Preprocess

The preprocessing for this dataset exactly reproduces the original Torch implementation by the HarvardNLP group.

Python packages:

- Pillow
- numpy

Optional: Node.js and KaTeX are used for preprocessing. [Installation](https://nodejs.org/en/)

##### pdflatex [Installation](https://www.tug.org/texlive/)

pdflatex is used for rendering LaTeX during evaluation.

##### ImageMagick convert [Installation](http://www.imagemagick.org/script/index.php)

`convert` is used for rendering LaTeX during evaluation.

- Linux: `sudo apt install imagemagick`
- Linux build from source: https://imagemagick.org/script/install-source.php
- macOS: `brew install imagemagick`

##### Webkit2png [Installation](http://www.paulhammond.org/webkit2png/)

Webkit2png is used for rendering HTML during evaluation.
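
Taken together, the evaluation render step looks roughly like the following sketch. It is only an illustration under assumptions (a `standalone`/`preview` LaTeX template, default ImageMagick flags); the repository's own evaluation scripts may use different templates and options.

```python
# Rough illustration of "render LaTeX, then rasterize it" for evaluation.
# Template, flags, and paths are assumptions, not the repository's actual code.
import pathlib
import subprocess
import tempfile

LATEX_TEMPLATE = r"""\documentclass[preview]{standalone}
\begin{document}
$ %s $
\end{document}
"""

def render_formula(latex: str, out_png: str) -> None:
    with tempfile.TemporaryDirectory() as tmp:
        tex = pathlib.Path(tmp, "formula.tex")
        tex.write_text(LATEX_TEMPLATE % latex)
        # pdflatex renders the formula to formula.pdf inside the temp dir.
        subprocess.run(["pdflatex", "-interaction=nonstopmode",
                        "-output-directory", tmp, str(tex)], check=True)
        # ImageMagick's convert rasterizes the PDF to a PNG for comparison.
        subprocess.run(["convert", "-density", "200",
                        str(pathlib.Path(tmp, "formula.pdf")), out_png], check=True)

render_formula(r"\frac{p_-}{r^7}", "formula.png")
```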
## Make the dataset with your own data

The dataset-building code lives in the `data` directory:

```
cd data
```

For more details, see the readme.md in that folder.
Once the dataset is ready, save it in **npy** format: `train_buckets.npy`, `valid_buckets.npy`, and `test_buckets.npy` can be generated with the **build_imglatex_data.py** script.
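
Reading the prepared files back might look like the sketch below. It assumes the `.npy` files store pickled Python objects (the exact layout is defined by `build_imglatex_data.py` and is not shown in this commit), so treat it as a starting point for inspection rather than the repository's actual loader.

```python
# Assumption: the prepared .npy files contain pickled Python objects,
# so allow_pickle=True is required; inspect the results to see the real layout.
import numpy as np

train_buckets = np.load("train_buckets.npy", allow_pickle=True)
vocab_props = np.load(
    "./data/im2latex_dataset/merged/prepared/handwritten/properties.npy",
    allow_pickle=True)  # vocabulary file referenced by the configs above

print(type(train_buckets), getattr(train_buckets, "shape", None))
print(type(vocab_props))
```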
## Train

```
python3 train_model.py
```

Default hyperparameters used (collected in the sketch below):

* BATCH_SIZE = 32
* EMB_DIM = 80
* ENC_DIM = 256
* DEC_DIM = ENC_DIM * 2
* D = 512 (**channels in feature grid**)
* V = len(vocab) + 3 = (vocab size) + 3
* NB_EPOCHS = 50
* H = 20 (maximum height of feature grid)
* W = 50 (maximum width of feature grid)
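
A compact restatement of those defaults as Python, with the derived values computed. The names are illustrative, and `train_model.py` actually takes its settings from the YAML configs earlier in this commit.

```python
# Illustrative only: collects the defaults listed above into one place.
def default_hparams(vocab_size: int) -> dict:
    enc_dim = 256
    return {
        "batch_size": 32,
        "emb_dim": 80,
        "enc_dim": enc_dim,
        "dec_dim": enc_dim * 2,        # DEC_DIM = ENC_DIM * 2
        "channels": 512,               # D: channels in the CNN feature grid
        "vocab_size": vocab_size + 3,  # V = len(vocab) + 3
        "n_epochs": 50,
        "max_grid_h": 20,              # H: maximum height of the feature grid
        "max_grid_w": 50,              # W: maximum width of the feature grid
    }

print(default_hparams(vocab_size=500)["dec_dim"])  # 512
```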
The train NLL drops to 0.08 after 18 epochs of training on a 24 GB Nvidia M40 GPU.
## Test

```
python3 predict_to_img.py
```

## Evaluate

`attention.py` scores the training and validation sets after each epoch (reporting the mean train NLL and perplexity).
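
Perplexity here is presumably the exponential of the mean token-level negative log-likelihood, the usual definition for sequence models (the exact reduction used in `attention.py` is not shown in this commit):

$$\mathrm{perplexity} = \exp\left(\frac{1}{N}\sum_{i=1}^{N} \mathrm{NLL}_i\right)$$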
#### Scores from this implementation

![results_1](results_1.png)
![results_2](results_2.png)

## Dataset

- Printed style: https://zenodo.org/record/56198#.XA4GjfYzZZj
- Handwritten: http://lstm.seas.harvard.edu/latex/data/

## Weight files

[Google Drive](https://drive.google.com/drive/folders/0BwbIUfIM1M8sc0tEMGk1NGlKZTA?usp=sharing)

## Details of this package

- `backup_predict_to_img.py`: test script for the network structure from the original repository

## Reference

* **OpenAI's Requests for Research problem**: [OpenAI question source](https://openai.com/requests-for-research/#im2)
* [Official resolution](http://lstm.seas.harvard.edu/latex/)
* [Official repo (Torch)](https://github.com/harvardnlp/im2markup)
* [Source paper](https://arxiv.org/pdf/1609.04938v1.pdf)
* [Seq2Seq for LaTeX generation](https://guillaumegenthial.github.io/image-to-latex.html)
* [Original model repo (TensorFlow)](https://github.com/ritheshkumar95/im2latex-tensorflow)
* [Another model repo (TensorFlow)](https://github.com/baoblackcoal/RFR-solution)
* [Zhihu explanation (Chinese)](https://zhuanlan.zhihu.com/p/25031185)
* [Original dataset repo (dataset construction)](https://github.com/Miffyli/im2latex-dataset)
